From a4e38e154da99a6af960ddbec5443c09be3f391b Mon Sep 17 00:00:00 2001 From: Even Zhou Date: Mon, 23 Feb 2026 16:58:30 +0800 Subject: [PATCH 1/7] bump sgl-kernel-npu to 2026.02.01.post2 --- .github/workflows/release-docker-npu.yml | 2 +- scripts/ci/npu/npu_ci_install_dependency.sh | 4 ++-- 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/.github/workflows/release-docker-npu.yml b/.github/workflows/release-docker-npu.yml index 12f96094925d..77a7bfe2c269 100644 --- a/.github/workflows/release-docker-npu.yml +++ b/.github/workflows/release-docker-npu.yml @@ -87,7 +87,7 @@ jobs: push: ${{ github.repository == 'sgl-project/sglang' && github.event_name != 'pull_request' }} provenance: false build-args: | - SGLANG_KERNEL_NPU_TAG=2026.01.28 + SGLANG_KERNEL_NPU_TAG=2026.02.01.post2 CANN_VERSION=${{ matrix.cann_version }} DEVICE_TYPE=${{ matrix.device_type }} SGLANG_TAG=${{ steps.version.outputs.version }} diff --git a/scripts/ci/npu/npu_ci_install_dependency.sh b/scripts/ci/npu/npu_ci_install_dependency.sh index a138e4aa15a8..fefba577a993 100755 --- a/scripts/ci/npu/npu_ci_install_dependency.sh +++ b/scripts/ci/npu/npu_ci_install_dependency.sh @@ -44,9 +44,9 @@ ${PIP_INSTALL} triton-ascend ### Install sgl-kernel-npu -SGLANG_KERNEL_NPU_TAG="2026.01.21" +SGLANG_KERNEL_NPU_TAG="2026.02.01.post2" mkdir sgl-kernel-npu -(cd sgl-kernel-npu && wget https://github.com/sgl-project/sgl-kernel-npu/releases/download/${SGLANG_KERNEL_NPU_TAG}/sgl-kernel-npu_${SGLANG_KERNEL_NPU_TAG}_8.5.0_${DEVICE_TYPE}.zip \ +(cd sgl-kernel-npu && wget https://github.com/sgl-project/sgl-kernel-npu/releases/download/${SGLANG_KERNEL_NPU_TAG}/sgl-kernel-npu-${SGLANG_KERNEL_NPU_TAG}-torch2.8.0-py311-cann${CANN_VERSION}-${DEVICE_TYPE}-$(arch).zip \ && unzip sgl-kernel-npu_${SGLANG_KERNEL_NPU_TAG}_8.5.0_${DEVICE_TYPE}.zip \ && ${PIP_INSTALL} output/deep_ep*.whl output/sgl_kernel_npu*.whl \ && (cd "$(python3 -m pip show deep-ep | grep -E '^Location:' | awk '{print $2}')" && ln -s deep_ep/deep_ep_cpp*.so)) From dbf7f4a531ebdb312448bcba19e64608f02049a7 Mon Sep 17 00:00:00 2001 From: Even Zhou Date: Mon, 23 Feb 2026 17:06:03 +0800 Subject: [PATCH 2/7] check changes correct when building docker images --- .github/workflows/release-docker-npu-nightly.yml | 5 +++++ .github/workflows/release-docker-npu.yml | 5 +++++ 2 files changed, 10 insertions(+) diff --git a/.github/workflows/release-docker-npu-nightly.yml b/.github/workflows/release-docker-npu-nightly.yml index b5e565119332..7c2b4e55fdcb 100644 --- a/.github/workflows/release-docker-npu-nightly.yml +++ b/.github/workflows/release-docker-npu-nightly.yml @@ -1,5 +1,10 @@ name: Release Docker Images Nightly (NPU) on: + pull_request: + branches: + - 'main' + paths: + - 'docker/npu.Dockerfile' workflow_dispatch: schedule: - cron: "0 0 * * *" diff --git a/.github/workflows/release-docker-npu.yml b/.github/workflows/release-docker-npu.yml index 77a7bfe2c269..f800fb327a69 100644 --- a/.github/workflows/release-docker-npu.yml +++ b/.github/workflows/release-docker-npu.yml @@ -3,6 +3,11 @@ on: push: tags: - 'v[0-9]+.*' + pull_request: + branches: + - 'main' + paths: + - 'docker/npu.Dockerfile' workflow_dispatch: inputs: version: From 16b15532ee5d25b341798cedf6482a647ec51581 Mon Sep 17 00:00:00 2001 From: Even Zhou Date: Mon, 23 Feb 2026 17:09:15 +0800 Subject: [PATCH 3/7] add missing trigger file --- .github/workflows/release-docker-npu-nightly.yml | 1 + .github/workflows/release-docker-npu.yml | 1 + 2 files changed, 2 insertions(+) diff --git a/.github/workflows/release-docker-npu-nightly.yml b/.github/workflows/release-docker-npu-nightly.yml index 7c2b4e55fdcb..fe49016a651b 100644 --- a/.github/workflows/release-docker-npu-nightly.yml +++ b/.github/workflows/release-docker-npu-nightly.yml @@ -4,6 +4,7 @@ on: branches: - 'main' paths: + - '.github/workflows/release-docker-npu-nightly.yml' - 'docker/npu.Dockerfile' workflow_dispatch: schedule: diff --git a/.github/workflows/release-docker-npu.yml b/.github/workflows/release-docker-npu.yml index f800fb327a69..64bf2c5a635e 100644 --- a/.github/workflows/release-docker-npu.yml +++ b/.github/workflows/release-docker-npu.yml @@ -7,6 +7,7 @@ on: branches: - 'main' paths: + - '.github/workflows/release-docker-npu.yml' - 'docker/npu.Dockerfile' workflow_dispatch: inputs: From 83b537cf6f51afe06202cd2b0b0e47d99c190557 Mon Sep 17 00:00:00 2001 From: Even Zhou Date: Mon, 23 Feb 2026 17:16:21 +0800 Subject: [PATCH 4/7] fix build with pull-requests --- .github/workflows/release-docker-npu.yml | 2 ++ 1 file changed, 2 insertions(+) diff --git a/.github/workflows/release-docker-npu.yml b/.github/workflows/release-docker-npu.yml index 64bf2c5a635e..97cbd131692d 100644 --- a/.github/workflows/release-docker-npu.yml +++ b/.github/workflows/release-docker-npu.yml @@ -58,6 +58,8 @@ jobs: run: | if [ "${{ github.event_name }}" = "workflow_dispatch" ]; then VERSION="${{ github.event.inputs.version }}" + elif [ "${{ github.event_name }}" = "pull_request" ]; then + VERSION="${DOCKER_METADATA_OUTPUT_VERSION}" else # Extract version from tag (e.g., v0.5.7 -> 0.5.7) VERSION="${GITHUB_REF_NAME#v}" From 322d582deb157024e834cad4b66cacb8a006c7ef Mon Sep 17 00:00:00 2001 From: Even Zhou Date: Mon, 23 Feb 2026 17:18:46 +0800 Subject: [PATCH 5/7] fix ci install dependency --- scripts/ci/npu/npu_ci_install_dependency.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/scripts/ci/npu/npu_ci_install_dependency.sh b/scripts/ci/npu/npu_ci_install_dependency.sh index fefba577a993..fdcf8a16b8e3 100755 --- a/scripts/ci/npu/npu_ci_install_dependency.sh +++ b/scripts/ci/npu/npu_ci_install_dependency.sh @@ -46,7 +46,7 @@ ${PIP_INSTALL} triton-ascend ### Install sgl-kernel-npu SGLANG_KERNEL_NPU_TAG="2026.02.01.post2" mkdir sgl-kernel-npu -(cd sgl-kernel-npu && wget https://github.com/sgl-project/sgl-kernel-npu/releases/download/${SGLANG_KERNEL_NPU_TAG}/sgl-kernel-npu-${SGLANG_KERNEL_NPU_TAG}-torch2.8.0-py311-cann${CANN_VERSION}-${DEVICE_TYPE}-$(arch).zip \ +(cd sgl-kernel-npu && wget https://github.com/sgl-project/sgl-kernel-npu/releases/download/${SGLANG_KERNEL_NPU_TAG}/sgl-kernel-npu-${SGLANG_KERNEL_NPU_TAG}-torch2.8.0-py311-cann8.5.0-${DEVICE_TYPE}-$(arch).zip \ && unzip sgl-kernel-npu_${SGLANG_KERNEL_NPU_TAG}_8.5.0_${DEVICE_TYPE}.zip \ && ${PIP_INSTALL} output/deep_ep*.whl output/sgl_kernel_npu*.whl \ && (cd "$(python3 -m pip show deep-ep | grep -E '^Location:' | awk '{print $2}')" && ln -s deep_ep/deep_ep_cpp*.so)) From f2306c5712adb76183a8ff09e44ee1ddb9aa406a Mon Sep 17 00:00:00 2001 From: Even Zhou Date: Mon, 23 Feb 2026 17:21:58 +0800 Subject: [PATCH 6/7] make version format checking happy --- .github/workflows/release-docker-npu.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/release-docker-npu.yml b/.github/workflows/release-docker-npu.yml index 97cbd131692d..a9b678861513 100644 --- a/.github/workflows/release-docker-npu.yml +++ b/.github/workflows/release-docker-npu.yml @@ -59,7 +59,7 @@ jobs: if [ "${{ github.event_name }}" = "workflow_dispatch" ]; then VERSION="${{ github.event.inputs.version }}" elif [ "${{ github.event_name }}" = "pull_request" ]; then - VERSION="${DOCKER_METADATA_OUTPUT_VERSION}" + VERSION="0.0.0" else # Extract version from tag (e.g., v0.5.7 -> 0.5.7) VERSION="${GITHUB_REF_NAME#v}" From 706e61b5ced7da97b544ac2c0b866af15d8ff189 Mon Sep 17 00:00:00 2001 From: Even Zhou Date: Mon, 23 Feb 2026 17:39:06 +0800 Subject: [PATCH 7/7] fix ci install dependency --- .github/workflows/release-docker-npu.yml | 8 -------- scripts/ci/npu/npu_ci_install_dependency.sh | 4 ++-- 2 files changed, 2 insertions(+), 10 deletions(-) diff --git a/.github/workflows/release-docker-npu.yml b/.github/workflows/release-docker-npu.yml index a9b678861513..77a7bfe2c269 100644 --- a/.github/workflows/release-docker-npu.yml +++ b/.github/workflows/release-docker-npu.yml @@ -3,12 +3,6 @@ on: push: tags: - 'v[0-9]+.*' - pull_request: - branches: - - 'main' - paths: - - '.github/workflows/release-docker-npu.yml' - - 'docker/npu.Dockerfile' workflow_dispatch: inputs: version: @@ -58,8 +52,6 @@ jobs: run: | if [ "${{ github.event_name }}" = "workflow_dispatch" ]; then VERSION="${{ github.event.inputs.version }}" - elif [ "${{ github.event_name }}" = "pull_request" ]; then - VERSION="0.0.0" else # Extract version from tag (e.g., v0.5.7 -> 0.5.7) VERSION="${GITHUB_REF_NAME#v}" diff --git a/scripts/ci/npu/npu_ci_install_dependency.sh b/scripts/ci/npu/npu_ci_install_dependency.sh index fdcf8a16b8e3..486a908b1714 100755 --- a/scripts/ci/npu/npu_ci_install_dependency.sh +++ b/scripts/ci/npu/npu_ci_install_dependency.sh @@ -47,8 +47,8 @@ ${PIP_INSTALL} triton-ascend SGLANG_KERNEL_NPU_TAG="2026.02.01.post2" mkdir sgl-kernel-npu (cd sgl-kernel-npu && wget https://github.com/sgl-project/sgl-kernel-npu/releases/download/${SGLANG_KERNEL_NPU_TAG}/sgl-kernel-npu-${SGLANG_KERNEL_NPU_TAG}-torch2.8.0-py311-cann8.5.0-${DEVICE_TYPE}-$(arch).zip \ -&& unzip sgl-kernel-npu_${SGLANG_KERNEL_NPU_TAG}_8.5.0_${DEVICE_TYPE}.zip \ -&& ${PIP_INSTALL} output/deep_ep*.whl output/sgl_kernel_npu*.whl \ +&& unzip ./sgl-kernel-npu-${SGLANG_KERNEL_NPU_TAG}-torch2.8.0-py311-cann8.5.0-${DEVICE_TYPE}-$(arch).zip \ +&& ${PIP_INSTALL} ./deep_ep*.whl ./sgl_kernel_npu*.whl \ && (cd "$(python3 -m pip show deep-ep | grep -E '^Location:' | awk '{print $2}')" && ln -s deep_ep/deep_ep_cpp*.so))