From e93fc0305949cf9977e2060a34b79f78bdacfe64 Mon Sep 17 00:00:00 2001 From: hfadzxy Date: Thu, 5 Feb 2026 14:50:37 +0800 Subject: [PATCH] [CI] Change A2 runner Signed-off-by: hfadzxy --- .../_e2e_nightly_single_node_models.yaml | 2 +- .github/workflows/labled_doctest.yaml | 2 +- .github/workflows/labled_download_model.yaml | 2 +- .github/workflows/pr_test_full.yaml | 4 ++-- .github/workflows/pr_test_light.yaml | 4 ++-- .../workflows/schedule_nightly_test_a2.yaml | 20 +++++++++---------- .../workflows/schedule_test_vllm_main.yaml | 2 +- .../e2e/models/configs/InternVL3_5-8B-hf.yaml | 1 - .../single_node/models/test_qwen3_32b_int8.py | 4 ++-- .../single_node/models/test_qwen3_next.py | 4 ++-- 10 files changed, 22 insertions(+), 23 deletions(-) diff --git a/.github/workflows/_e2e_nightly_single_node_models.yaml b/.github/workflows/_e2e_nightly_single_node_models.yaml index 0064d2e8780..82b8e28f778 100644 --- a/.github/workflows/_e2e_nightly_single_node_models.yaml +++ b/.github/workflows/_e2e_nightly_single_node_models.yaml @@ -108,7 +108,7 @@ jobs: pip install -v -e . - name: Install tensorflow (for Molmo-7B-D-0924) - if: ${{ inputs.runner == 'linux-aarch64-a2-1' && contains(inputs.model_list, 'Molmo-7B-D-0924') }} + if: ${{ inputs.runner == 'linux-aarch64-a2b3-1' && contains(inputs.model_list, 'Molmo-7B-D-0924') }} shell: bash -l {0} run: | pip install tensorflow==2.19.1 --no-cache-dir diff --git a/.github/workflows/labled_doctest.yaml b/.github/workflows/labled_doctest.yaml index fc822559198..cdfed7eaed7 100644 --- a/.github/workflows/labled_doctest.yaml +++ b/.github/workflows/labled_doctest.yaml @@ -46,7 +46,7 @@ jobs: matrix: vllm_verison: [releases-v0.13.0, releases-v0.13.0-openeuler, main, main-openeuler] name: vLLM Ascend test - runs-on: linux-aarch64-a2-1 + runs-on: linux-aarch64-a2b3-1 container: image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/vllm-ascend:${{ matrix.vllm_verison }} steps: diff --git a/.github/workflows/labled_download_model.yaml b/.github/workflows/labled_download_model.yaml index 2a5ccedc7ca..7f50536f3fe 100644 --- a/.github/workflows/labled_download_model.yaml +++ b/.github/workflows/labled_download_model.yaml @@ -19,7 +19,7 @@ jobs: download-models: if: contains(github.event.pull_request.labels.*.name, 'model-download') name: Download models from ModelScope - runs-on: linux-aarch64-a2-0 + runs-on: linux-aarch64-a2b3-0 container: image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/vllm-ascend:nightly-cpu diff --git a/.github/workflows/pr_test_full.yaml b/.github/workflows/pr_test_full.yaml index 99817ed1627..1a5a9246061 100644 --- a/.github/workflows/pr_test_full.yaml +++ b/.github/workflows/pr_test_full.yaml @@ -39,7 +39,7 @@ concurrency: jobs: changes: - runs-on: linux-aarch64-a2-0 + runs-on: linux-aarch64-a2b3-0 if: ${{ contains(github.event.pull_request.labels.*.name, 'ready') && contains(github.event.pull_request.labels.*.name, 'ready-for-test') }} outputs: e2e_tracker: ${{ steps.filter.outputs.e2e_tracker }} @@ -81,7 +81,7 @@ jobs: uses: ./.github/workflows/_e2e_test.yaml with: vllm: ${{ matrix.vllm_version }} - runner: linux-aarch64-a2 + runner: linux-aarch64-a2b3 image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.5.0-910b-ubuntu22.04-py3.11 contains_310: false type: full diff --git a/.github/workflows/pr_test_light.yaml b/.github/workflows/pr_test_light.yaml index 7a5eb5b9dfe..7fb8a43a2cb 100644 --- a/.github/workflows/pr_test_light.yaml +++ b/.github/workflows/pr_test_light.yaml @@ -43,7 +43,7 @@ jobs: with: vllm: v0.15.0 changes: - runs-on: linux-aarch64-a2-0 + runs-on: linux-aarch64-a2b3-0 outputs: e2e_tracker: ${{ steps.filter.outputs.e2e_tracker }} ut_tracker: ${{ steps.filter.outputs.ut_tracker }} @@ -107,7 +107,7 @@ jobs: uses: ./.github/workflows/_e2e_test.yaml with: vllm: ${{ matrix.vllm_version }} - runner: linux-aarch64-a2 + runner: linux-aarch64-a2b3 image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.5.0-910b-ubuntu22.04-py3.11 contains_310: ${{ needs.changes.outputs._310_tracker == 'true' }} type: light diff --git a/.github/workflows/schedule_nightly_test_a2.yaml b/.github/workflows/schedule_nightly_test_a2.yaml index c24e60603c9..6bca7a904ed 100644 --- a/.github/workflows/schedule_nightly_test_a2.yaml +++ b/.github/workflows/schedule_nightly_test_a2.yaml @@ -50,19 +50,19 @@ jobs: matrix: test_config: - name: qwen3-next - os: linux-aarch64-a2-4 + os: linux-aarch64-a2b3-4 tests: tests/e2e/nightly/single_node/models/test_qwen3_next.py - name: qwen3-32b - os: linux-aarch64-a2-4 + os: linux-aarch64-a2b3-4 tests: tests/e2e/nightly/single_node/models/test_qwen3_32b.py - name: qwen3-32b-in8-a2 - os: linux-aarch64-a2-4 + os: linux-aarch64-a2b3-4 tests: tests/e2e/nightly/single_node/models/test_qwen3_32b_int8.py - name: test_custom_op - os: linux-aarch64-a2-1 + os: linux-aarch64-a2b3-1 tests: tests/e2e/nightly/single_node/ops/singlecard_ops - name: test_custom_op_multi_card - os: linux-aarch64-a2-4 + os: linux-aarch64-a2b3-4 tests: tests/e2e/nightly/single_node/ops/multicard_ops_a2/ uses: ./.github/workflows/_e2e_nightly_single_node.yaml with: @@ -108,26 +108,26 @@ jobs: fail-fast: false matrix: test_config: - - os: linux-aarch64-a2-1 + - os: linux-aarch64-a2b3-1 model_list: - Qwen3-8B - Qwen2-Audio-7B-Instruct - Qwen3-8B-W8A8 - Qwen3-VL-8B-Instruct - Qwen2.5-Omni-7B - - os: linux-aarch64-a2-1 + - os: linux-aarch64-a2b3-1 model_list: - ERNIE-4.5-21B-A3B-PT - InternVL3_5-8B-hf - Molmo-7B-D-0924 - Llama-3.2-3B-Instruct - llava-onevision-qwen2-0.5b-ov-hf - - os: linux-aarch64-a2-2 + - os: linux-aarch64-a2b3-2 model_list: - Qwen3-30B-A3B - Qwen3-VL-30B-A3B-Instruct - Qwen3-30B-A3B-W8A8 - - os: linux-aarch64-a2-4 + - os: linux-aarch64-a2b3-4 model_list: - Qwen3-Next-80B-A3B-Instruct - Qwen3-Omni-30B-A3B-Instruct @@ -147,7 +147,7 @@ jobs: fail-fast: false matrix: vllm_verison: [releases-v0.13.0, releases-v0.13.0-openeuler, main, main-openeuler] - runs-on: linux-aarch64-a2-1 + runs-on: linux-aarch64-a2b3-1 container: image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/vllm-ascend:${{ matrix.vllm_verison }} steps: diff --git a/.github/workflows/schedule_test_vllm_main.yaml b/.github/workflows/schedule_test_vllm_main.yaml index 3a73af74c0e..6e736a4eb20 100644 --- a/.github/workflows/schedule_test_vllm_main.yaml +++ b/.github/workflows/schedule_test_vllm_main.yaml @@ -34,7 +34,7 @@ jobs: uses: ./.github/workflows/_e2e_test.yaml with: vllm: main - runner: linux-aarch64-a2 + runner: linux-aarch64-a2b3 image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.5.0-910b-ubuntu22.04-py3.11 contains_310: false type: full diff --git a/tests/e2e/models/configs/InternVL3_5-8B-hf.yaml b/tests/e2e/models/configs/InternVL3_5-8B-hf.yaml index 3628785adbb..6aae094b4a7 100644 --- a/tests/e2e/models/configs/InternVL3_5-8B-hf.yaml +++ b/tests/e2e/models/configs/InternVL3_5-8B-hf.yaml @@ -1,5 +1,4 @@ model_name: "OpenGVLab/InternVL3_5-8B-hf" -runner: "linux-aarch64-a2-1" hardware: "Atlas A2 Series" model: "vllm-vlm" tasks: diff --git a/tests/e2e/nightly/single_node/models/test_qwen3_32b_int8.py b/tests/e2e/nightly/single_node/models/test_qwen3_32b_int8.py index a9c7d7a891c..f2507028bc4 100644 --- a/tests/e2e/nightly/single_node/models/test_qwen3_32b_int8.py +++ b/tests/e2e/nightly/single_node/models/test_qwen3_32b_int8.py @@ -45,10 +45,10 @@ } batch_size_dict = { - "linux-aarch64-a2-4": 72, + "linux-aarch64-a2b3-4": 72, "linux-aarch64-a3-4": 76, } -VLLM_CI_RUNNER = os.getenv("VLLM_CI_RUNNER", "linux-aarch64-a2-4") +VLLM_CI_RUNNER = os.getenv("VLLM_CI_RUNNER", "linux-aarch64-a2b3-4") performance_batch_size = batch_size_dict.get(VLLM_CI_RUNNER, 1) aisbench_cases = [{ diff --git a/tests/e2e/nightly/single_node/models/test_qwen3_next.py b/tests/e2e/nightly/single_node/models/test_qwen3_next.py index 7d35c8f4dc1..c05fab6a923 100644 --- a/tests/e2e/nightly/single_node/models/test_qwen3_next.py +++ b/tests/e2e/nightly/single_node/models/test_qwen3_next.py @@ -27,10 +27,10 @@ } batch_size_dict = { - "linux-aarch64-a2-4": 64, + "linux-aarch64-a2b3-4": 64, "linux-aarch64-a3-4": 64, } -VLLM_CI_RUNNER = os.getenv("VLLM_CI_RUNNER", "linux-aarch64-a2-4") +VLLM_CI_RUNNER = os.getenv("VLLM_CI_RUNNER", "linux-aarch64-a2b3-4") performance_batch_size = batch_size_dict.get(VLLM_CI_RUNNER, 1) aisbench_cases = [{