Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion .github/workflows/_e2e_nightly_single_node_models.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -108,7 +108,7 @@ jobs:
pip install -v -e .

- name: Install tensorflow (for Molmo-7B-D-0924)
if: ${{ inputs.runner == 'linux-aarch64-a2-1' && contains(inputs.model_list, 'Molmo-7B-D-0924') }}
if: ${{ inputs.runner == 'linux-aarch64-a2b3-1' && contains(inputs.model_list, 'Molmo-7B-D-0924') }}
shell: bash -l {0}
run: |
pip install tensorflow==2.19.1 --no-cache-dir
Expand Down
2 changes: 1 addition & 1 deletion .github/workflows/labled_doctest.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -46,7 +46,7 @@ jobs:
matrix:
vllm_verison: [releases-v0.13.0, releases-v0.13.0-openeuler, main, main-openeuler]
name: vLLM Ascend test
runs-on: linux-aarch64-a2-1
runs-on: linux-aarch64-a2b3-1
container:
image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/vllm-ascend:${{ matrix.vllm_verison }}
steps:
Expand Down
2 changes: 1 addition & 1 deletion .github/workflows/labled_download_model.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -19,7 +19,7 @@ jobs:
download-models:
if: contains(github.event.pull_request.labels.*.name, 'model-download')
name: Download models from ModelScope
runs-on: linux-aarch64-a2-0
runs-on: linux-aarch64-a2b3-0
container:
image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/vllm-ascend:nightly-cpu

Expand Down
4 changes: 2 additions & 2 deletions .github/workflows/pr_test_full.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -39,7 +39,7 @@ concurrency:

jobs:
changes:
runs-on: linux-aarch64-a2-0
runs-on: linux-aarch64-a2b3-0
if: ${{ contains(github.event.pull_request.labels.*.name, 'ready') && contains(github.event.pull_request.labels.*.name, 'ready-for-test') }}
outputs:
e2e_tracker: ${{ steps.filter.outputs.e2e_tracker }}
Expand Down Expand Up @@ -81,7 +81,7 @@ jobs:
uses: ./.github/workflows/_e2e_test.yaml
with:
vllm: ${{ matrix.vllm_version }}
runner: linux-aarch64-a2
runner: linux-aarch64-a2b3
image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.5.0-910b-ubuntu22.04-py3.11
contains_310: false
type: full
4 changes: 2 additions & 2 deletions .github/workflows/pr_test_light.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -43,7 +43,7 @@ jobs:
with:
vllm: v0.15.0
changes:
runs-on: linux-aarch64-a2-0
runs-on: linux-aarch64-a2b3-0
outputs:
e2e_tracker: ${{ steps.filter.outputs.e2e_tracker }}
ut_tracker: ${{ steps.filter.outputs.ut_tracker }}
Expand Down Expand Up @@ -107,7 +107,7 @@ jobs:
uses: ./.github/workflows/_e2e_test.yaml
with:
vllm: ${{ matrix.vllm_version }}
runner: linux-aarch64-a2
runner: linux-aarch64-a2b3
image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.5.0-910b-ubuntu22.04-py3.11
contains_310: ${{ needs.changes.outputs._310_tracker == 'true' }}
type: light
20 changes: 10 additions & 10 deletions .github/workflows/schedule_nightly_test_a2.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -50,19 +50,19 @@ jobs:
matrix:
test_config:
- name: qwen3-next
os: linux-aarch64-a2-4
os: linux-aarch64-a2b3-4
tests: tests/e2e/nightly/single_node/models/test_qwen3_next.py
- name: qwen3-32b
os: linux-aarch64-a2-4
os: linux-aarch64-a2b3-4
tests: tests/e2e/nightly/single_node/models/test_qwen3_32b.py
- name: qwen3-32b-in8-a2
os: linux-aarch64-a2-4
os: linux-aarch64-a2b3-4
tests: tests/e2e/nightly/single_node/models/test_qwen3_32b_int8.py
- name: test_custom_op
os: linux-aarch64-a2-1
os: linux-aarch64-a2b3-1
tests: tests/e2e/nightly/single_node/ops/singlecard_ops
- name: test_custom_op_multi_card
os: linux-aarch64-a2-4
os: linux-aarch64-a2b3-4
tests: tests/e2e/nightly/single_node/ops/multicard_ops_a2/
uses: ./.github/workflows/_e2e_nightly_single_node.yaml
with:
Expand Down Expand Up @@ -108,26 +108,26 @@ jobs:
fail-fast: false
matrix:
test_config:
- os: linux-aarch64-a2-1
- os: linux-aarch64-a2b3-1
model_list:
- Qwen3-8B
- Qwen2-Audio-7B-Instruct
- Qwen3-8B-W8A8
- Qwen3-VL-8B-Instruct
- Qwen2.5-Omni-7B
- os: linux-aarch64-a2-1
- os: linux-aarch64-a2b3-1
model_list:
- ERNIE-4.5-21B-A3B-PT
- InternVL3_5-8B-hf
- Molmo-7B-D-0924
- Llama-3.2-3B-Instruct
- llava-onevision-qwen2-0.5b-ov-hf
- os: linux-aarch64-a2-2
- os: linux-aarch64-a2b3-2
model_list:
- Qwen3-30B-A3B
- Qwen3-VL-30B-A3B-Instruct
- Qwen3-30B-A3B-W8A8
- os: linux-aarch64-a2-4
- os: linux-aarch64-a2b3-4
model_list:
- Qwen3-Next-80B-A3B-Instruct
- Qwen3-Omni-30B-A3B-Instruct
Expand All @@ -147,7 +147,7 @@ jobs:
fail-fast: false
matrix:
vllm_verison: [releases-v0.13.0, releases-v0.13.0-openeuler, main, main-openeuler]
runs-on: linux-aarch64-a2-1
runs-on: linux-aarch64-a2b3-1
container:
image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/vllm-ascend:${{ matrix.vllm_verison }}
steps:
Expand Down
2 changes: 1 addition & 1 deletion .github/workflows/schedule_test_vllm_main.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -34,7 +34,7 @@ jobs:
uses: ./.github/workflows/_e2e_test.yaml
with:
vllm: main
runner: linux-aarch64-a2
runner: linux-aarch64-a2b3
image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.5.0-910b-ubuntu22.04-py3.11
contains_310: false
type: full
1 change: 0 additions & 1 deletion tests/e2e/models/configs/InternVL3_5-8B-hf.yaml
Original file line number Diff line number Diff line change
@@ -1,5 +1,4 @@
model_name: "OpenGVLab/InternVL3_5-8B-hf"
runner: "linux-aarch64-a2-1"
hardware: "Atlas A2 Series"
model: "vllm-vlm"
tasks:
Expand Down
4 changes: 2 additions & 2 deletions tests/e2e/nightly/single_node/models/test_qwen3_32b_int8.py
Original file line number Diff line number Diff line change
Expand Up @@ -45,10 +45,10 @@
}

batch_size_dict = {
"linux-aarch64-a2-4": 72,
"linux-aarch64-a2b3-4": 72,
"linux-aarch64-a3-4": 76,
}
VLLM_CI_RUNNER = os.getenv("VLLM_CI_RUNNER", "linux-aarch64-a2-4")
VLLM_CI_RUNNER = os.getenv("VLLM_CI_RUNNER", "linux-aarch64-a2b3-4")
Comment thread
zhangxinyuehfad marked this conversation as resolved.
performance_batch_size = batch_size_dict.get(VLLM_CI_RUNNER, 1)

aisbench_cases = [{
Expand Down
4 changes: 2 additions & 2 deletions tests/e2e/nightly/single_node/models/test_qwen3_next.py
Original file line number Diff line number Diff line change
Expand Up @@ -27,10 +27,10 @@
}

batch_size_dict = {
"linux-aarch64-a2-4": 64,
"linux-aarch64-a2b3-4": 64,
"linux-aarch64-a3-4": 64,
}
VLLM_CI_RUNNER = os.getenv("VLLM_CI_RUNNER", "linux-aarch64-a2-4")
VLLM_CI_RUNNER = os.getenv("VLLM_CI_RUNNER", "linux-aarch64-a2b3-4")
Comment thread
zhangxinyuehfad marked this conversation as resolved.
performance_batch_size = batch_size_dict.get(VLLM_CI_RUNNER, 1)

aisbench_cases = [{
Expand Down
Loading