From 2e548574bbc59594456b0cfb686698e2f7ee0143 Mon Sep 17 00:00:00 2001
From: Michael <13900043+michaelzhang-ai@users.noreply.github.com>
Date: Tue, 17 Mar 2026 01:24:06 -0500
Subject: [PATCH] [AMD] CI: stop installing transformers from git main in Qwen 3.5 and GLM-5 nightly tests

Transformers PR huggingface/transformers#41250 (merged Mar 16) converts
PretrainedConfig subclasses to @dataclass via __init_subclass__, which
breaks sglang's DeepseekVL2Config (non-default field ordering) and
prevents the server from starting at all.

Remove `pip install git+https://github.com/huggingface/transformers.git`
from all Qwen 3.5 and GLM-5 CI jobs (MI30x, MI35x, ROCm 7.0 and 7.2).
Use the stable transformers shipped in the docker image instead,
matching all other nightly jobs (Grok2, DeepSeek-V3.2, etc.).

Keep mistral-common and lm-eval[api] for Qwen 3.5 tests that need them.
---
 .github/workflows/nightly-test-amd-rocm720.yml | 8 ++------
 .github/workflows/nightly-test-amd.yml         | 8 ++------
 2 files changed, 4 insertions(+), 12 deletions(-)

diff --git a/.github/workflows/nightly-test-amd-rocm720.yml b/.github/workflows/nightly-test-amd-rocm720.yml
index d94c0f86ccd7..464689655cfd 100644
--- a/.github/workflows/nightly-test-amd-rocm720.yml
+++ b/.github/workflows/nightly-test-amd-rocm720.yml
@@ -608,7 +608,7 @@ jobs:
       - name: Install dependencies
         run: |
           bash scripts/ci/amd/amd_ci_install_dependency.sh --skip-aiter-build --skip-test-time-deps
-          bash scripts/ci/amd/amd_ci_exec.sh pip install git+https://github.com/huggingface/transformers.git mistral-common "lm-eval[api]" --upgrade
+          bash scripts/ci/amd/amd_ci_exec.sh pip install mistral-common "lm-eval[api]"
 
       - name: Accuracy Test ROCm 7.2 (8-GPU Qwen 3.5)
         timeout-minutes: 120
@@ -640,8 +640,6 @@ jobs:
       - name: Install dependencies
         run: |
           bash scripts/ci/amd/amd_ci_install_dependency.sh --skip-test-time-deps
-          # GLM-5 requires latest transformers for glm_moe_dsa architecture
-          bash scripts/ci/amd/amd_ci_exec.sh pip install git+https://github.com/huggingface/transformers.git
 
       - name: Accuracy Test ROCm 7.2 (8-GPU GLM-5 NSA)
         timeout-minutes: 120
@@ -1196,7 +1194,7 @@ jobs:
         run: |
           bash scripts/ci/amd/amd_ci_install_dependency.sh --skip-aiter-build --skip-test-time-deps
           bash scripts/ci/amd/amd_ci_exec.sh pip install tabulate
-          bash scripts/ci/amd/amd_ci_exec.sh pip install git+https://github.com/huggingface/transformers.git mistral-common "lm-eval[api]" --upgrade
+          bash scripts/ci/amd/amd_ci_exec.sh pip install mistral-common "lm-eval[api]"
 
       - name: Accuracy Test MI35x ROCm 7.2 (8-GPU Qwen 3.5)
         timeout-minutes: 120
@@ -1229,8 +1227,6 @@ jobs:
           bash scripts/ci/amd/amd_ci_install_dependency.sh --skip-test-time-deps
           # Install tabulate for run_suite.py (missing in MI35x container)
           bash scripts/ci/amd/amd_ci_exec.sh pip install tabulate
-          # GLM-5 requires latest transformers for glm_moe_dsa architecture
-          bash scripts/ci/amd/amd_ci_exec.sh pip install git+https://github.com/huggingface/transformers.git
 
       - name: Accuracy Test MI35x ROCm 7.2 (8-GPU GLM-5 NSA)
         timeout-minutes: 180
diff --git a/.github/workflows/nightly-test-amd.yml b/.github/workflows/nightly-test-amd.yml
index 5aa969b73c98..f004580ea6f2 100644
--- a/.github/workflows/nightly-test-amd.yml
+++ b/.github/workflows/nightly-test-amd.yml
@@ -612,7 +612,7 @@ jobs:
       - name: Install dependencies
         run: |
           bash scripts/ci/amd/amd_ci_install_dependency.sh
-          bash scripts/ci/amd/amd_ci_exec.sh pip install git+https://github.com/huggingface/transformers.git mistral-common "lm-eval[api]" --upgrade
+          bash scripts/ci/amd/amd_ci_exec.sh pip install mistral-common "lm-eval[api]"
 
       - name: Accuracy Test (8-GPU Qwen 3.5)
         timeout-minutes: 120
@@ -643,8 +643,6 @@ jobs:
       - name: Install dependencies
         run: |
           bash scripts/ci/amd/amd_ci_install_dependency.sh
-          # GLM-5 requires latest transformers for glm_moe_dsa architecture
-          bash scripts/ci/amd/amd_ci_exec.sh pip install git+https://github.com/huggingface/transformers.git
 
       - name: Accuracy Test (8-GPU GLM-5 NSA)
         timeout-minutes: 120
@@ -1202,7 +1200,7 @@ jobs:
         run: |
           bash scripts/ci/amd/amd_ci_install_dependency.sh
           bash scripts/ci/amd/amd_ci_exec.sh pip install tabulate
-          bash scripts/ci/amd/amd_ci_exec.sh pip install git+https://github.com/huggingface/transformers.git mistral-common "lm-eval[api]" --upgrade
+          bash scripts/ci/amd/amd_ci_exec.sh pip install mistral-common "lm-eval[api]"
 
       - name: Accuracy Test MI35x (8-GPU Qwen 3.5)
         timeout-minutes: 120
@@ -1235,8 +1233,6 @@ jobs:
           bash scripts/ci/amd/amd_ci_install_dependency.sh
           # Install tabulate for run_suite.py (missing in MI35x container)
           bash scripts/ci/amd/amd_ci_exec.sh pip install tabulate
-          # GLM-5 requires latest transformers for glm_moe_dsa architecture
-          bash scripts/ci/amd/amd_ci_exec.sh pip install git+https://github.com/huggingface/transformers.git
 
       - name: Accuracy Test MI35x (8-GPU GLM-5 NSA)
         timeout-minutes: 180