From 8790d220d5e524bdf2236e28622eb0c3a9faf9cf Mon Sep 17 00:00:00 2001 From: Wing Lian Date: Tue, 6 Jan 2026 09:59:03 -0500 Subject: [PATCH 1/8] use vllm v0.13.0 --- .github/workflows/multi-gpu-e2e.yml | 2 +- .github/workflows/tests.yml | 2 +- setup.py | 1 + 3 files changed, 3 insertions(+), 2 deletions(-) diff --git a/.github/workflows/multi-gpu-e2e.yml b/.github/workflows/multi-gpu-e2e.yml index 833dc4f29a..27957aab07 100644 --- a/.github/workflows/multi-gpu-e2e.yml +++ b/.github/workflows/multi-gpu-e2e.yml @@ -40,7 +40,7 @@ jobs: cuda_version: 12.8.1 python_version: "3.11" pytorch: 2.9.1 - axolotl_extras: fbgemm-gpu + axolotl_extras: "fbgemm-gpu,vllm" num_gpus: 2 nightly_build: "true" - cuda: 130 diff --git a/.github/workflows/tests.yml b/.github/workflows/tests.yml index 75c70a24a1..3154666df6 100644 --- a/.github/workflows/tests.yml +++ b/.github/workflows/tests.yml @@ -325,7 +325,7 @@ jobs: python_version: "3.11" pytorch: 2.9.1 num_gpus: 1 - axolotl_extras: + axolotl_extras: vllm - cuda: 130 cuda_version: 13.0.0 python_version: "3.11" diff --git a/setup.py b/setup.py index 101c5b8c4b..0db31d5553 100644 --- a/setup.py +++ b/setup.py @@ -78,6 +78,7 @@ def parse_requirements(extras_require_map): extras_require_map["vllm"] = ["vllm==0.11.1"] if not install_xformers: _install_requires.pop(_install_requires.index(xformers_version)) + extras_require_map["vllm"] = ["vllm==0.13.0"] elif (major, minor) >= (2, 8): extras_require_map.pop("fbgemm-gpu") extras_require_map["fbgemm-gpu"] = ["fbgemm-gpu-genai==1.3.0"] From 2a088e347d6b9b5790180dba3e5672367c9e1aaf Mon Sep 17 00:00:00 2001 From: Wing Lian Date: Wed, 21 Jan 2026 09:32:09 -0500 Subject: [PATCH 2/8] support vllm 0.14.0 for torch 2.9.1 --- setup.py | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/setup.py b/setup.py index 0db31d5553..00a8486e22 100644 --- a/setup.py +++ b/setup.py @@ -79,6 +79,10 @@ def parse_requirements(extras_require_map): if not install_xformers: _install_requires.pop(_install_requires.index(xformers_version)) extras_require_map["vllm"] = ["vllm==0.13.0"] + if patch == 0: + extras_require_map["vllm"] = ["vllm==0.13.0"] + else: + extras_require_map["vllm"] = ["vllm==0.14.0"] elif (major, minor) >= (2, 8): extras_require_map.pop("fbgemm-gpu") extras_require_map["fbgemm-gpu"] = ["fbgemm-gpu-genai==1.3.0"] From 04c537d75b7fea680fb39b17787ed0ec82e52e60 Mon Sep 17 00:00:00 2001 From: Wing Lian Date: Wed, 21 Jan 2026 14:20:04 -0500 Subject: [PATCH 3/8] upgrade mistral-common --- requirements.txt | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/requirements.txt b/requirements.txt index 2b5ec0c38b..2ec4cde553 100644 --- a/requirements.txt +++ b/requirements.txt @@ -72,4 +72,4 @@ axolotl-contribs-mit==0.0.6 # telemetry posthog==6.7.11 -mistral-common==1.8.6 +mistral-common==1.8.8 From 18ca3992063f34ce546ddf5f6f2f8695b624a07b Mon Sep 17 00:00:00 2001 From: Wing Lian Date: Wed, 21 Jan 2026 15:55:08 -0500 Subject: [PATCH 4/8] cu129 required for vllm with torch 2.9.1 --- .github/workflows/multi-gpu-e2e.yml | 10 ++++++---- .github/workflows/tests.yml | 4 ++-- 2 files changed, 8 insertions(+), 6 deletions(-) diff --git a/.github/workflows/multi-gpu-e2e.yml b/.github/workflows/multi-gpu-e2e.yml index 27957aab07..e91cb65fc3 100644 --- a/.github/workflows/multi-gpu-e2e.yml +++ b/.github/workflows/multi-gpu-e2e.yml @@ -35,14 +35,18 @@ jobs: pytorch: 2.8.0 axolotl_extras: fbgemm-gpu num_gpus: 2 - nightly_build: "true" - cuda: 128 cuda_version: 12.8.1 python_version: "3.11" pytorch: 2.9.1 + axolotl_extras: "fbgemm-gpu" + num_gpus: 2 + - cuda: 129 + cuda_version: 12.9.1 + python_version: "3.12" + pytorch: 2.9.1 axolotl_extras: "fbgemm-gpu,vllm" num_gpus: 2 - nightly_build: "true" - cuda: 130 cuda_version: 13.0.0 python_version: "3.11" @@ -50,7 +54,6 @@ jobs: axolotl_extras: # axolotl_extras: fbgemm-gpu num_gpus: 2 - nightly_build: "true" runs-on: [self-hosted, modal] timeout-minutes: 120 steps: @@ -72,7 +75,6 @@ jobs: echo "AXOLOTL_EXTRAS=${{ matrix.axolotl_extras}}" >> $GITHUB_ENV echo "CUDA=${{ matrix.cuda }}" >> $GITHUB_ENV echo "N_GPUS=${{ matrix.num_gpus }}" >> $GITHUB_ENV - echo "NIGHTLY_BUILD=${{ matrix.nightly_build }}" >> $GITHUB_ENV echo "CODECOV_TOKEN=${{ secrets.CODECOV_TOKEN }}" >> $GITHUB_ENV - name: Run tests job on Modal run: | diff --git a/.github/workflows/tests.yml b/.github/workflows/tests.yml index 3154666df6..2c0dac7c14 100644 --- a/.github/workflows/tests.yml +++ b/.github/workflows/tests.yml @@ -269,7 +269,7 @@ jobs: python_version: "3.12" pytorch: 2.9.1 num_gpus: 1 - axolotl_extras: + axolotl_extras: vllm dockerfile: "Dockerfile-uv.jinja" steps: - name: Checkout @@ -325,7 +325,7 @@ jobs: python_version: "3.11" pytorch: 2.9.1 num_gpus: 1 - axolotl_extras: vllm + axolotl_extras: - cuda: 130 cuda_version: 13.0.0 python_version: "3.11" From 29677afce3c0a81a0779e6d64018cbe9697fcd59 Mon Sep 17 00:00:00 2001 From: Wing Lian Date: Wed, 21 Jan 2026 16:56:57 -0500 Subject: [PATCH 5/8] support dockerfile arg for multigpu ci for uv support --- .github/workflows/multi-gpu-e2e.yml | 2 ++ cicd/multigpu.py | 6 +++++- 2 files changed, 7 insertions(+), 1 deletion(-) diff --git a/.github/workflows/multi-gpu-e2e.yml b/.github/workflows/multi-gpu-e2e.yml index e91cb65fc3..c9af70a720 100644 --- a/.github/workflows/multi-gpu-e2e.yml +++ b/.github/workflows/multi-gpu-e2e.yml @@ -54,6 +54,7 @@ jobs: axolotl_extras: # axolotl_extras: fbgemm-gpu num_gpus: 2 + dockerfile: "Dockerfile-uv.jinja" runs-on: [self-hosted, modal] timeout-minutes: 120 steps: @@ -76,6 +77,7 @@ jobs: echo "CUDA=${{ matrix.cuda }}" >> $GITHUB_ENV echo "N_GPUS=${{ matrix.num_gpus }}" >> $GITHUB_ENV echo "CODECOV_TOKEN=${{ secrets.CODECOV_TOKEN }}" >> $GITHUB_ENV + echo "E2E_DOCKERFILE=${{ matrix.dockerfile || 'Dockerfile.jinja'}}" >> $GITHUB_ENV - name: Run tests job on Modal run: | modal run -m cicd.multigpu diff --git a/cicd/multigpu.py b/cicd/multigpu.py index 5bd8d3c044..ed022c851f 100644 --- a/cicd/multigpu.py +++ b/cicd/multigpu.py @@ -17,7 +17,8 @@ template_env = jinja2.Environment( loader=template_loader, autoescape=select_autoescape() ) -df_template = template_env.get_template("Dockerfile.jinja") +dockerfile = os.environ.get("E2E_DOCKERFILE", "Dockerfile.jinja") +df_template = template_env.get_template(dockerfile) df_args = { "AXOLOTL_EXTRAS": os.environ.get("AXOLOTL_EXTRAS", ""), @@ -27,8 +28,11 @@ "CUDA": os.environ.get("CUDA", "126"), "GITHUB_REF": os.environ.get("GITHUB_REF", "refs/heads/main"), "GITHUB_SHA": os.environ.get("GITHUB_SHA", ""), + "NIGHTLY_BUILD": os.environ.get("NIGHTLY_BUILD", ""), "CODECOV_TOKEN": os.environ.get("CODECOV_TOKEN", ""), "HF_HOME": "/workspace/data/huggingface-cache/hub", + "PYTHONUNBUFFERED": os.environ.get("PYTHONUNBUFFERED", "1"), + "DEEPSPEED_LOG_LEVEL": os.environ.get("DEEPSPEED_LOG_LEVEL", "WARNING"), } dockerfile_contents = df_template.render(**df_args) From 5813cd4834750442f621dc15cf4bdc1f7b71a4ed Mon Sep 17 00:00:00 2001 From: Wing Lian Date: Wed, 21 Jan 2026 16:58:32 -0500 Subject: [PATCH 6/8] use uv for vllm --- .github/workflows/multi-gpu-e2e.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/multi-gpu-e2e.yml b/.github/workflows/multi-gpu-e2e.yml index c9af70a720..107572ad62 100644 --- a/.github/workflows/multi-gpu-e2e.yml +++ b/.github/workflows/multi-gpu-e2e.yml @@ -47,6 +47,7 @@ jobs: pytorch: 2.9.1 axolotl_extras: "fbgemm-gpu,vllm" num_gpus: 2 + dockerfile: "Dockerfile-uv.jinja" - cuda: 130 cuda_version: 13.0.0 python_version: "3.11" @@ -54,7 +55,6 @@ jobs: axolotl_extras: # axolotl_extras: fbgemm-gpu num_gpus: 2 - dockerfile: "Dockerfile-uv.jinja" runs-on: [self-hosted, modal] timeout-minutes: 120 steps: From 04e2a65b159c26202cde8b30c3c8f614ff3b8dd2 Mon Sep 17 00:00:00 2001 From: Wing Lian Date: Wed, 21 Jan 2026 17:13:44 -0500 Subject: [PATCH 7/8] upgrade packaging to 26.0 --- .github/workflows/pypi.yml | 2 +- .github/workflows/tests-nightly.yml | 2 +- .github/workflows/tests.yml | 4 ++-- README.md | 2 +- cicd/Dockerfile-uv.jinja | 2 +- cicd/Dockerfile.jinja | 2 +- docker/Dockerfile-base | 2 +- docker/Dockerfile-base-nightly | 2 +- examples/apertus/README.md | 2 +- examples/arcee/README.md | 2 +- examples/devstral/README.md | 2 +- examples/gemma3n/README.md | 2 +- examples/gpt-oss/README.md | 2 +- examples/granite4/README.md | 2 +- examples/hunyuan/README.md | 2 +- examples/magistral/README.md | 2 +- examples/qwen3-next/README.md | 2 +- examples/voxtral/README.md | 2 +- pyproject.toml | 2 +- requirements.txt | 2 +- 20 files changed, 21 insertions(+), 21 deletions(-) diff --git a/.github/workflows/pypi.yml b/.github/workflows/pypi.yml index af2ad73a47..3bf66b4975 100644 --- a/.github/workflows/pypi.yml +++ b/.github/workflows/pypi.yml @@ -40,7 +40,7 @@ jobs: - name: Install dependencies run: | - pip3 install wheel packaging==23.2 + pip3 install wheel packaging==26.0 pip3 install --no-build-isolation -e . pip3 install -r requirements-dev.txt -r requirements-tests.txt diff --git a/.github/workflows/tests-nightly.yml b/.github/workflows/tests-nightly.yml index 67b68a7e60..21446e5488 100644 --- a/.github/workflows/tests-nightly.yml +++ b/.github/workflows/tests-nightly.yml @@ -48,7 +48,7 @@ jobs: - name: upgrade pip run: | pip3 install --upgrade pip - pip3 install --upgrade packaging==23.2 setuptools==75.8.0 wheel + pip3 install --upgrade packaging==26.0 setuptools==75.8.0 wheel - name: Install PyTorch run: | diff --git a/.github/workflows/tests.yml b/.github/workflows/tests.yml index 2c0dac7c14..bcbb76df3d 100644 --- a/.github/workflows/tests.yml +++ b/.github/workflows/tests.yml @@ -87,7 +87,7 @@ jobs: - name: upgrade pip run: | pip3 install --upgrade pip - pip3 install --upgrade packaging==23.2 setuptools==75.8.0 wheel + pip3 install --upgrade packaging==26.0 setuptools==75.8.0 wheel - name: Install PyTorch run: | @@ -182,7 +182,7 @@ jobs: - name: upgrade pip run: | pip3 install --upgrade pip - pip3 install --upgrade packaging==23.2 setuptools==75.8.0 setuptools_scm build wheel psutil + pip3 install --upgrade packaging==26.0 setuptools==75.8.0 setuptools_scm build wheel psutil - name: Install PyTorch run: | diff --git a/README.md b/README.md index 0521f7bedf..b56cdf0e84 100644 --- a/README.md +++ b/README.md @@ -88,7 +88,7 @@ Features: #### Using pip ```bash -pip3 install -U packaging==23.2 setuptools==75.8.0 wheel ninja +pip3 install -U packaging==26.0 setuptools==75.8.0 wheel ninja pip3 install --no-build-isolation axolotl[flash-attn,deepspeed] # Download example axolotl configs, deepspeed configs diff --git a/cicd/Dockerfile-uv.jinja b/cicd/Dockerfile-uv.jinja index 6a4d8a7d33..9a49cfca57 100644 --- a/cicd/Dockerfile-uv.jinja +++ b/cicd/Dockerfile-uv.jinja @@ -31,7 +31,7 @@ RUN if [ "$NIGHTLY_BUILD" = "true" ] ; then \ sed -i 's#^datasets.*#datasets @ git+https://github.com/huggingface/datasets.git@main#' requirements.txt; \ fi -RUN uv pip install packaging==23.2 setuptools==75.8.0 +RUN uv pip install packaging==26.0 setuptools==75.8.0 RUN uv pip install torchvision RUN if [ "$AXOLOTL_EXTRAS" != "" ] ; then \ uv pip install --no-build-isolation -e .[deepspeed,flash-attn,ring-flash-attn,optimizers,ray,$AXOLOTL_EXTRAS] $AXOLOTL_ARGS; \ diff --git a/cicd/Dockerfile.jinja b/cicd/Dockerfile.jinja index 81ed5453e3..1c397b011d 100644 --- a/cicd/Dockerfile.jinja +++ b/cicd/Dockerfile.jinja @@ -32,7 +32,7 @@ RUN if [ "$NIGHTLY_BUILD" = "true" ] ; then \ sed -i 's#^datasets.*#datasets @ git+https://github.com/huggingface/datasets.git@main#' requirements.txt; \ fi -RUN pip install packaging==23.2 setuptools==75.8.0 psutil +RUN pip install packaging==26.0 setuptools==75.8.0 psutil RUN if [ "$AXOLOTL_EXTRAS" != "" ] ; then \ pip install --no-build-isolation -e .[deepspeed,flash-attn,ring-flash-attn,optimizers,ray,$AXOLOTL_EXTRAS] $AXOLOTL_ARGS; \ else \ diff --git a/docker/Dockerfile-base b/docker/Dockerfile-base index 96367207fb..547c45f49f 100644 --- a/docker/Dockerfile-base +++ b/docker/Dockerfile-base @@ -43,7 +43,7 @@ ENV PATH="/root/miniconda3/envs/py${PYTHON_VERSION}/bin:${PATH}" WORKDIR /workspace -RUN python3 -m pip install --upgrade pip && pip3 install -U packaging==23.2 setuptools==75.8.0 wheel psutil && \ +RUN python3 -m pip install --upgrade pip && pip3 install -U packaging==26.0 setuptools==75.8.0 wheel psutil && \ python3 -m pip install --no-cache-dir -U torch==${PYTORCH_VERSION}+cu${CUDA} torchvision --extra-index-url https://download.pytorch.org/whl/cu$CUDA && \ python3 -m pip cache purge diff --git a/docker/Dockerfile-base-nightly b/docker/Dockerfile-base-nightly index cc74e6bb9b..98dc9e8804 100644 --- a/docker/Dockerfile-base-nightly +++ b/docker/Dockerfile-base-nightly @@ -30,7 +30,7 @@ ENV PATH="/root/miniconda3/envs/py${PYTHON_VERSION}/bin:${PATH}" WORKDIR /workspace -RUN python3 -m pip install --upgrade pip && pip3 install -U packaging==23.2 setuptools==75.8.0 wheel && \ +RUN python3 -m pip install --upgrade pip && pip3 install -U packaging==26.0 setuptools==75.8.0 wheel && \ python3 -m pip install --no-cache-dir -U torch --extra-index-url https://download.pytorch.org/whl/nightly/cu$CUDA && \ python3 -m pip install --no-cache-dir "causal_conv1d @ git+https://github.com/Dao-AILab/causal-conv1d.git@main" && \ python3 -m pip install --no-cache-dir "mamba_ssm @ git+https://github.com/state-spaces/mamba.git@main" && \ diff --git a/examples/apertus/README.md b/examples/apertus/README.md index 774286333a..1cb4d413ce 100644 --- a/examples/apertus/README.md +++ b/examples/apertus/README.md @@ -15,7 +15,7 @@ This guide shows how to fine-tune it with Axolotl with multi-turn conversations git clone https://github.com/axolotl-ai-cloud/axolotl.git cd axolotl -pip3 install packaging==23.2 setuptools==75.8.0 wheel ninja +pip3 install packaging==26.0 setuptools==75.8.0 wheel ninja pip3 install --no-build-isolation -e '.[flash-attn]' # Install CCE https://docs.axolotl.ai/docs/custom_integrations.html#cut-cross-entropy diff --git a/examples/arcee/README.md b/examples/arcee/README.md index 23f63663e7..ad554532c1 100644 --- a/examples/arcee/README.md +++ b/examples/arcee/README.md @@ -17,7 +17,7 @@ Thanks to the team at Arcee.ai for using Axolotl in supervised fine-tuning the A git clone https://github.com/axolotl-ai-cloud/axolotl.git cd axolotl -pip3 install packaging==23.2 setuptools==75.8.0 wheel ninja +pip3 install packaging==26.0 setuptools==75.8.0 wheel ninja pip3 install --no-build-isolation -e '.[flash-attn]' # Install CCE https://docs.axolotl.ai/docs/custom_integrations.html#cut-cross-entropy diff --git a/examples/devstral/README.md b/examples/devstral/README.md index ae08606628..5a0145f103 100644 --- a/examples/devstral/README.md +++ b/examples/devstral/README.md @@ -16,7 +16,7 @@ Thanks to the team at MistralAI for giving us early access to prepare for this r ```bash # Ensure you have Pytorch installed (Pytorch 2.6.0 min) -pip3 install packaging==23.2 setuptools==75.8.0 wheel ninja +pip3 install packaging==26.0 setuptools==75.8.0 wheel ninja pip3 install --no-build-isolation 'axolotl[flash-attn]>=0.12.0' ``` diff --git a/examples/gemma3n/README.md b/examples/gemma3n/README.md index ff3946c906..4808ed81be 100644 --- a/examples/gemma3n/README.md +++ b/examples/gemma3n/README.md @@ -10,7 +10,7 @@ Gemma-3n is a family of multimodal models from Google found on [HuggingFace](htt ```bash # Ensure you have Pytorch installed (Pytorch 2.6.0 min) -pip3 install packaging==23.2 setuptools==75.8.0 wheel ninja +pip3 install packaging==26.0 setuptools==75.8.0 wheel ninja pip3 install --no-build-isolation 'axolotl[flash-attn]>=0.12.0' ``` diff --git a/examples/gpt-oss/README.md b/examples/gpt-oss/README.md index 9ab02b122b..8c407540ed 100644 --- a/examples/gpt-oss/README.md +++ b/examples/gpt-oss/README.md @@ -14,7 +14,7 @@ This guide shows how to fine-tune it with Axolotl with multi-turn conversations ```bash # Ensure you have Pytorch installed (Pytorch 2.6.0 min) -pip3 install packaging==23.2 setuptools==75.8.0 wheel ninja +pip3 install packaging==26.0 setuptools==75.8.0 wheel ninja pip3 install --no-build-isolation 'axolotl[flash-attn]>=0.12.0' ``` diff --git a/examples/granite4/README.md b/examples/granite4/README.md index d5efd3349f..0495394054 100644 --- a/examples/granite4/README.md +++ b/examples/granite4/README.md @@ -15,7 +15,7 @@ This guide shows how to fine-tune it with Axolotl with multi-turn conversations git clone https://github.com/axolotl-ai-cloud/axolotl.git cd axolotl -pip3 install packaging==23.2 setuptools==75.8.0 wheel ninja +pip3 install packaging==26.0 setuptools==75.8.0 wheel ninja pip3 install --no-build-isolation -e '.[flash-attn]' # Install CCE https://docs.axolotl.ai/docs/custom_integrations.html#cut-cross-entropy diff --git a/examples/hunyuan/README.md b/examples/hunyuan/README.md index 96c6bbcfa8..59e9a28c78 100644 --- a/examples/hunyuan/README.md +++ b/examples/hunyuan/README.md @@ -13,7 +13,7 @@ Tencent released a family of opensource models called HunYuan with varying param git clone https://github.com/axolotl-ai-cloud/axolotl.git cd axolotl -pip3 install packaging==23.2 setuptools==75.8.0 wheel ninja +pip3 install packaging==26.0 setuptools==75.8.0 wheel ninja pip3 install --no-build-isolation -e '.[flash-attn]' # Install CCE https://docs.axolotl.ai/docs/custom_integrations.html#cut-cross-entropy diff --git a/examples/magistral/README.md b/examples/magistral/README.md index 40a793f109..2e162df6b6 100644 --- a/examples/magistral/README.md +++ b/examples/magistral/README.md @@ -14,7 +14,7 @@ Thanks to the team at MistralAI for giving us early access to prepare for these ```bash # Ensure you have Pytorch installed (Pytorch 2.7.0 min) -pip3 install packaging==23.2 setuptools==75.8.0 wheel ninja +pip3 install packaging==26.0 setuptools==75.8.0 wheel ninja pip3 install --no-build-isolation 'axolotl[flash-attn]>=0.12.0' ``` diff --git a/examples/qwen3-next/README.md b/examples/qwen3-next/README.md index 678175fd40..3c3a26a762 100644 --- a/examples/qwen3-next/README.md +++ b/examples/qwen3-next/README.md @@ -15,7 +15,7 @@ This guide shows how to fine-tune it with Axolotl with multi-turn conversations git clone https://github.com/axolotl-ai-cloud/axolotl.git cd axolotl -pip3 install packaging==23.2 setuptools==75.8.0 wheel ninja +pip3 install packaging==26.0 setuptools==75.8.0 wheel ninja pip3 install --no-build-isolation -e '.[flash-attn]' # Install CCE https://docs.axolotl.ai/docs/custom_integrations.html#cut-cross-entropy diff --git a/examples/voxtral/README.md b/examples/voxtral/README.md index b77691d72b..2d3cad4e9a 100644 --- a/examples/voxtral/README.md +++ b/examples/voxtral/README.md @@ -12,7 +12,7 @@ Thanks to the team at MistralAI for giving us early access to prepare for this r ```bash # Ensure you have Pytorch installed (Pytorch 2.6.0 min) -pip3 install packaging==23.2 setuptools==75.8.0 wheel ninja +pip3 install packaging==26.0 setuptools==75.8.0 wheel ninja pip3 install --no-build-isolation 'axolotl[flash-attn]>=0.12.0' ``` diff --git a/pyproject.toml b/pyproject.toml index c5b7deb05e..bca758576e 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -1,5 +1,5 @@ [build-system] -requires = ["setuptools>=64", "wheel", "setuptools_scm>=8", "packaging==23.2"] +requires = ["setuptools>=64", "wheel", "setuptools_scm>=8", "packaging==26.0"] build-backend = "setuptools.build_meta" [project] diff --git a/requirements.txt b/requirements.txt index 2ec4cde553..2d5fa12fcc 100644 --- a/requirements.txt +++ b/requirements.txt @@ -8,7 +8,7 @@ xformers>=0.0.23.post1 liger-kernel==0.6.4 # END section -packaging==23.2 +packaging==26.0 huggingface_hub>=0.36.0 peft>=0.18.1 From e5fe9b846413660a0210c59b7b633753eff3debb Mon Sep 17 00:00:00 2001 From: Wing Lian Date: Wed, 21 Jan 2026 17:30:33 -0500 Subject: [PATCH 8/8] build vllm in ci too --- .github/workflows/main.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index e081f21272..0e1ccb89a3 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -38,7 +38,7 @@ jobs: cuda_version: 12.9.1 python_version: "3.12" pytorch: 2.9.1 - axolotl_extras: + axolotl_extras: vllm platforms: "linux/amd64,linux/arm64" - cuda: 130 cuda_version: 13.0.0