From 362a95ffabccd78c93e6e73460e985c670403b7e Mon Sep 17 00:00:00 2001
From: alisonshao
Date: Fri, 13 Feb 2026 17:16:57 -0800
Subject: [PATCH] Enable DeepGemm fast warmup in CI to prevent timeout on cold cache

When CI runners restart, the DeepGemm cache is lost, causing a full
warmup that compiles up to 128K kernel variants (~30 min), which exceeds
CI timeouts. Enable SGLANG_JIT_DEEPGEMM_FAST_WARMUP to reduce compilation
to ~3K variants (<3 min warmup).
---
 .github/workflows/pr-test.yml | 1 +
 1 file changed, 1 insertion(+)

diff --git a/.github/workflows/pr-test.yml b/.github/workflows/pr-test.yml
index fbccef8719cf..5678aab4f811 100644
--- a/.github/workflows/pr-test.yml
+++ b/.github/workflows/pr-test.yml
@@ -62,6 +62,7 @@ concurrency:
 
 env:
   SGLANG_IS_IN_CI: true
+  SGLANG_JIT_DEEPGEMM_FAST_WARMUP: true
 
 permissions:
   actions: write