Skip to content
Merged
Show file tree
Hide file tree
Changes from 26 commits
Commits
Show all changes
31 commits
Select commit Hold shift + click to select a range
36ca90e
Add Llama 4 to FA3 test
hebiao064 Apr 17, 2025
470c00e
fix
hebiao064 Apr 17, 2025
b337473
Merge branch 'main' into add_llama4_to_fa3_test
hebiao064 Apr 17, 2025
ea771dc
fix
hebiao064 Apr 17, 2025
9b73dab
Merge branch 'add_llama4_to_fa3_test' of https://github.com/hebiao064…
hebiao064 Apr 17, 2025
56b7726
Rename test class for local attention
hebiao064 Apr 17, 2025
1dde6f2
Merge branch 'main' into add_llama4_to_fa3_test
hebiao064 Apr 19, 2025
1d6e882
delete cuda graph disabled test
hebiao064 Apr 19, 2025
edb689b
fix
hebiao064 Apr 19, 2025
5835630
Merge branch 'main' into add_llama4_to_fa3_test
hebiao064 Apr 19, 2025
0141af6
fix
hebiao064 Apr 19, 2025
11f37a0
Merge branch 'add_llama4_to_fa3_test' of https://github.com/hebiao064…
hebiao064 Apr 19, 2025
b0f72fb
Merge branch 'main' into add_llama4_to_fa3_test
hebiao064 Apr 19, 2025
748eec5
Merge branch 'main' into add_llama4_to_fa3_test
hebiao064 Apr 20, 2025
1f97c4f
Merge branch 'main' into add_llama4_to_fa3_test
zhyncs Apr 21, 2025
24199db
fix
hebiao064 Apr 21, 2025
88200a5
fix
hebiao064 Apr 21, 2025
9ddc783
fix
hebiao064 Apr 21, 2025
3b4e9e7
fix
hebiao064 Apr 21, 2025
afae7bc
Merge branch 'main' into add_llama4_to_fa3_test
hebiao064 Apr 21, 2025
4aaa9ff
merge
hebiao064 Apr 22, 2025
db662b4
fix
hebiao064 Apr 22, 2025
d365cfd
fix
hebiao064 Apr 22, 2025
1dcd1d5
Merge branch 'main' into add_llama4_to_fa3_test
merrymercy Apr 23, 2025
8b14fce
Update utils.py
merrymercy Apr 23, 2025
bf98724
fix
hebiao064 Apr 23, 2025
801e705
Merge branch 'main' into add_llama4_to_fa3_test
hebiao064 Apr 25, 2025
414f311
adjust context len for llama 4 to avoid oom
hebiao064 Apr 25, 2025
78e6f3c
Merge branch 'main' into add_llama4_to_fa3_test
hebiao064 Apr 25, 2025
96aaea3
Merge branch 'main' into add_llama4_to_fa3_test
hebiao064 Apr 26, 2025
358fc9c
disable torch compile
hebiao064 Apr 26, 2025
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
20 changes: 20 additions & 0 deletions .github/workflows/pr-test.yml
Original file line number Diff line number Diff line change
Expand Up @@ -87,6 +87,26 @@ jobs:
cd test/srt
python3 run_suite.py --suite per-commit-2-gpu

# CI job: runs the "per-commit-8-gpu" test suite from test/srt on the 8-gpu-runner.
unit-test-backend-8-gpu:
# Run when the repository is sgl-project/sglang or the event is a pull_request,
# and only when the pull request is not marked as a draft.
if: (github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') &&
github.event.pull_request.draft == false
runs-on: 8-gpu-runner
steps:
- name: Checkout code
uses: actions/checkout@v4

- name: Install dependencies
env:
# Nightly FlashInfer wheel index when inputs.version is 'nightly', otherwise the
# stable cu124/torch2.5 index. Presumably read by the install script — TODO confirm.
FLASHINFER_REPO: ${{ inputs.version == 'nightly' && 'https://flashinfer.ai/whl/nightly/cu124/torch2.5/flashinfer-python' || 'https://flashinfer.ai/whl/cu124/torch2.5/flashinfer-python' }}
run: |
bash scripts/ci_install_dependency.sh

- name: Run test
# Upper bound on this step's runtime, in minutes.
timeout-minutes: 30
run: |
cd test/srt
python3 run_suite.py --suite per-commit-8-gpu

performance-test-1-gpu-part-1:
if: (github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') &&
github.event.pull_request.draft == false
Expand Down
6 changes: 6 additions & 0 deletions python/sglang/test/test_utils.py
Original file line number Diff line number Diff line change
Expand Up @@ -44,7 +44,13 @@
)

# Default model identifiers used by tests. The values have the "org/name" shape
# of Hugging Face Hub repo ids — NOTE(review): confirm how callers resolve them.
DEFAULT_MODEL_NAME_FOR_TEST = "meta-llama/Llama-3.1-8B-Instruct"
DEFAULT_MODEL_NAME_FOR_TEST_EAGLE3 = "jamesliu1/sglang-EAGLE3-Llama-3.1-Instruct-8B"
DEFAULT_MODEL_NAME_FOR_TEST_MLA = "lmsys/sglang-ci-dsv3-test"
DEFAULT_MODEL_NAME_FOR_TEST_MLA_NEXTN = "lmsys/sglang-ci-dsv3-test-NextN"
DEFAULT_SMALL_MODEL_NAME_FOR_TEST = "meta-llama/Llama-3.2-1B-Instruct"
# Llama 4 Scout; per the constant's name, the default model for local-attention tests.
DEFAULT_MODEL_NAME_FOR_TEST_LOCAL_ATTENTION = (
"meta-llama/Llama-4-Scout-17B-16E-Instruct"
)
# Mixture-of-experts and embedding defaults (per the constant names).
DEFAULT_MOE_MODEL_NAME_FOR_TEST = "mistralai/Mixtral-8x7B-Instruct-v0.1"
DEFAULT_SMALL_MOE_MODEL_NAME_FOR_TEST = "Qwen/Qwen1.5-MoE-A2.7B"
DEFAULT_SMALL_EMBEDDING_MODEL_NAME_FOR_TEST = "Alibaba-NLP/gte-Qwen2-1.5B-instruct"
Expand Down
4 changes: 3 additions & 1 deletion test/srt/run_suite.py
Original file line number Diff line number Diff line change
Expand Up @@ -29,7 +29,6 @@ class TestFile:
TestFile("test_chunked_prefill.py", 336),
TestFile("test_eagle_infer.py", 500),
TestFile("test_ebnf_constrained.py"),
TestFile("test_fa3.py", 200),
TestFile("test_fp8_kernel.py", 8),
TestFile("test_embedding_openai_server.py", 36),
TestFile("test_hidden_states.py", 55),
Expand Down Expand Up @@ -90,6 +89,9 @@ class TestFile:
TestFile("test_update_weights_from_distributed.py", 100),
TestFile("test_verl_engine.py", 100),
],
"per-commit-8-gpu": [
TestFile("test_fa3.py", 30),
],
"nightly": [
TestFile("test_nightly_gsm8k_eval.py"),
],
Expand Down
Loading
Loading