Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion docker/Dockerfile
Original file line number Diff line number Diff line change
Expand Up @@ -11,7 +11,7 @@ ARG GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2
ARG HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6
ARG DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee
ARG BUILD_AND_DOWNLOAD_PARALLEL=8
ARG SGL_KERNEL_VERSION=0.4.1
ARG SGL_KERNEL_VERSION=0.4.1.post1
ARG SGL_VERSION
ARG USE_LATEST_SGLANG=0
ARG GDRCOPY_VERSION=2.5.1
Expand Down
2 changes: 1 addition & 1 deletion python/pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -59,7 +59,7 @@ dependencies = [
"sentencepiece",
"setproctitle",
"flash-attn-4>=4.0.0b9",
"sglang-kernel==0.4.1",
"sglang-kernel==0.4.1.post1",
"soundfile==0.13.1",
"tiktoken",
"timm==1.0.16",
Expand Down
2 changes: 1 addition & 1 deletion python/sglang/srt/entrypoints/engine.py
Original file line number Diff line number Diff line change
Expand Up @@ -1170,7 +1170,7 @@ def _set_envs_and_config(server_args: ServerArgs):
if _is_cuda:
assert_pkg_version(
"sglang-kernel",
"0.4.1",
"0.4.1.post1",
"Please reinstall the latest version with `pip install sglang-kernel --force-reinstall`",
)

Expand Down
Original file line number Diff line number Diff line change
@@ -1,8 +1,3 @@
"""
# TODO: Fails on cu13 venv migration. Ref: https://github.com/sgl-project/sglang/actions/runs/24616960626/job/71980705674?pr=23119
# Should move back to registered test after it's fixed
"""

import shutil
import tempfile
import unittest
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -3,11 +3,6 @@
register_cuda_ci(est_time=99, suite="stage-b-test-1-gpu-small")
register_amd_ci(est_time=300, suite="stage-b-test-1-gpu-small-amd")

"""
# TODO: Segmentation fault occurs when upgraded to Cu13. Ref: https://github.com/sgl-project/sglang/actions/runs/24603159715/job/71945537414?pr=23119")
# Should move back to registered test after it's fixed
"""

import time
import unittest

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -2,8 +2,6 @@
Benchmark tests for HiCache Storage with 3FS backend.
Usage:
python3 -m pytest test/registered/hicache/test_hicache_storage_3fs_backend.py -v
# TODO: Segmentation fault occurs when upgraded to Cu13. Ref: https://github.com/sgl-project/sglang/actions/runs/24603159715/job/71945537414?pr=23119")
# Should move back to registered test after it's fixed
"""

import json
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -2,8 +2,6 @@
E2E tests for HiCache Storage functionality.
Usage:
python3 -m pytest test/registered/hicache/test_hicache_storage_file_backend.py -v
# TODO: Segmentation fault occurs when upgraded to Cu13. Ref: https://github.com/sgl-project/sglang/actions/runs/24603159715/job/71945537414?pr=23119")
# Should move back to registered test after it's fixed
"""

import json
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -4,9 +4,6 @@
python3.10 -m pytest test/registered/hicache/test_hicache_storage_mooncake_backend.py -v
"""

# TODO: Segmentation fault occurs when upgraded to Cu13. Ref: https://github.com/sgl-project/sglang/actions/runs/24601791606/job/71942123195?pr=23119")
# Should move back to registered test after it's fixed

import os
import subprocess
import time
Expand All @@ -15,13 +12,16 @@
import requests
from test_hicache_storage_file_backend import HiCacheStorageBaseMixin

from sglang.test.ci.ci_register import register_cuda_ci
from sglang.test.test_utils import (
DEFAULT_MLA_MODEL_NAME_FOR_TEST,
CustomTestCase,
find_available_port,
is_in_ci,
)

register_cuda_ci(est_time=236, suite="stage-b-test-2-gpu-large")


class HiCacheStorageMooncakeBackendBaseMixin(HiCacheStorageBaseMixin):
"""Base mixin class with common setup and utilities"""
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -7,8 +7,6 @@

Usage:
python3 -m pytest test/registered/hicache/test_hicache_storage_runtime_attach_detach.py -v
# TODO: Segmentation fault occurs when upgraded to Cu13. Ref: https://github.com/sgl-project/sglang/actions/runs/24603159715/job/71945537414?pr=23119")
# Should move back to registered test after it's fixed
"""

import json
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -5,8 +5,6 @@
"""
Consolidated HiCache variant tests.
Tests HiCache with different configurations: standard, MLA, EAGLE, and page size variants.
# TODO: Segmentation fault occurs when upgraded to Cu13. Ref: https://github.com/sgl-project/sglang/actions/runs/24603159715/job/71945537414?pr=23119")
# Should move back to registered test after it's fixed
"""

import unittest
Expand Down
Loading