diff --git a/python/sglang/srt/managers/scheduler.py b/python/sglang/srt/managers/scheduler.py index 5b3f3b301593..5b6bd51754be 100644 --- a/python/sglang/srt/managers/scheduler.py +++ b/python/sglang/srt/managers/scheduler.py @@ -289,9 +289,6 @@ def __init__( self.enable_metrics_for_all_schedulers = ( server_args.enable_metrics_for_all_schedulers ) - self.enable_kv_cache_events = bool( - server_args.kv_events_config and tp_rank == 0 - ) self.enable_trace = server_args.enable_trace self.stream_interval = server_args.stream_interval self.spec_algorithm = SpeculativeAlgorithm.from_string( @@ -313,6 +310,10 @@ def __init__( ) ) + self.enable_kv_cache_events = bool( + server_args.kv_events_config and self.attn_tp_rank == 0 + ) + # Init model configs self.init_model_config() diff --git a/test/manual/test_kv_events.py b/test/manual/test_kv_events.py index 4693140e548f..0f657333c6f9 100644 --- a/test/manual/test_kv_events.py +++ b/test/manual/test_kv_events.py @@ -13,6 +13,7 @@ ) from sglang.srt.utils import kill_process_tree from sglang.test.test_utils import ( + DEFAULT_MLA_MODEL_NAME_FOR_TEST, DEFAULT_SMALL_MODEL_NAME_FOR_TEST, DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH, DEFAULT_URL_FOR_TEST, @@ -154,6 +155,8 @@ def test_kv_events_enabled(self): pass finally: + sub.close() + context.term() kill_process_tree(process.pid) def test_kv_events_attn_dp(self): @@ -175,7 +178,7 @@ def test_kv_events_attn_dp(self): # Launch sglang server with DP attention enabled process = popen_launch_server( - "silence09/DeepSeek-R1-Small-2layers", + DEFAULT_MLA_MODEL_NAME_FOR_TEST, DEFAULT_URL_FOR_TEST, timeout=DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH, other_args=[