diff --git a/.buildkite/vllm_lkg.version b/.buildkite/vllm_lkg.version index 736f427393..7b952fd527 100644 --- a/.buildkite/vllm_lkg.version +++ b/.buildkite/vllm_lkg.version @@ -1 +1 @@ -ee8a29511fc69e3f0f6291fa6ff1cf6e47f7750d +e5ff140216272c529261b02b6fd13fc480713735 diff --git a/tests/platforms/test_tpu_platform.py b/tests/platforms/test_tpu_platform.py index 7dfe112cb1..07ee7dec14 100644 --- a/tests/platforms/test_tpu_platform.py +++ b/tests/platforms/test_tpu_platform.py @@ -27,7 +27,6 @@ class TestTpuPlatform: def vllm_config(self): cache_config = CacheConfig(block_size=16, gpu_memory_utilization=0.9, - swap_space=4, cache_dtype="fp8") vllm_config = MagicMock(spec=VllmConfig) diff --git a/tests/runner/test_kv_cache_manager.py b/tests/runner/test_kv_cache_manager.py index 86b37098dd..2ac46edc95 100644 --- a/tests/runner/test_kv_cache_manager.py +++ b/tests/runner/test_kv_cache_manager.py @@ -63,7 +63,6 @@ def _setup_runner(self, use_mla: bool = False): cache_config = CacheConfig( block_size=16, gpu_memory_utilization=0.9, - swap_space=4, cache_dtype="auto", ) scheduler_config = SchedulerConfig(max_num_seqs=16, diff --git a/tests/runner/test_multimodal_manager.py b/tests/runner/test_multimodal_manager.py index 648560bf56..9bf1739667 100644 --- a/tests/runner/test_multimodal_manager.py +++ b/tests/runner/test_multimodal_manager.py @@ -53,7 +53,6 @@ def setup_method(self): cache_config = CacheConfig( block_size=16, gpu_memory_utilization=0.9, - swap_space=4, cache_dtype="auto", ) scheduler_config = SchedulerConfig(max_num_seqs=16, diff --git a/tests/runner/test_speculative_decoding_manager.py b/tests/runner/test_speculative_decoding_manager.py index 4bd897ce2c..259c8b1a81 100644 --- a/tests/runner/test_speculative_decoding_manager.py +++ b/tests/runner/test_speculative_decoding_manager.py @@ -52,7 +52,6 @@ def setup_method(self): cache_config = CacheConfig( block_size=16, gpu_memory_utilization=0.9, - swap_space=4, cache_dtype="auto", ) scheduler_config = SchedulerConfig(max_num_seqs=16, diff --git a/tests/runner/test_structured_decoding_manager.py b/tests/runner/test_structured_decoding_manager.py index b0e460500e..74a4a30e49 100644 --- a/tests/runner/test_structured_decoding_manager.py +++ b/tests/runner/test_structured_decoding_manager.py @@ -50,7 +50,6 @@ def setup_method(self): cache_config = CacheConfig( block_size=16, gpu_memory_utilization=0.9, - swap_space=4, cache_dtype="auto", ) scheduler_config = SchedulerConfig(max_num_seqs=16, diff --git a/tests/runner/test_tpu_runner.py b/tests/runner/test_tpu_runner.py index 4fa1956836..5bce0f0020 100644 --- a/tests/runner/test_tpu_runner.py +++ b/tests/runner/test_tpu_runner.py @@ -45,7 +45,6 @@ def setup_method(self): cache_config = CacheConfig( block_size=16, gpu_memory_utilization=0.9, - swap_space=4, cache_dtype="auto", ) scheduler_config = SchedulerConfig(max_num_seqs=16, @@ -202,7 +201,6 @@ def setup_method(self): cache_config = CacheConfig( block_size=16, gpu_memory_utilization=0.9, - swap_space=4, cache_dtype="auto", ) scheduler_config = SchedulerConfig(max_num_seqs=16,