Skip to content

Commit fca0d37

Browse files
authored
[None][fix] update nemotron nas tests free_gpu_memory_fraction=0.8 (#6552)
Signed-off-by: Xin He (SW-GPU) <[email protected]>
1 parent 137413f commit fca0d37

File tree

1 file changed: 2 additions (+2) and 1 deletion (-1).

tests/integration/defs/accuracy/test_llm_api_pytorch.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1495,9 +1495,10 @@ class TestNemotronNas(LlmapiAccuracyTestHarness):
1495 | 1495 |      MODEL_NAME = "nemotron-nas/Llama-3_1-Nemotron-51B-Instruct"
1496 | 1496 |      MODEL_PATH = f"{llm_models_root()}/nemotron-nas/Llama-3_1-Nemotron-51B-Instruct"
1497 | 1497 |
     | 1498 | +    @pytest.mark.skip_less_device_memory(80000)
1498 | 1499 |      @pytest.mark.skip_less_device(8)
1499 | 1500 |      def test_auto_dtype_tp8(self):
1500 |      | -        kv_cache_config = KvCacheConfig(free_gpu_memory_fraction=0.9)
     | 1501 | +        kv_cache_config = KvCacheConfig(free_gpu_memory_fraction=0.8)
1501 | 1502 |          pytorch_config = dict()
1502 | 1503 |
1503 | 1504 |          with LLM(self.MODEL_PATH,

0 commit comments

Comments
 (0)