Skip to content

Commit cd72148

Browse files
committed
update nemotron nas tests
Signed-off-by: Xin He (SW-GPU) <[email protected]>
1 parent 147ad69 commit cd72148

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

tests/integration/defs/accuracy/test_llm_api_pytorch.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1485,9 +1485,10 @@ class TestNemotronNas(LlmapiAccuracyTestHarness):
1485 1485       MODEL_NAME = "nemotron-nas/Llama-3_1-Nemotron-51B-Instruct"
1486 1486       MODEL_PATH = f"{llm_models_root()}/nemotron-nas/Llama-3_1-Nemotron-51B-Instruct"
1487 1487
     1488 +     @pytest.mark.skip_less_device_memory(80000)
1488 1489       @pytest.mark.skip_less_device(8)
1489 1490       def test_auto_dtype_tp8(self):
1490      -         kv_cache_config = KvCacheConfig(free_gpu_memory_fraction=0.9)
     1491 +         kv_cache_config = KvCacheConfig(free_gpu_memory_fraction=0.8)
1491 1492           pytorch_config = dict()
1492 1493
1493 1494           with LLM(self.MODEL_PATH,

0 commit comments

Comments
 (0)