We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 147ad69, commit cd72148. Copy full SHA for cd72148
tests/integration/defs/accuracy/test_llm_api_pytorch.py
@@ -1485,9 +1485,10 @@ class TestNemotronNas(LlmapiAccuracyTestHarness):
1485
MODEL_NAME = "nemotron-nas/Llama-3_1-Nemotron-51B-Instruct"
1486
MODEL_PATH = f"{llm_models_root()}/nemotron-nas/Llama-3_1-Nemotron-51B-Instruct"
1487
1488
+ @pytest.mark.skip_less_device_memory(80000)
1489
@pytest.mark.skip_less_device(8)
1490
def test_auto_dtype_tp8(self):
- kv_cache_config = KvCacheConfig(free_gpu_memory_fraction=0.9)
1491
+ kv_cache_config = KvCacheConfig(free_gpu_memory_fraction=0.8)
1492
pytorch_config = dict()
1493
1494
with LLM(self.MODEL_PATH,
0 commit comments