We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 137413f, commit fca0d37 (copy full SHA for fca0d37)
tests/integration/defs/accuracy/test_llm_api_pytorch.py
@@ -1495,9 +1495,10 @@ class TestNemotronNas(LlmapiAccuracyTestHarness):
1495
MODEL_NAME = "nemotron-nas/Llama-3_1-Nemotron-51B-Instruct"
1496
MODEL_PATH = f"{llm_models_root()}/nemotron-nas/Llama-3_1-Nemotron-51B-Instruct"
1497
1498
+ @pytest.mark.skip_less_device_memory(80000)
1499
@pytest.mark.skip_less_device(8)
1500
def test_auto_dtype_tp8(self):
- kv_cache_config = KvCacheConfig(free_gpu_memory_fraction=0.9)
1501
+ kv_cache_config = KvCacheConfig(free_gpu_memory_fraction=0.8)
1502
pytorch_config = dict()
1503
1504
with LLM(self.MODEL_PATH,
0 commit comments