Skip to content

Commit 0b82b35

Browse files
committed
fix
Signed-off-by: Superjomn <[email protected]>
1 parent 707ec59 commit 0b82b35

File tree

1 file changed

+6
-1
lines changed

1 file changed

+6
-1
lines changed

tensorrt_llm/llmapi/llm_args.py

Lines changed: 6 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -2014,8 +2014,13 @@ def validate_cuda_graph_config(self) -> 'TorchLlmArgs':
20142014

20152015
@model_validator(mode='after')
20162016
def sync_quant_config_with_kv_cache_config_dtype(self) -> 'TorchLlmArgs':
2017+
if self.kv_cache_config is None:
2018+
return self
2019+
20172020
assert self.quant_config is not None
2018-
if self.kv_cache_config.dtype == 'fp8':
2021+
if self.kv_cache_config.dtype == "auto":
2022+
return self
2023+
elif self.kv_cache_config.dtype == 'fp8':
20192024
self.quant_config.kv_cache_quant_algo = QuantAlgo.FP8
20202025
else:
20212026
logger.warning(

0 commit comments

Comments
 (0)