diff --git a/vllm_gaudi/platform.py b/vllm_gaudi/platform.py index 4bd084519c..bb19666a4b 100644 --- a/vllm_gaudi/platform.py +++ b/vllm_gaudi/platform.py @@ -154,7 +154,8 @@ def set_torch_compile(cls) -> None: os.environ['PT_HPU_ENABLE_LAZY_COLLECTIVES'] = 'true' @classmethod - def is_kv_cache_dtype_supported(cls, kv_cache_dtype: str) -> bool: + def is_kv_cache_dtype_supported(cls, kv_cache_dtype: str, + model_config: ModelConfig) -> bool: return kv_cache_dtype == "fp8_inc" @classmethod