diff --git a/vllm/model_executor/layers/quantization/modelopt.py b/vllm/model_executor/layers/quantization/modelopt.py index 0862efbea294..b2ed35cf92fd 100644 --- a/vllm/model_executor/layers/quantization/modelopt.py +++ b/vllm/model_executor/layers/quantization/modelopt.py @@ -245,7 +245,7 @@ def _extract_modelopt_quant_algo( """ if hf_quant_cfg is None: return None - if hf_quant_cfg.get("quant_method", "").lower() != "modelopt": + if not hf_quant_cfg.get("quant_method", "").lower().startswith("modelopt"): return None if "quantization" in hf_quant_cfg: quant_config = hf_quant_cfg["quantization"]