From 46720235d69a557e2c3c2ee17b3ad79e5c5e6663 Mon Sep 17 00:00:00 2001 From: Kyle Sayers Date: Sun, 16 Feb 2025 21:02:22 -0500 Subject: [PATCH] add arctic SupportsQuant Signed-off-by: Kyle Sayers --- vllm/model_executor/models/arctic.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/vllm/model_executor/models/arctic.py b/vllm/model_executor/models/arctic.py index d015682aab47..27df448e63f7 100644 --- a/vllm/model_executor/models/arctic.py +++ b/vllm/model_executor/models/arctic.py @@ -33,7 +33,7 @@ from vllm.sequence import IntermediateTensors from vllm.transformers_utils.configs.arctic import ArcticConfig -from .interfaces import SupportsPP +from .interfaces import SupportsPP, SupportsQuant from .utils import (extract_layer_index, is_pp_missing_parameter, make_empty_intermediate_tensors_factory, make_layers, maybe_prefix) @@ -423,7 +423,8 @@ def forward( return hidden_states -class ArcticForCausalLM(nn.Module, SupportsPP): +class ArcticForCausalLM(nn.Module, SupportsPP, SupportsQuant): + packed_modules_mapping = {"qkv_proj": ["q_proj", "k_proj", "v_proj"]} def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""): super().__init__()