File tree Expand file tree Collapse file tree 1 file changed: +3 -2 lines changed
vllm/model_executor/models Expand file tree Collapse file tree 1 file changed: +3 -2 lines changed
Original file line number Diff line number Diff line change
3333from vllm .sequence import IntermediateTensors
3434from vllm .transformers_utils .configs .arctic import ArcticConfig
3535
36- from .interfaces import SupportsPP
36+ from .interfaces import SupportsPP , SupportsQuant
3737from .utils import (extract_layer_index , is_pp_missing_parameter ,
3838 make_empty_intermediate_tensors_factory , make_layers ,
3939 maybe_prefix )
@@ -423,7 +423,8 @@ def forward(
423423 return hidden_states
424424
425425
426- class ArcticForCausalLM (nn .Module , SupportsPP ):
426+ class ArcticForCausalLM (nn .Module , SupportsPP , SupportsQuant ):
427+ packed_modules_mapping = {"qkv_proj" : ["q_proj" , "k_proj" , "v_proj" ]}
427428
428429 def __init__ (self , * , vllm_config : VllmConfig , prefix : str = "" ):
429430 super ().__init__ ()
You can’t perform that action at this time.
0 commit comments