Skip to content

Commit 00294e1

Browse files
authored
[Quant] Arctic SupportsQuant (#13366)
1 parent 88787bc commit 00294e1

File tree

1 file changed

+3
-2
lines changed

1 file changed

+3
-2
lines changed

vllm/model_executor/models/arctic.py

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -33,7 +33,7 @@
33 33
from vllm.sequence import IntermediateTensors
34 34
from vllm.transformers_utils.configs.arctic import ArcticConfig
35 35

36-
from .interfaces import SupportsPP
36+
from .interfaces import SupportsPP, SupportsQuant
37 37
from .utils import (extract_layer_index, is_pp_missing_parameter,
38 38
make_empty_intermediate_tensors_factory, make_layers,
39 39
maybe_prefix)
@@ -423,7 +423,8 @@ def forward(
423 423
return hidden_states
424 424

425 425

426-
class ArcticForCausalLM(nn.Module, SupportsPP):
426+
class ArcticForCausalLM(nn.Module, SupportsPP, SupportsQuant):
427+
packed_modules_mapping = {"qkv_proj": ["q_proj", "k_proj", "v_proj"]}
427 428

428 429
def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""):
429 430
super().__init__()

0 commit comments

Comments
 (0)