Skip to content

Commit

Permalink
[Quant] Arctic SupportsQuant (vllm-project#13366)
Browse files Browse the repository at this point in the history
  • Loading branch information
kylesayrs authored Feb 18, 2025
1 parent 88787bc commit 00294e1
Showing 1 changed file with 3 additions and 2 deletions.
5 changes: 3 additions & 2 deletions vllm/model_executor/models/arctic.py
Original file line number Diff line number Diff line change
Expand Up @@ -33,7 +33,7 @@
from vllm.sequence import IntermediateTensors
from vllm.transformers_utils.configs.arctic import ArcticConfig

-from .interfaces import SupportsPP
+from .interfaces import SupportsPP, SupportsQuant
from .utils import (extract_layer_index, is_pp_missing_parameter,
make_empty_intermediate_tensors_factory, make_layers,
maybe_prefix)
Expand Down Expand Up @@ -423,7 +423,8 @@ def forward(
return hidden_states


-class ArcticForCausalLM(nn.Module, SupportsPP):
+class ArcticForCausalLM(nn.Module, SupportsPP, SupportsQuant):
+    packed_modules_mapping = {"qkv_proj": ["q_proj", "k_proj", "v_proj"]}

def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""):
super().__init__()
Expand Down

0 comments on commit 00294e1

Please sign in to comment.