Skip to content

Commit d5ca211

Browse files
authored
[Quant] BaiChuan SupportsQuant (#13710)
1 parent 2c5e637 commit d5ca211

File tree

1 file changed

+3
-2
lines changed

1 file changed

+3
-2
lines changed

vllm/model_executor/models/baichuan.py

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -46,7 +46,7 @@
46 46
from vllm.model_executor.sampling_metadata import SamplingMetadata
47 47
from vllm.sequence import IntermediateTensors
48 48

49-
from .interfaces import SupportsLoRA, SupportsPP
49+
from .interfaces import SupportsLoRA, SupportsPP, SupportsQuant
50 50
from .utils import (is_pp_missing_parameter,
51 51
make_empty_intermediate_tensors_factory, make_layers)
52 52

@@ -334,7 +334,8 @@ def forward(
334 334
return hidden_states
335 335

336 336

337-
class BaiChuanBaseForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
337+
class BaiChuanBaseForCausalLM(nn.Module, SupportsLoRA, SupportsPP,
338+
SupportsQuant):
338 339
packed_modules_mapping = {
339 340
"W_pack": ["W_pack"],
340 341
"gate_up_proj": [

0 commit comments

Comments
 (0)