Skip to content

Commit dcf2a59

Browse files
authored
Allow torchao quantization in SiglipMLP (#15575)
1 parent 54aa619 commit dcf2a59

File tree

1 file changed

+4 -2 lines changed

1 file changed

+4 -2 lines changed

vllm/model_executor/models/siglip.py

Lines changed: 4 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -208,8 +208,10 @@ def __init__(
 
         self.config = config
         self.activation_fn = get_act_fn(config.hidden_act)
-        # Special handling for BNB quantization
-        if quant_config and quant_config.get_name() == "bitsandbytes":
+        # Special handling for BNB and torchao quantization
+        if quant_config and quant_config.get_name() in [
+                "bitsandbytes", "torchao"
+        ]:
             quantizable = True
         else:
             # For other quantization, we require the hidden size to be a

0 commit comments

Comments
 (0)