We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 914eaec, commit 49543bd. Copy full SHA for 49543bd
vllm/model_executor/layers/quantization/modelopt.py
@@ -1303,13 +1303,13 @@ def create_weights(
1303
1304
w13_input_scale = PerTensorScaleParameter(
1305
data=torch.empty(global_num_experts, 2, dtype=torch.float32),
1306
- weight_loader=weight_loader
+ weight_loader=weight_loader,
1307
)
1308
layer.register_parameter("w13_input_scale", w13_input_scale)
1309
1310
w2_input_scale = PerTensorScaleParameter(
1311
data=torch.empty(global_num_experts, dtype=torch.float32),
1312
1313
1314
1315
layer.register_parameter("w2_input_scale", w2_input_scale)
0 commit comments