We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 784c231 commit 213b644Copy full SHA for 213b644
vllm/model_executor/layers/quantization/utils/fp8_utils.py
@@ -360,7 +360,7 @@ def _run_aiter(
360
weight,
361
input_scale,
362
weight_scale,
363
- self.weight_group_shape,
+ list(self.weight_group_shape),
364
input_2d.dtype,
365
)
366
@@ -377,7 +377,7 @@ def _run_triton(
377
378
379
380
381
382
383
0 commit comments