We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 918a847 commit 79a23ff Copy full SHA for 79a23ff
vllm/model_executor/layers/quantization/kernels/mixed_precision/machete.py
@@ -32,12 +32,6 @@ def can_implement(cls,
32
return False, "Act reordering currently not supported by Machete, "\
33
"when the input features are partitioned across "\
34
"devices"
35
- if c.zero_points:
36
- return False, "Zero points currently not supported by "\
37
- " Compressed Tensors + Machete. (Kernel supports it"\
38
- " but CompressedTensorsWNA16 does not so support has"\
39
- " not been added to MacheteWNA16Kernel yet"
40
-
41
if c.zero_points:
42
return False, "Zero points currently not supported by Machete"
43
0 commit comments