We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent b82f430, commit e1ba235 (Copy full SHA for e1ba235)
vllm/config/vllm.py
@@ -597,7 +597,7 @@ def has_blocked_weights():
597
# https://github.com/vllm-project/vllm/issues/25094
598
if has_blocked_weights():
599
custom_ops = self.compilation_config.custom_ops
600
- if "none" not in custom_ops and "-quant_fp8" not in custom_ops:
+ if "-quant_fp8" not in custom_ops:
601
custom_ops.append("+quant_fp8")
602
603
def update_sizes_for_sequence_parallelism(self, possible_sizes: list) -> list:
0 commit comments