
Commit e1ba235

[BugFix] Fix failing test quantization/test_compressed_tensors.py::test_compressed_tensors_fp8_block_enabled (#26436)
Signed-off-by: morrison-turnansky <mturnans@redhat.com>
1 parent: b82f430

File tree

1 file changed: +1 -1 lines changed


vllm/config/vllm.py

Lines changed: 1 addition & 1 deletion
@@ -597,7 +597,7 @@ def has_blocked_weights():
         # https://github.com/vllm-project/vllm/issues/25094
         if has_blocked_weights():
             custom_ops = self.compilation_config.custom_ops
-            if "none" not in custom_ops and "-quant_fp8" not in custom_ops:
+            if "-quant_fp8" not in custom_ops:
                 custom_ops.append("+quant_fp8")
 
     def update_sizes_for_sequence_parallelism(self, possible_sizes: list) -> list:
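To illustrate the behavioral change: before this fix, the presence of `"none"` in `custom_ops` skipped the append entirely, so `"+quant_fp8"` was never forced on for blocked weights; after the fix, only an explicit `"-quant_fp8"` opt-out suppresses it. A minimal sketch, using a hypothetical standalone helper (in vLLM the logic lives on the config object in vllm/config/vllm.py):

```python
def enable_quant_fp8(custom_ops: list[str]) -> list[str]:
    # Corrected condition from the commit: append "+quant_fp8" unless the
    # op was explicitly disabled with "-quant_fp8". Note that "none" no
    # longer blocks the append.
    if "-quant_fp8" not in custom_ops:
        custom_ops.append("+quant_fp8")
    return custom_ops


print(enable_quant_fp8(["none"]))        # ["none", "+quant_fp8"]
print(enable_quant_fp8(["-quant_fp8"]))  # ["-quant_fp8"]
```

With the old condition, the first call would have returned `["none"]` unchanged, which is what broke `test_compressed_tensors_fp8_block_enabled`.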

0 commit comments
