[Bugfix] Use correct key "ignore" for config.json non-quantized layers (#25706)

leejnau · yewentao256 · commit 9555929e1383 · 2025-10-03T13:35:56.000-07:00
Signed-off-by: Lee Nau <lnau@nvidia.com>
Signed-off-by: yewentao256 <zhyanwentao@126.com>
diff --git a/vllm/model_executor/layers/quantization/modelopt.py b/vllm/model_executor/layers/quantization/modelopt.py
@@ -138,13 +138,15 @@ def from_config(cls, config: dict[str, Any]) -> "ModelOptFp8Config":
             if not quant_method:
                 raise ValueError("Missing 'quant_algo' in quantization config")
             kv_cache_quant_method = quant_config.get("kv_cache_quant_algo")
+            # "exclude_modules" is the key in the legacy hf_quant_config.json
             exclude_modules = quant_config.get("exclude_modules")
         else:
             # Compressed-tensors style format:
             # {"quant_algo": "...", "quant_method": "modelopt"}
             quant_method = config.get("quant_algo", "")
             kv_cache_quant_method = config.get("kv_cache_quant_algo")
-            exclude_modules = config.get("exclude_modules")
+            # "ignore" is the key in config.json
+            exclude_modules = config.get("ignore")
 
         if quant_method not in QUANT_ALGOS:
             raise ValueError(
@@ -723,6 +725,7 @@ def from_config(cls, config: dict[str, Any]) -> "ModelOptNvFp4Config":
                     raise ValueError(f"group_size must be an integer, got "
                                      f"{type(group_size_raw)}") from None
 
+            # "exclude_modules" is the key in the legacy hf_quant_config.json
             exclude_modules = quant_config.get("exclude_modules", [])
             if not isinstance(exclude_modules, list):
                 raise ValueError(f"exclude_modules must be a list, got "
@@ -756,7 +759,8 @@ def from_config(cls, config: dict[str, Any]) -> "ModelOptNvFp4Config":
                     raise ValueError(f"group_size must be an integer, got "
                                      f"{type(group_size_raw)}") from None
 
-            exclude_modules = config.get("exclude_modules", [])
+            # "ignore" is the key in config.json
+            exclude_modules = config.get("ignore", [])
             if not isinstance(exclude_modules, list):
                 raise ValueError(f"exclude_modules must be a list, got "
                                  f"{type(exclude_modules)}")