[Bugfix] Fix needs_scalar_to_array logic check (#6238)

Co-authored-by: Robert Shaw <114415538+robertgshaw2-neuralmagic@users.noreply.github.com>
vllm-project · Jul 9, 2024 · d3a2451 · d3a2451
1 parent 673dd4c
commit d3a2451
Showing 1 changed file with 2 additions and 2 deletions.
diff --git a/vllm/model_executor/layers/linear.py b/vllm/model_executor/layers/linear.py
@@ -387,7 +387,7 @@ def weight_loader(self,
         if loaded_shard_id is None:
             # Loaded weight is already fused on disk (qkv/mlp).
             if output_dim is None:
-                if needs_scalar_to_array is not None:
+                if needs_scalar_to_array:
                     param_data, loaded_weight = adjust_scalar_to_fused_array(
                         param_data, loaded_weight, 0)
 
@@ -549,7 +549,7 @@ def weight_loader(self,
         if loaded_shard_id is None:
             # Loaded weight is already fused on disk (qkv/mlp).
             if output_dim is None:
-                if needs_scalar_to_array is not None:
+                if needs_scalar_to_array:
                     param_data, loaded_weight = adjust_scalar_to_fused_array(
                         param_data, loaded_weight, 0)