diff --git a/vllm/model_executor/layers/linear.py b/vllm/model_executor/layers/linear.py index 3cc25783..1dda5d37 100644 --- a/vllm/model_executor/layers/linear.py +++ b/vllm/model_executor/layers/linear.py @@ -387,7 +387,7 @@ class MergedColumnParallelLinear(ColumnParallelLinear): if loaded_shard_id is None: # Loaded weight is already fused on disk (qkv/mlp). if output_dim is None: - if needs_scalar_to_array is not None: + if needs_scalar_to_array: param_data, loaded_weight = adjust_scalar_to_fused_array( param_data, loaded_weight, 0) @@ -549,7 +549,7 @@ class QKVParallelLinear(ColumnParallelLinear): if loaded_shard_id is None: # Loaded weight is already fused on disk (qkv/mlp). if output_dim is None: - if needs_scalar_to_array is not None: + if needs_scalar_to_array: param_data, loaded_weight = adjust_scalar_to_fused_array( param_data, loaded_weight, 0)