diff --git a/vllm/model_executor/layers/linear.py b/vllm/model_executor/layers/linear.py index 60f6fc83..40e681df 100644 --- a/vllm/model_executor/layers/linear.py +++ b/vllm/model_executor/layers/linear.py @@ -73,7 +73,7 @@ class UnquantizedLinearMethod(LinearMethodBase): bias: Optional[torch.Tensor] = None) -> torch.Tensor: weight = weights["weight"] if self.separate_bias_add: - if bias: + if bias is not None: return F.linear(x, weight) + bias return F.linear(x, weight) return F.linear(x, weight, bias)