[ Misc ] Remove separate bias add (#6353)

2025-12-22 20:35:32 +08:00 · 2024-07-12 01:06:09 -04:00 · 2024-07-12 01:06:09 -04:00 · 6047187cd8
commit 6047187cd8
parent b6c16cf8ff
1 changed file with 3 additions and 15 deletions
--- a/vllm/model_executor/layers/linear.py
+++ b/vllm/model_executor/layers/linear.py
@@ -99,15 +99,7 @@ class LinearMethodBase(QuantizeMethodBase):
 class UnquantizedLinearMethod(LinearMethodBase):
-    """Linear method without quantization.
+    """Linear method without quantization."""
-    Args:
-        separate_bias_add: If true, add bias separately after matrix
-                           multiplication.
-    """
-    def __init__(self, separate_bias_add: bool = False):
-        self.separate_bias_add = separate_bias_add
    def create_weights(self, layer: torch.nn.Module,
                       input_size_per_partition: int,
@@ -126,12 +118,8 @@ class UnquantizedLinearMethod(LinearMethodBase):
              layer: torch.nn.Module,
              x: torch.Tensor,
              bias: Optional[torch.Tensor] = None) -> torch.Tensor:
-        weight = layer.weight
+
-        if self.separate_bias_add:
+        return F.linear(x, layer.weight, bias)
-            if bias is not None:
-                return F.linear(x, weight) + bias
-            return F.linear(x, weight)
-        return F.linear(x, weight, bias)
 class LinearBase(torch.nn.Module):