[Pixtral-Large] Pixtral actually has no bias in vision-lang adapter (#…
patrickvonplaten authored Nov 19, 2024
1 parent f028dff commit 11fd7ea
Showing 1 changed file with 3 additions and 2 deletions.
5 changes: 3 additions & 2 deletions vllm/model_executor/models/pixtral.py
@@ -331,6 +331,7 @@ class VisionEncoderArgs:
     num_attention_heads: int
     rope_theta: float  # for rope-2D
     image_token_id: int
+    adapter_bias: bool = True


 def _reshape_for_broadcast(freqs_cis: torch.Tensor,
@@ -595,10 +596,10 @@ def __init__(self, args: VisionEncoderArgs, dim: int):
         self.w_in = nn.Linear(
             args.hidden_size,
             dim,
-            bias=True,
+            bias=args.adapter_bias,
         )
         self.gelu = nn.GELU()
-        self.w_out = nn.Linear(dim, dim, bias=True)
+        self.w_out = nn.Linear(dim, dim, bias=args.adapter_bias)

     def forward(self, x: torch.Tensor) -> torch.Tensor:
         return self.w_out(self.gelu(self.w_in(x)))
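As the commit title notes, Pixtral-Large's vision-language adapter has no bias terms, so the hardcoded bias=True is replaced with a configurable adapter_bias flag that defaults to True for backward compatibility. Below is a minimal, self-contained sketch of the adapter after this change, assuming the class in the second hunk is vLLM's vision-language adapter module (named VisionLanguageAdapter here); the reduced field set of VisionEncoderArgs and the dimensions (hidden_size=1024, dim=4096) are illustrative assumptions, not values from the diff:

from dataclasses import dataclass

import torch
import torch.nn as nn


@dataclass
class VisionEncoderArgs:
    # Only the fields the adapter touches; the real dataclass in pixtral.py
    # also carries num_attention_heads, rope_theta, image_token_id, etc.
    hidden_size: int
    adapter_bias: bool = True  # False for checkpoints whose adapter has no bias


class VisionLanguageAdapter(nn.Module):
    # Two-layer GELU MLP projecting vision features into the language model's
    # hidden space; both linears now respect args.adapter_bias instead of
    # hardcoding bias=True.
    def __init__(self, args: VisionEncoderArgs, dim: int):
        super().__init__()
        self.w_in = nn.Linear(args.hidden_size, dim, bias=args.adapter_bias)
        self.gelu = nn.GELU()
        self.w_out = nn.Linear(dim, dim, bias=args.adapter_bias)

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        return self.w_out(self.gelu(self.w_in(x)))


# Hypothetical dimensions, for illustration only:
args = VisionEncoderArgs(hidden_size=1024, adapter_bias=False)
adapter = VisionLanguageAdapter(args, dim=4096)
assert adapter.w_in.bias is None and adapter.w_out.bias is None
print(adapter(torch.randn(2, 16, 1024)).shape)  # torch.Size([2, 16, 4096])

With adapter_bias=False, both nn.Linear layers are created without bias parameters, so a checkpoint that ships no adapter bias tensors matches the module's parameter set exactly.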
