1 parent bd52d61 commit 8bc3475
src/transformers/models/openai_moe/modeling_openai_moe.py
@@ -242,7 +242,7 @@ def eager_attention_forward(
     scores = unnormalized_scores / normalizer

     attn_weights = nn.functional.dropout(scores, p=dropout, training=module.training)
-    attn_output = torch.matmul(attn_weights[..., :-1], value_states) # ignore the sinks
+    attn_output = torch.matmul(attn_weights, value_states) # ignore the sinks
     attn_output = attn_output.transpose(1, 2).contiguous()
     return attn_output, attn_weights
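A likely reading of the fix: given scores = unnormalized_scores / normalizer just above, the sink column contributes only to the softmax normalizer and is already absent from scores, so attn_weights has exactly one column per real key. The old slice attn_weights[..., :-1] was therefore dropping the last real key position, not the sink (note the "# ignore the sinks" comment survives on the new line even though the slice is gone). Below is a minimal, self-contained sketch of that normalization scheme under those assumptions; sink_logit and the function name are illustrative, not the actual openai_moe attributes.

import torch

def sink_attention_weights(attn_logits, sink_logit):
    # attn_logits: (batch, heads, q_len, kv_len) raw query-key scores
    # sink_logit:  (heads,) learned per-head sink logit (hypothetical name)
    sinks = sink_logit.view(1, -1, 1, 1).expand(*attn_logits.shape[:-1], 1)
    combined = torch.cat([attn_logits, sinks], dim=-1)
    combined = combined - combined.amax(dim=-1, keepdim=True)    # numerical stability
    unnormalized_scores = torch.exp(combined[..., :-1])          # real keys only
    normalizer = torch.exp(combined).sum(dim=-1, keepdim=True)   # includes the sink
    # Each row sums to less than 1; the missing mass is absorbed by the
    # sink, which has no value vector, so no column needs slicing later.
    return unnormalized_scores / normalizer

With attn_weights shaped (batch, heads, q_len, kv_len), torch.matmul(attn_weights, value_states) already lines up against value_states of shape (batch, heads, kv_len, head_dim), which is why the fixed line multiplies without slicing.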