Update modeling_Llamoe.py
Browse files
- modeling_Llamoe.py +1 -1
modeling_Llamoe.py
CHANGED
@@ -599,7 +599,7 @@ class LlamoeSdpaAttention(LlamoeAttention):
 query_states,
 key_states,
 value_states,
-attn_mask=
+attn_mask=causal_mask,
 dropout_p=self.attention_dropout if self.training else 0.0,
 )
 