Update modeling_mixformer_sequential.py
Removes the print statement about `attention_mask` to prevent excessive information from being logged during training.
modeling_mixformer_sequential.py
CHANGED
@@ -756,9 +756,6 @@ class MixFormerSequentialForCausalLM(MixFormerSequentialPreTrainedModel):
         labels: Optional[torch.LongTensor] = None,
         **kwargs,
     ) -> CausalLMOutputWithPast:
-        if attention_mask is not None and self.training:
-            print("`attention_mask` is not supported during training. Using it might lead to unexpected results.")
-
         if past_key_values is None and attention_mask is None:
             lm_logits = self.layers(input_ids)
         else:
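For context, a lighter-weight alternative to deleting the message entirely would be Python's `warnings` module, whose default filter reports a given warning only once per call site rather than on every training step. A minimal, self-contained sketch (the `warn_once_demo` helper is hypothetical, not part of the model code):

import warnings

def warn_once_demo():
    # Under Python's default warning filter, a given warning is reported
    # only once per call site, so repeated training steps do not flood
    # the log the way an unconditional print does.
    for step in range(3):
        warnings.warn(
            "`attention_mask` is not supported during training. "
            "Using it might lead to unexpected results."
        )

warn_once_demo()  # the warning is printed a single time, not three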