nomic-ai
/

nomic-bert-2048

Model card Files and versions Community

zpn committed 4 days ago

Commit

359596a

·

1 Parent(s): f69b8d1

fix: local

Files changed (1) hide show

modeling_hf_nomic_bert.py +0 -8

modeling_hf_nomic_bert.py CHANGED Viewed

@@ -1244,18 +1244,10 @@ class NomicMoELayer(nn.Module):
     def forward(self, x: torch.Tensor, attention_mask: Optional[torch.Tensor] = None):
         batch_size, seq_len, hidden_dim = x.shape
-        if attention_mask is not None:
-            valid_indices = attention_mask.bool().view(-1)
-            x_valid = x.view(-1, hidden_dim)[valid_indices]
         weights, top_weights, top_experts = self.router(x)
         out = self.experts(x, weights, top_weights, top_experts)
-        if attention_mask is not None:
-            full_out = torch.zeros(batch_size * seq_len, hidden_dim, dtype=out.dtype, device=out.device)
-            full_out[valid_indices] = out
-            out = full_out.view(batch_size, seq_len, hidden_dim)
         return out

     def forward(self, x: torch.Tensor, attention_mask: Optional[torch.Tensor] = None):
         """Route ``x`` through ``self.router`` and apply ``self.experts``.

         Args:
             x: Input whose ``shape`` must unpack into exactly three
                 dimensions; any other rank raises ``ValueError``.
             attention_mask: Accepted for interface compatibility; this
                 method does not read it.

         Returns:
             Whatever ``self.experts`` returns for ``x`` and the three
             routing values produced by ``self.router``.
         """
         # The dimensions are not used below; the unpack is kept because it
         # rejects inputs that are not rank 3 before any routing happens.
         _batch, _tokens, _width = x.shape
         routing_weights, selected_weights, selected_experts = self.router(x)
         return self.experts(x, routing_weights, selected_weights, selected_experts)