katuni4ka
/

tiny-random-baichuan2-13b

Text Generation

text-generation-inference

Model card · Files and versions

katuni4ka committed on Apr 24, 2024

Commit

7ad5482

·

verified ·

1 Parent(s): 19f906c

Upload modeling_baichuan.py

Files changed (1) hide show

modeling_baichuan.py +3 -3

modeling_baichuan.py CHANGED Viewed

@@ -405,10 +405,10 @@ class BaichuanModel(BaichuanPreTrainedModel):
         if attention_mask is not None:
             if len(attention_mask.shape) == 2:
-                expanded_mask = attention_mask.to(alibi_mask.dtype)
                 expanded_mask = torch.tril(
-                    torch.gt(expanded_mask[:, :, None] * expanded_mask[:, None, :], 0)
-                ) * torch.eq(expanded_mask[:, :, None] - expanded_mask[:, None, :], 0)
             else:
                 expanded_mask = attention_mask
             bsz = inputs_embeds.size(0)

         if attention_mask is not None:
             if len(attention_mask.shape) == 2:
+                expanded_mask = attention_mask.to(torch.float32)
                 expanded_mask = torch.tril(
+                    torch.gt(expanded_mask[:, :, None] * expanded_mask[:, None, :], 0).to(torch.float32)
+                ) * torch.eq(expanded_mask[:, :, None] - expanded_mask[:, None, :], 0).to(torch.float32)
             else:
                 expanded_mask = attention_mask
             bsz = inputs_embeds.size(0)