zen-E committed on
Commit
e3d1d72
·
verified ·
1 Parent(s): 8341ba0

Update modeling_llama_nsa.py

Browse files
Files changed (1) hide show
  1. modeling_llama_nsa.py +1 -1
modeling_llama_nsa.py CHANGED
@@ -307,7 +307,7 @@ class LlamaNSAAttention(nn.Module):
307
  window_size=self.config.window_size,
308
  head_first=False,
309
  )
310
- #attn_weights = None
311
 
312
  sa_loss = 0 #torch.nn.SmoothL1Loss()(attn_output_mha, attn_output.detach()) + torch.nn.SmoothL1Loss()(attn_output_mha.detach(), attn_output)
313
 
 
307
  window_size=self.config.window_size,
308
  head_first=False,
309
  )
310
+ attn_weights = None
311
 
312
  sa_loss = 0 #torch.nn.SmoothL1Loss()(attn_output_mha, attn_output.detach()) + torch.nn.SmoothL1Loss()(attn_output_mha.detach(), attn_output)
313