klemenk committed on
Commit
d9b6bca
·
verified ·
1 Parent(s): dd150a3

Update modeling_auristream.py

Browse files
Files changed (1) hide show
  1. modeling_auristream.py +1 -1
modeling_auristream.py CHANGED
@@ -511,7 +511,7 @@ class CausalSelfAttention(nn.Module):
511
  # output projection
512
  self.c_proj = nn.Linear(self.n_embd, self.n_embd, bias=False)
513
 
514
- rope_theta = 500000
515
  if hasattr(config, 'rope_theta') and config.rope_theta is not None:
516
  rope_theta = config.rope_theta
517
 
 
511
  # output projection
512
  self.c_proj = nn.Linear(self.n_embd, self.n_embd, bias=False)
513
 
514
+ rope_theta = 10000
515
  if hasattr(config, 'rope_theta') and config.rope_theta is not None:
516
  rope_theta = config.rope_theta
517