klemenk committed on
Commit
6bb6180
·
verified ·
1 Parent(s): d533175

Update modeling_auristream.py

Browse files
Files changed (1) hide show
  1. modeling_auristream.py +2 -2
modeling_auristream.py CHANGED
@@ -425,8 +425,8 @@ class CausalSelfAttention(nn.Module):
425
  self.c_attn = nn.Linear(self.n_embd, 3 * self.n_embd, bias=False)
426
  # output projection
427
  self.c_proj = nn.Linear(self.n_embd, self.n_embd, bias=False)
428
-
429
- rope_theta = 500000
430
  if hasattr(config, 'rope_theta') and config.rope_theta is not None:
431
  rope_theta = config.rope_theta
432
 
 
425
  self.c_attn = nn.Linear(self.n_embd, 3 * self.n_embd, bias=False)
426
  # output projection
427
  self.c_proj = nn.Linear(self.n_embd, self.n_embd, bias=False)
428
+
429
+ rope_theta = 10000
430
  if hasattr(config, 'rope_theta') and config.rope_theta is not None:
431
  rope_theta = config.rope_theta
432