Update modeling_auristream.py
Browse files
- modeling_auristream.py +2 -2
modeling_auristream.py
CHANGED
|
@@ -425,8 +425,8 @@ class CausalSelfAttention(nn.Module):
|
|
| 425 |
self.c_attn = nn.Linear(self.n_embd, 3 * self.n_embd, bias=False)
|
| 426 |
# output projection
|
| 427 |
self.c_proj = nn.Linear(self.n_embd, self.n_embd, bias=False)
|
| 428 |
-
|
| 429 |
-
rope_theta =
|
| 430 |
if hasattr(config, 'rope_theta') and config.rope_theta is not None:
|
| 431 |
rope_theta = config.rope_theta
|
| 432 |
|
|
|
|
| 425 |
self.c_attn = nn.Linear(self.n_embd, 3 * self.n_embd, bias=False)
|
| 426 |
# output projection
|
| 427 |
self.c_proj = nn.Linear(self.n_embd, self.n_embd, bias=False)
|
| 428 |
+
|
| 429 |
+
rope_theta = 10000
|
| 430 |
if hasattr(config, 'rope_theta') and config.rope_theta is not None:
|
| 431 |
rope_theta = config.rope_theta
|
| 432 |
|