Update configuration_HelpingAI.py
Browse files
configuration_HelpingAI.py
CHANGED
|
@@ -34,6 +34,7 @@ class HelpingAIConfig(PretrainedConfig):
|
|
| 34 |
use_cache=True,
|
| 35 |
hidden_activation=None,
|
| 36 |
rope_theta=10000,
|
|
|
|
| 37 |
attention_bias=False,
|
| 38 |
attention_dropout=0.0,
|
| 39 |
num_experts_per_tok=2,
|
|
@@ -63,5 +64,5 @@ class HelpingAIConfig(PretrainedConfig):
|
|
| 63 |
self.num_local_experts = num_local_experts
|
| 64 |
self.router_aux_loss_coef = router_aux_loss_coef
|
| 65 |
self.output_router_logits = output_router_logits
|
| 66 |
-
self.rope_pct = rope_pct
|
| 67 |
super().__init__(**kwargs)
|
|
|
|
| 34 |
use_cache=True,
|
| 35 |
hidden_activation=None,
|
| 36 |
rope_theta=10000,
|
| 37 |
+
rope_pct=0.25,
|
| 38 |
attention_bias=False,
|
| 39 |
attention_dropout=0.0,
|
| 40 |
num_experts_per_tok=2,
|
|
|
|
| 64 |
self.num_local_experts = num_local_experts
|
| 65 |
self.router_aux_loss_coef = router_aux_loss_coef
|
| 66 |
self.output_router_logits = output_router_logits
|
| 67 |
+
self.rope_pct = rope_pct
|
| 68 |
super().__init__(**kwargs)
|