yagizdevre committed on
Commit
413ea27
·
1 Parent(s): 2955790

config fix

Browse files
__pycache__/attn.cpython-312.pyc CHANGED
Binary files a/__pycache__/attn.cpython-312.pyc and b/__pycache__/attn.cpython-312.pyc differ
 
configuration_minitransformer.py CHANGED
@@ -7,13 +7,13 @@ class MiniTransformerConfig(PretrainedConfig):
7
  def __init__(
8
  self,
9
  bsz: int = 1,
10
- dim: int = 1536,
11
- num_heads: int = 8,
12
- num_layers: int = 26,
13
  seq_len: int = 8192,
14
- window_size: int = 1024,
15
  vocab_size: int = 200064,
16
- mlp_scale: int = 12,
17
  bias: bool = False,
18
  dropout: float = 0.0,
19
  softcap: float = 50.0,
 
7
  def __init__(
8
  self,
9
  bsz: int = 1,
10
+ dim: int = 768,
11
+ num_heads: int = 24,
12
+ num_layers: int = 27,
13
  seq_len: int = 8192,
14
+ window_size: int = 8192,
15
  vocab_size: int = 200064,
16
+ mlp_scale: int = 4,
17
  bias: bool = False,
18
  dropout: float = 0.0,
19
  softcap: float = 50.0,