Upload xlstm_config.yaml
Browse files- xlstm_config.yaml +19 -0
xlstm_config.yaml
ADDED
|
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
+vocab_size: 50304
+tie_weights: True
+mlstm_block:
+  mlstm:
+    conv1d_kernel_size: 4
+    qkv_proj_blocksize: 4
+    num_heads: 4
+slstm_block:
+  slstm:
+    num_heads: 4
+    conv1d_kernel_size: 4
+    bias_init: powerlaw_blockdependent
+  feedforward:
+    proj_factor: 1.3
+    act_fn: gelu
+context_length: 256
+num_blocks: 24
+embedding_dim: 768
+slstm_at: [3, 20]