{
  "device": "cuda",
  "dropout": 0.2,
  "n_blocks": 3,
  "transformer_config": {
    "block_size": 250,
    "dropout": 0.2,
    "n_embd": 396,
    "n_head": 8
  },
  "vocab_size": 8011,
  "xlstm_config": {
    "batch_size": 8,
    "block_size": 250,
    "config_block": "msm",
    "device": "cuda",
    "n_embd": 396
  }
}