{
  "device": "cuda",
  "dropout": 0.2,
  "n_blocks": 3,
  "transformer_config": {
    "block_size": 154,
    "dropout": 0.2,
    "n_embd": 192,
    "n_head": 4
  },
  "vocab_size": 8010,
  "xlstm_config": {
    "batch_size": 8,
    "block_size": 154,
    "config_block": "msm",
    "device": "cuda",
    "n_embd": 192
  }
}