{
  "vocab_size": 1000,
  "emb_dim": 256,
  "n_heads": 8,
  "n_layers": 4,
  "max_seq_len": 128,
  "dropout": 0.1,
  "model_type": "MiniTransformer"
}
{
  "vocab_size": 1000,
  "emb_dim": 256,
  "n_heads": 8,
  "n_layers": 4,
  "max_seq_len": 128,
  "dropout": 0.1,
  "model_type": "MiniTransformer"
}