{
  "vocab_size": 30000,
  "d_model": 256,
  "num_heads": 4,
  "num_layers": 4,
  "d_ff": 1024,
  "max_seq_len": 128,
  "pad_token_id": 0,
  "size_name": "mini"
}
{
  "vocab_size": 30000,
  "d_model": 256,
  "num_heads": 4,
  "num_layers": 4,
  "d_ff": 1024,
  "max_seq_len": 128,
  "pad_token_id": 0,
  "size_name": "mini"
}