{
  "model_name": "AgLM",
  "block_size": 128,
  "n_embd": 128,
  "n_head": 4,
  "n_layer": 4,
  "vocab_size": 8000,
  "batch_size": 8,
  "grad_accum": 4,
  "max_epochs": 3,
  "end_token_id": 4
}
{
  "model_name": "AgLM",
  "block_size": 128,
  "n_embd": 128,
  "n_head": 4,
  "n_layer": 4,
  "vocab_size": 8000,
  "batch_size": 8,
  "grad_accum": 4,
  "max_epochs": 3,
  "end_token_id": 4
}