| { | |
| "d_model": 128, | |
| "nhead": 4, | |
| "num_layers": 4, | |
| "vocab_size": 257, | |
| "avg_loss": 0.054804470509290694, | |
| "avg_bpb": 0.07906613782229914 | |
| } |
| { | |
| "d_model": 128, | |
| "nhead": 4, | |
| "num_layers": 4, | |
| "vocab_size": 257, | |
| "avg_loss": 0.054804470509290694, | |
| "avg_bpb": 0.07906613782229914 | |
| } |