| { | |
| "context_length": 256, | |
| "vocab_size": 50304, | |
| "num_layers": 12, | |
| "embd_size": 768, | |
| "num_heads": 12, | |
| "step": 100, | |
| "val_loss": 5.318082332611084 | |
| } |
| { | |
| "context_length": 256, | |
| "vocab_size": 50304, | |
| "num_layers": 12, | |
| "embd_size": 768, | |
| "num_heads": 12, | |
| "step": 100, | |
| "val_loss": 5.318082332611084 | |
| } |