{
  "model_type": "ChemQ3MTPForCausalLM",
  "num_future_tokens": 3,
  "horizon_loss_enabled": true,
  "mtp_head_enabled": true,
  "training_phases": [
    "mtp_horizon_training"
  ],
  "total_parameters": 9857155,
  "epochs_trained": 1,
  "total_steps": 145628
}
{
  "model_type": "ChemQ3MTPForCausalLM",
  "num_future_tokens": 3,
  "horizon_loss_enabled": true,
  "mtp_head_enabled": true,
  "training_phases": [
    "mtp_horizon_training"
  ],
  "total_parameters": 9857155,
  "epochs_trained": 1,
  "total_steps": 145628
}