| { | |
| "phase_results": [ | |
| { | |
| "phase": "phase0a", | |
| "skipped": true | |
| }, | |
| { | |
| "phase": "phase0b", | |
| "best_validation_loss": 1.5795909994765147, | |
| "best_metrics": { | |
| "loss": 1.5795909994765147, | |
| "token_count": 60099.0, | |
| "example_count": 1109.0, | |
| "first_token_correct": 546.0, | |
| "first_token_count": 1109.0, | |
| "first_token_exact_match": 0.49233543733092877, | |
| "phase": "phase0b" | |
| }, | |
| "global_step": 398, | |
| "run_step_end": 398, | |
| "train_dataset": { | |
| "example_count": 50865, | |
| "observation_steps_mean": 1.0, | |
| "observation_steps_max": 1, | |
| "input_tokens_mean": 25.618814508994397, | |
| "input_tokens_max": 540, | |
| "target_tokens_mean": 56.929185097807924, | |
| "target_tokens_max": 1024, | |
| "dataset_counts": { | |
| "alpaca": 50865 | |
| } | |
| }, | |
| "validation_dataset": { | |
| "example_count": 1109, | |
| "observation_steps_mean": 1.0, | |
| "observation_steps_max": 1, | |
| "input_tokens_mean": 25.237150586113614, | |
| "input_tokens_max": 274, | |
| "target_tokens_mean": 54.19206492335437, | |
| "target_tokens_max": 534, | |
| "dataset_counts": { | |
| "alpaca": 1109 | |
| } | |
| }, | |
| "wandb_enabled": true | |
| } | |
| ] | |
| } |