{ "phase_results": [ { "phase": "phase0a", "skipped": true }, { "phase": "phase0b", "best_validation_loss": 1.5795909994765147, "best_metrics": { "loss": 1.5795909994765147, "token_count": 60099.0, "example_count": 1109.0, "first_token_correct": 546.0, "first_token_count": 1109.0, "first_token_exact_match": 0.49233543733092877, "phase": "phase0b" }, "global_step": 398, "run_step_end": 398, "train_dataset": { "example_count": 50865, "observation_steps_mean": 1.0, "observation_steps_max": 1, "input_tokens_mean": 25.618814508994397, "input_tokens_max": 540, "target_tokens_mean": 56.929185097807924, "target_tokens_max": 1024, "dataset_counts": { "alpaca": 50865 } }, "validation_dataset": { "example_count": 1109, "observation_steps_mean": 1.0, "observation_steps_max": 1, "input_tokens_mean": 25.237150586113614, "input_tokens_max": 274, "target_tokens_mean": 54.19206492335437, "target_tokens_max": 534, "dataset_counts": { "alpaca": 1109 } }, "wandb_enabled": true } ] }