| { |
| "best_metric": 0.8055555555555556, |
| "best_model_checkpoint": "test/checkpoint-6", |
| "epoch": 19.727272727272727, |
| "global_step": 40, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.73, |
| "eval_accuracy": 0.6388888888888888, |
| "eval_f1": 0.6477582846003898, |
| "eval_loss": 0.679732084274292, |
| "eval_precision": 0.6572420634920635, |
| "eval_recall": 0.6388888888888888, |
| "eval_runtime": 5.9427, |
| "eval_samples_per_second": 6.058, |
| "eval_steps_per_second": 0.168, |
| "step": 2 |
| }, |
| { |
| "epoch": 1.73, |
| "eval_accuracy": 0.75, |
| "eval_f1": 0.6904761904761904, |
| "eval_loss": 0.6750033497810364, |
| "eval_precision": 0.6397058823529411, |
| "eval_recall": 0.75, |
| "eval_runtime": 4.9005, |
| "eval_samples_per_second": 7.346, |
| "eval_steps_per_second": 0.204, |
| "step": 4 |
| }, |
| { |
| "epoch": 2.73, |
| "eval_accuracy": 0.8055555555555556, |
| "eval_f1": 0.7188034188034188, |
| "eval_loss": 0.6533546447753906, |
| "eval_precision": 0.6489197530864197, |
| "eval_recall": 0.8055555555555556, |
| "eval_runtime": 4.9351, |
| "eval_samples_per_second": 7.295, |
| "eval_steps_per_second": 0.203, |
| "step": 6 |
| }, |
| { |
| "epoch": 3.73, |
| "eval_accuracy": 0.8055555555555556, |
| "eval_f1": 0.7188034188034188, |
| "eval_loss": 0.6294739842414856, |
| "eval_precision": 0.6489197530864197, |
| "eval_recall": 0.8055555555555556, |
| "eval_runtime": 4.7154, |
| "eval_samples_per_second": 7.635, |
| "eval_steps_per_second": 0.212, |
| "step": 8 |
| }, |
| { |
| "epoch": 4.73, |
| "learning_rate": 0.0001, |
| "loss": 0.8452, |
| "step": 10 |
| }, |
| { |
| "epoch": 4.73, |
| "eval_accuracy": 0.8055555555555556, |
| "eval_f1": 0.7188034188034188, |
| "eval_loss": 0.6180709600448608, |
| "eval_precision": 0.6489197530864197, |
| "eval_recall": 0.8055555555555556, |
| "eval_runtime": 5.3103, |
| "eval_samples_per_second": 6.779, |
| "eval_steps_per_second": 0.188, |
| "step": 10 |
| }, |
| { |
| "epoch": 5.73, |
| "eval_accuracy": 0.8055555555555556, |
| "eval_f1": 0.7188034188034188, |
| "eval_loss": 0.6019383668899536, |
| "eval_precision": 0.6489197530864197, |
| "eval_recall": 0.8055555555555556, |
| "eval_runtime": 4.7577, |
| "eval_samples_per_second": 7.567, |
| "eval_steps_per_second": 0.21, |
| "step": 12 |
| }, |
| { |
| "epoch": 6.73, |
| "eval_accuracy": 0.8055555555555556, |
| "eval_f1": 0.7188034188034188, |
| "eval_loss": 0.6006457805633545, |
| "eval_precision": 0.6489197530864197, |
| "eval_recall": 0.8055555555555556, |
| "eval_runtime": 4.7756, |
| "eval_samples_per_second": 7.538, |
| "eval_steps_per_second": 0.209, |
| "step": 14 |
| }, |
| { |
| "epoch": 7.73, |
| "eval_accuracy": 0.8055555555555556, |
| "eval_f1": 0.7188034188034188, |
| "eval_loss": 0.584420919418335, |
| "eval_precision": 0.6489197530864197, |
| "eval_recall": 0.8055555555555556, |
| "eval_runtime": 5.7897, |
| "eval_samples_per_second": 6.218, |
| "eval_steps_per_second": 0.173, |
| "step": 16 |
| }, |
| { |
| "epoch": 8.73, |
| "eval_accuracy": 0.8055555555555556, |
| "eval_f1": 0.7188034188034188, |
| "eval_loss": 0.5822530388832092, |
| "eval_precision": 0.6489197530864197, |
| "eval_recall": 0.8055555555555556, |
| "eval_runtime": 4.7388, |
| "eval_samples_per_second": 7.597, |
| "eval_steps_per_second": 0.211, |
| "step": 18 |
| }, |
| { |
| "epoch": 9.73, |
| "learning_rate": 6.666666666666667e-05, |
| "loss": 0.7824, |
| "step": 20 |
| }, |
| { |
| "epoch": 9.73, |
| "eval_accuracy": 0.8055555555555556, |
| "eval_f1": 0.7188034188034188, |
| "eval_loss": 0.5739169716835022, |
| "eval_precision": 0.6489197530864197, |
| "eval_recall": 0.8055555555555556, |
| "eval_runtime": 4.8104, |
| "eval_samples_per_second": 7.484, |
| "eval_steps_per_second": 0.208, |
| "step": 20 |
| }, |
| { |
| "epoch": 10.73, |
| "eval_accuracy": 0.8055555555555556, |
| "eval_f1": 0.7188034188034188, |
| "eval_loss": 0.5697076916694641, |
| "eval_precision": 0.6489197530864197, |
| "eval_recall": 0.8055555555555556, |
| "eval_runtime": 4.6974, |
| "eval_samples_per_second": 7.664, |
| "eval_steps_per_second": 0.213, |
| "step": 22 |
| }, |
| { |
| "epoch": 11.73, |
| "eval_accuracy": 0.8055555555555556, |
| "eval_f1": 0.7188034188034188, |
| "eval_loss": 0.5695454478263855, |
| "eval_precision": 0.6489197530864197, |
| "eval_recall": 0.8055555555555556, |
| "eval_runtime": 4.9353, |
| "eval_samples_per_second": 7.294, |
| "eval_steps_per_second": 0.203, |
| "step": 24 |
| }, |
| { |
| "epoch": 12.73, |
| "eval_accuracy": 0.8055555555555556, |
| "eval_f1": 0.7188034188034188, |
| "eval_loss": 0.5626423954963684, |
| "eval_precision": 0.6489197530864197, |
| "eval_recall": 0.8055555555555556, |
| "eval_runtime": 5.8521, |
| "eval_samples_per_second": 6.152, |
| "eval_steps_per_second": 0.171, |
| "step": 26 |
| }, |
| { |
| "epoch": 13.73, |
| "eval_accuracy": 0.8055555555555556, |
| "eval_f1": 0.7188034188034188, |
| "eval_loss": 0.5666201710700989, |
| "eval_precision": 0.6489197530864197, |
| "eval_recall": 0.8055555555555556, |
| "eval_runtime": 5.1217, |
| "eval_samples_per_second": 7.029, |
| "eval_steps_per_second": 0.195, |
| "step": 28 |
| }, |
| { |
| "epoch": 14.73, |
| "learning_rate": 3.3333333333333335e-05, |
| "loss": 0.7149, |
| "step": 30 |
| }, |
| { |
| "epoch": 14.73, |
| "eval_accuracy": 0.8055555555555556, |
| "eval_f1": 0.7188034188034188, |
| "eval_loss": 0.5559208989143372, |
| "eval_precision": 0.6489197530864197, |
| "eval_recall": 0.8055555555555556, |
| "eval_runtime": 5.1084, |
| "eval_samples_per_second": 7.047, |
| "eval_steps_per_second": 0.196, |
| "step": 30 |
| }, |
| { |
| "epoch": 15.73, |
| "eval_accuracy": 0.8055555555555556, |
| "eval_f1": 0.7188034188034188, |
| "eval_loss": 0.5556015372276306, |
| "eval_precision": 0.6489197530864197, |
| "eval_recall": 0.8055555555555556, |
| "eval_runtime": 6.0749, |
| "eval_samples_per_second": 5.926, |
| "eval_steps_per_second": 0.165, |
| "step": 32 |
| }, |
| { |
| "epoch": 16.73, |
| "eval_accuracy": 0.8055555555555556, |
| "eval_f1": 0.7188034188034188, |
| "eval_loss": 0.5465428233146667, |
| "eval_precision": 0.6489197530864197, |
| "eval_recall": 0.8055555555555556, |
| "eval_runtime": 4.8659, |
| "eval_samples_per_second": 7.398, |
| "eval_steps_per_second": 0.206, |
| "step": 34 |
| }, |
| { |
| "epoch": 17.73, |
| "eval_accuracy": 0.8055555555555556, |
| "eval_f1": 0.7188034188034188, |
| "eval_loss": 0.5558464527130127, |
| "eval_precision": 0.6489197530864197, |
| "eval_recall": 0.8055555555555556, |
| "eval_runtime": 4.8604, |
| "eval_samples_per_second": 7.407, |
| "eval_steps_per_second": 0.206, |
| "step": 36 |
| }, |
| { |
| "epoch": 18.73, |
| "eval_accuracy": 0.8055555555555556, |
| "eval_f1": 0.7188034188034188, |
| "eval_loss": 0.5543624758720398, |
| "eval_precision": 0.6489197530864197, |
| "eval_recall": 0.8055555555555556, |
| "eval_runtime": 4.7553, |
| "eval_samples_per_second": 7.57, |
| "eval_steps_per_second": 0.21, |
| "step": 38 |
| }, |
| { |
| "epoch": 19.73, |
| "learning_rate": 0.0, |
| "loss": 0.6869, |
| "step": 40 |
| }, |
| { |
| "epoch": 19.73, |
| "eval_accuracy": 0.8055555555555556, |
| "eval_f1": 0.7188034188034188, |
| "eval_loss": 0.5504012107849121, |
| "eval_precision": 0.6489197530864197, |
| "eval_recall": 0.8055555555555556, |
| "eval_runtime": 5.3116, |
| "eval_samples_per_second": 6.778, |
| "eval_steps_per_second": 0.188, |
| "step": 40 |
| }, |
| { |
| "epoch": 19.73, |
| "step": 40, |
| "total_flos": 2.8684782950326272e+17, |
| "train_loss": 0.7573485970497131, |
| "train_runtime": 850.4827, |
| "train_samples_per_second": 16.085, |
| "train_steps_per_second": 0.047 |
| } |
| ], |
| "max_steps": 40, |
| "num_train_epochs": 20, |
| "total_flos": 2.8684782950326272e+17, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|