| { |
| "best_metric": 0.9345950946320974, |
| "best_model_checkpoint": "../output/roberta-base-sst_bin/checkpoint-700", |
| "epoch": 3.225806451612903, |
| "global_step": 700, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.46, |
| "eval_accuracy": 0.9071100917431193, |
| "eval_f1": 0.9068620534601686, |
| "eval_loss": 0.2708713114261627, |
| "eval_precision": 0.9092790114821938, |
| "eval_recall": 0.9064683842721226, |
| "eval_runtime": 4.3371, |
| "eval_samples_per_second": 201.055, |
| "step": 100 |
| }, |
| { |
| "epoch": 0.92, |
| "eval_accuracy": 0.9220183486238532, |
| "eval_f1": 0.9218539136302294, |
| "eval_loss": 0.22453300654888153, |
| "eval_precision": 0.9236269780824236, |
| "eval_recall": 0.9214869074682159, |
| "eval_runtime": 4.3383, |
| "eval_samples_per_second": 201.001, |
| "step": 200 |
| }, |
| { |
| "epoch": 1.38, |
| "eval_accuracy": 0.9277522935779816, |
| "eval_f1": 0.9277248238707003, |
| "eval_loss": 0.26203280687332153, |
| "eval_precision": 0.9277451780122622, |
| "eval_recall": 0.9277069125199966, |
| "eval_runtime": 4.3399, |
| "eval_samples_per_second": 200.924, |
| "step": 300 |
| }, |
| { |
| "epoch": 1.84, |
| "eval_accuracy": 0.9288990825688074, |
| "eval_f1": 0.9288990825688074, |
| "eval_loss": 0.27323779463768005, |
| "eval_precision": 0.9292119222025764, |
| "eval_recall": 0.9292119222025764, |
| "eval_runtime": 4.3401, |
| "eval_samples_per_second": 200.916, |
| "step": 400 |
| }, |
| { |
| "epoch": 2.3, |
| "learning_rate": 1.0783410138248848e-05, |
| "loss": 0.2545, |
| "step": 500 |
| }, |
| { |
| "epoch": 2.3, |
| "eval_accuracy": 0.9288990825688074, |
| "eval_f1": 0.928763802145097, |
| "eval_loss": 0.3416966497898102, |
| "eval_precision": 0.9303050804456754, |
| "eval_recall": 0.9284120569167298, |
| "eval_runtime": 4.3403, |
| "eval_samples_per_second": 200.908, |
| "step": 500 |
| }, |
| { |
| "epoch": 2.76, |
| "eval_accuracy": 0.9288990825688074, |
| "eval_f1": 0.9288256977356504, |
| "eval_loss": 0.250255286693573, |
| "eval_precision": 0.9293817476383266, |
| "eval_recall": 0.9286225477814263, |
| "eval_runtime": 4.3388, |
| "eval_samples_per_second": 200.976, |
| "step": 600 |
| }, |
| { |
| "epoch": 3.23, |
| "eval_accuracy": 0.9346330275229358, |
| "eval_f1": 0.9345950946320974, |
| "eval_loss": 0.3421626687049866, |
| "eval_precision": 0.9347459813507295, |
| "eval_recall": 0.9345057674496927, |
| "eval_runtime": 4.3413, |
| "eval_samples_per_second": 200.862, |
| "step": 700 |
| } |
| ], |
| "max_steps": 1085, |
| "num_train_epochs": 5, |
| "total_flos": 2137477265246208, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|