| { |
| "best_metric": 0.8408180526634443, |
| "best_model_checkpoint": "/chronos_data/smangalik/beliefs_modeling/models/self-belief-classifier-roberta-large-4/checkpoint-400", |
| "epoch": 11.926605504587156, |
| "eval_steps": 50, |
| "global_step": 650, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.92, |
| "learning_rate": 9.800000000000001e-06, |
| "loss": 0.6617, |
| "step": 50 |
| }, |
| { |
| "epoch": 0.92, |
| "eval_accuracy": 0.8205128205128205, |
| "eval_f1": 0.819110295968641, |
| "eval_loss": 0.4295506179332733, |
| "eval_precision": 0.8192280280764046, |
| "eval_recall": 0.8205128205128205, |
| "eval_runtime": 3.9576, |
| "eval_samples_per_second": 128.108, |
| "eval_steps_per_second": 16.171, |
| "step": 50 |
| }, |
| { |
| "epoch": 1.83, |
| "learning_rate": 9.815094339622643e-06, |
| "loss": 0.3715, |
| "step": 100 |
| }, |
| { |
| "epoch": 1.83, |
| "eval_accuracy": 0.8303747534516766, |
| "eval_f1": 0.8353461502742431, |
| "eval_loss": 0.4670024514198303, |
| "eval_precision": 0.8434047624966725, |
| "eval_recall": 0.8303747534516766, |
| "eval_runtime": 3.9366, |
| "eval_samples_per_second": 128.79, |
| "eval_steps_per_second": 16.258, |
| "step": 100 |
| }, |
| { |
| "epoch": 2.75, |
| "learning_rate": 9.626415094339624e-06, |
| "loss": 0.2344, |
| "step": 150 |
| }, |
| { |
| "epoch": 2.75, |
| "eval_accuracy": 0.814595660749507, |
| "eval_f1": 0.8244485345966336, |
| "eval_loss": 0.6940962672233582, |
| "eval_precision": 0.8428588493485568, |
| "eval_recall": 0.814595660749507, |
| "eval_runtime": 3.4428, |
| "eval_samples_per_second": 147.263, |
| "eval_steps_per_second": 18.589, |
| "step": 150 |
| }, |
| { |
| "epoch": 3.67, |
| "learning_rate": 9.437735849056604e-06, |
| "loss": 0.1797, |
| "step": 200 |
| }, |
| { |
| "epoch": 3.67, |
| "eval_accuracy": 0.8264299802761341, |
| "eval_f1": 0.8329637103282812, |
| "eval_loss": 0.7602464556694031, |
| "eval_precision": 0.8480073311662002, |
| "eval_recall": 0.8264299802761341, |
| "eval_runtime": 3.5906, |
| "eval_samples_per_second": 141.203, |
| "eval_steps_per_second": 17.824, |
| "step": 200 |
| }, |
| { |
| "epoch": 4.59, |
| "learning_rate": 9.252830188679246e-06, |
| "loss": 0.1187, |
| "step": 250 |
| }, |
| { |
| "epoch": 4.59, |
| "eval_accuracy": 0.8165680473372781, |
| "eval_f1": 0.8260410505358732, |
| "eval_loss": 1.040390133857727, |
| "eval_precision": 0.8445598652695405, |
| "eval_recall": 0.8165680473372781, |
| "eval_runtime": 3.1667, |
| "eval_samples_per_second": 160.104, |
| "eval_steps_per_second": 20.21, |
| "step": 250 |
| }, |
| { |
| "epoch": 5.5, |
| "learning_rate": 9.067924528301889e-06, |
| "loss": 0.067, |
| "step": 300 |
| }, |
| { |
| "epoch": 5.5, |
| "eval_accuracy": 0.8264299802761341, |
| "eval_f1": 0.8313863456050801, |
| "eval_loss": 1.0527454614639282, |
| "eval_precision": 0.8389317220188415, |
| "eval_recall": 0.8264299802761341, |
| "eval_runtime": 4.2619, |
| "eval_samples_per_second": 118.962, |
| "eval_steps_per_second": 15.017, |
| "step": 300 |
| }, |
| { |
| "epoch": 6.42, |
| "learning_rate": 8.879245283018869e-06, |
| "loss": 0.0635, |
| "step": 350 |
| }, |
| { |
| "epoch": 6.42, |
| "eval_accuracy": 0.8303747534516766, |
| "eval_f1": 0.8376041385770543, |
| "eval_loss": 1.1337926387786865, |
| "eval_precision": 0.8504492855502807, |
| "eval_recall": 0.8303747534516766, |
| "eval_runtime": 4.0094, |
| "eval_samples_per_second": 126.454, |
| "eval_steps_per_second": 15.963, |
| "step": 350 |
| }, |
| { |
| "epoch": 7.34, |
| "learning_rate": 8.69433962264151e-06, |
| "loss": 0.0254, |
| "step": 400 |
| }, |
| { |
| "epoch": 7.34, |
| "eval_accuracy": 0.8382642998027613, |
| "eval_f1": 0.8408180526634443, |
| "eval_loss": 1.1419103145599365, |
| "eval_precision": 0.8458355761491414, |
| "eval_recall": 0.8382642998027613, |
| "eval_runtime": 3.6866, |
| "eval_samples_per_second": 137.524, |
| "eval_steps_per_second": 17.36, |
| "step": 400 |
| }, |
| { |
| "epoch": 8.26, |
| "learning_rate": 8.505660377358492e-06, |
| "loss": 0.0374, |
| "step": 450 |
| }, |
| { |
| "epoch": 8.26, |
| "eval_accuracy": 0.8284023668639053, |
| "eval_f1": 0.8320464737199128, |
| "eval_loss": 1.2373206615447998, |
| "eval_precision": 0.8369363588201497, |
| "eval_recall": 0.8284023668639053, |
| "eval_runtime": 4.0231, |
| "eval_samples_per_second": 126.021, |
| "eval_steps_per_second": 15.908, |
| "step": 450 |
| }, |
| { |
| "epoch": 9.17, |
| "learning_rate": 8.316981132075472e-06, |
| "loss": 0.013, |
| "step": 500 |
| }, |
| { |
| "epoch": 9.17, |
| "eval_accuracy": 0.834319526627219, |
| "eval_f1": 0.8376685641339108, |
| "eval_loss": 1.2268174886703491, |
| "eval_precision": 0.8421800999981714, |
| "eval_recall": 0.834319526627219, |
| "eval_runtime": 4.1413, |
| "eval_samples_per_second": 122.425, |
| "eval_steps_per_second": 15.454, |
| "step": 500 |
| }, |
| { |
| "epoch": 10.09, |
| "learning_rate": 8.128301886792453e-06, |
| "loss": 0.0213, |
| "step": 550 |
| }, |
| { |
| "epoch": 10.09, |
| "eval_accuracy": 0.834319526627219, |
| "eval_f1": 0.8396773850135992, |
| "eval_loss": 1.2791889905929565, |
| "eval_precision": 0.8499112935552067, |
| "eval_recall": 0.834319526627219, |
| "eval_runtime": 4.1859, |
| "eval_samples_per_second": 121.122, |
| "eval_steps_per_second": 15.29, |
| "step": 550 |
| }, |
| { |
| "epoch": 11.01, |
| "learning_rate": 7.939622641509435e-06, |
| "loss": 0.0003, |
| "step": 600 |
| }, |
| { |
| "epoch": 11.01, |
| "eval_accuracy": 0.8303747534516766, |
| "eval_f1": 0.8359161169722349, |
| "eval_loss": 1.3518141508102417, |
| "eval_precision": 0.8446374502780472, |
| "eval_recall": 0.8303747534516766, |
| "eval_runtime": 3.09, |
| "eval_samples_per_second": 164.08, |
| "eval_steps_per_second": 20.712, |
| "step": 600 |
| }, |
| { |
| "epoch": 11.93, |
| "learning_rate": 7.750943396226415e-06, |
| "loss": 0.0313, |
| "step": 650 |
| }, |
| { |
| "epoch": 11.93, |
| "eval_accuracy": 0.8382642998027613, |
| "eval_f1": 0.8405182086840655, |
| "eval_loss": 1.3090877532958984, |
| "eval_precision": 0.8442165138341221, |
| "eval_recall": 0.8382642998027613, |
| "eval_runtime": 4.7065, |
| "eval_samples_per_second": 107.722, |
| "eval_steps_per_second": 13.598, |
| "step": 650 |
| } |
| ], |
| "logging_steps": 50, |
| "max_steps": 2700, |
| "num_train_epochs": 50, |
| "save_steps": 50, |
| "total_flos": 2261979798655680.0, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|