| { | |
| "best_metric": 0.8408180526634443, | |
| "best_model_checkpoint": "/chronos_data/smangalik/beliefs_modeling/models/self-belief-classifier-roberta-large-4/checkpoint-400", | |
| "epoch": 11.926605504587156, | |
| "eval_steps": 50, | |
| "global_step": 650, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 0.92, | |
| "learning_rate": 9.800000000000001e-06, | |
| "loss": 0.6617, | |
| "step": 50 | |
| }, | |
| { | |
| "epoch": 0.92, | |
| "eval_accuracy": 0.8205128205128205, | |
| "eval_f1": 0.819110295968641, | |
| "eval_loss": 0.4295506179332733, | |
| "eval_precision": 0.8192280280764046, | |
| "eval_recall": 0.8205128205128205, | |
| "eval_runtime": 3.9576, | |
| "eval_samples_per_second": 128.108, | |
| "eval_steps_per_second": 16.171, | |
| "step": 50 | |
| }, | |
| { | |
| "epoch": 1.83, | |
| "learning_rate": 9.815094339622643e-06, | |
| "loss": 0.3715, | |
| "step": 100 | |
| }, | |
| { | |
| "epoch": 1.83, | |
| "eval_accuracy": 0.8303747534516766, | |
| "eval_f1": 0.8353461502742431, | |
| "eval_loss": 0.4670024514198303, | |
| "eval_precision": 0.8434047624966725, | |
| "eval_recall": 0.8303747534516766, | |
| "eval_runtime": 3.9366, | |
| "eval_samples_per_second": 128.79, | |
| "eval_steps_per_second": 16.258, | |
| "step": 100 | |
| }, | |
| { | |
| "epoch": 2.75, | |
| "learning_rate": 9.626415094339624e-06, | |
| "loss": 0.2344, | |
| "step": 150 | |
| }, | |
| { | |
| "epoch": 2.75, | |
| "eval_accuracy": 0.814595660749507, | |
| "eval_f1": 0.8244485345966336, | |
| "eval_loss": 0.6940962672233582, | |
| "eval_precision": 0.8428588493485568, | |
| "eval_recall": 0.814595660749507, | |
| "eval_runtime": 3.4428, | |
| "eval_samples_per_second": 147.263, | |
| "eval_steps_per_second": 18.589, | |
| "step": 150 | |
| }, | |
| { | |
| "epoch": 3.67, | |
| "learning_rate": 9.437735849056604e-06, | |
| "loss": 0.1797, | |
| "step": 200 | |
| }, | |
| { | |
| "epoch": 3.67, | |
| "eval_accuracy": 0.8264299802761341, | |
| "eval_f1": 0.8329637103282812, | |
| "eval_loss": 0.7602464556694031, | |
| "eval_precision": 0.8480073311662002, | |
| "eval_recall": 0.8264299802761341, | |
| "eval_runtime": 3.5906, | |
| "eval_samples_per_second": 141.203, | |
| "eval_steps_per_second": 17.824, | |
| "step": 200 | |
| }, | |
| { | |
| "epoch": 4.59, | |
| "learning_rate": 9.252830188679246e-06, | |
| "loss": 0.1187, | |
| "step": 250 | |
| }, | |
| { | |
| "epoch": 4.59, | |
| "eval_accuracy": 0.8165680473372781, | |
| "eval_f1": 0.8260410505358732, | |
| "eval_loss": 1.040390133857727, | |
| "eval_precision": 0.8445598652695405, | |
| "eval_recall": 0.8165680473372781, | |
| "eval_runtime": 3.1667, | |
| "eval_samples_per_second": 160.104, | |
| "eval_steps_per_second": 20.21, | |
| "step": 250 | |
| }, | |
| { | |
| "epoch": 5.5, | |
| "learning_rate": 9.067924528301889e-06, | |
| "loss": 0.067, | |
| "step": 300 | |
| }, | |
| { | |
| "epoch": 5.5, | |
| "eval_accuracy": 0.8264299802761341, | |
| "eval_f1": 0.8313863456050801, | |
| "eval_loss": 1.0527454614639282, | |
| "eval_precision": 0.8389317220188415, | |
| "eval_recall": 0.8264299802761341, | |
| "eval_runtime": 4.2619, | |
| "eval_samples_per_second": 118.962, | |
| "eval_steps_per_second": 15.017, | |
| "step": 300 | |
| }, | |
| { | |
| "epoch": 6.42, | |
| "learning_rate": 8.879245283018869e-06, | |
| "loss": 0.0635, | |
| "step": 350 | |
| }, | |
| { | |
| "epoch": 6.42, | |
| "eval_accuracy": 0.8303747534516766, | |
| "eval_f1": 0.8376041385770543, | |
| "eval_loss": 1.1337926387786865, | |
| "eval_precision": 0.8504492855502807, | |
| "eval_recall": 0.8303747534516766, | |
| "eval_runtime": 4.0094, | |
| "eval_samples_per_second": 126.454, | |
| "eval_steps_per_second": 15.963, | |
| "step": 350 | |
| }, | |
| { | |
| "epoch": 7.34, | |
| "learning_rate": 8.69433962264151e-06, | |
| "loss": 0.0254, | |
| "step": 400 | |
| }, | |
| { | |
| "epoch": 7.34, | |
| "eval_accuracy": 0.8382642998027613, | |
| "eval_f1": 0.8408180526634443, | |
| "eval_loss": 1.1419103145599365, | |
| "eval_precision": 0.8458355761491414, | |
| "eval_recall": 0.8382642998027613, | |
| "eval_runtime": 3.6866, | |
| "eval_samples_per_second": 137.524, | |
| "eval_steps_per_second": 17.36, | |
| "step": 400 | |
| }, | |
| { | |
| "epoch": 8.26, | |
| "learning_rate": 8.505660377358492e-06, | |
| "loss": 0.0374, | |
| "step": 450 | |
| }, | |
| { | |
| "epoch": 8.26, | |
| "eval_accuracy": 0.8284023668639053, | |
| "eval_f1": 0.8320464737199128, | |
| "eval_loss": 1.2373206615447998, | |
| "eval_precision": 0.8369363588201497, | |
| "eval_recall": 0.8284023668639053, | |
| "eval_runtime": 4.0231, | |
| "eval_samples_per_second": 126.021, | |
| "eval_steps_per_second": 15.908, | |
| "step": 450 | |
| }, | |
| { | |
| "epoch": 9.17, | |
| "learning_rate": 8.316981132075472e-06, | |
| "loss": 0.013, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 9.17, | |
| "eval_accuracy": 0.834319526627219, | |
| "eval_f1": 0.8376685641339108, | |
| "eval_loss": 1.2268174886703491, | |
| "eval_precision": 0.8421800999981714, | |
| "eval_recall": 0.834319526627219, | |
| "eval_runtime": 4.1413, | |
| "eval_samples_per_second": 122.425, | |
| "eval_steps_per_second": 15.454, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 10.09, | |
| "learning_rate": 8.128301886792453e-06, | |
| "loss": 0.0213, | |
| "step": 550 | |
| }, | |
| { | |
| "epoch": 10.09, | |
| "eval_accuracy": 0.834319526627219, | |
| "eval_f1": 0.8396773850135992, | |
| "eval_loss": 1.2791889905929565, | |
| "eval_precision": 0.8499112935552067, | |
| "eval_recall": 0.834319526627219, | |
| "eval_runtime": 4.1859, | |
| "eval_samples_per_second": 121.122, | |
| "eval_steps_per_second": 15.29, | |
| "step": 550 | |
| }, | |
| { | |
| "epoch": 11.01, | |
| "learning_rate": 7.939622641509435e-06, | |
| "loss": 0.0003, | |
| "step": 600 | |
| }, | |
| { | |
| "epoch": 11.01, | |
| "eval_accuracy": 0.8303747534516766, | |
| "eval_f1": 0.8359161169722349, | |
| "eval_loss": 1.3518141508102417, | |
| "eval_precision": 0.8446374502780472, | |
| "eval_recall": 0.8303747534516766, | |
| "eval_runtime": 3.09, | |
| "eval_samples_per_second": 164.08, | |
| "eval_steps_per_second": 20.712, | |
| "step": 600 | |
| }, | |
| { | |
| "epoch": 11.93, | |
| "learning_rate": 7.750943396226415e-06, | |
| "loss": 0.0313, | |
| "step": 650 | |
| }, | |
| { | |
| "epoch": 11.93, | |
| "eval_accuracy": 0.8382642998027613, | |
| "eval_f1": 0.8405182086840655, | |
| "eval_loss": 1.3090877532958984, | |
| "eval_precision": 0.8442165138341221, | |
| "eval_recall": 0.8382642998027613, | |
| "eval_runtime": 4.7065, | |
| "eval_samples_per_second": 107.722, | |
| "eval_steps_per_second": 13.598, | |
| "step": 650 | |
| } | |
| ], | |
| "logging_steps": 50, | |
| "max_steps": 2700, | |
| "num_train_epochs": 50, | |
| "save_steps": 50, | |
| "total_flos": 2261979798655680.0, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |