| { |
| "best_global_step": 2088, |
| "best_metric": 0.8285096878151668, |
| "best_model_checkpoint": "./robertalarge_multiclass/checkpoint-2088", |
| "epoch": 4.0, |
| "eval_steps": 500, |
| "global_step": 2088, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 1.0, |
| "grad_norm": 38.4963493347168, |
| "learning_rate": 1.996168582375479e-05, |
| "loss": 0.7634037061669361, |
| "step": 522 |
| }, |
| { |
| "epoch": 1.0, |
| "eval_Nomove_f1": 0.8534048976853404, |
| "eval_Nomove_precision": 0.8588791357191087, |
| "eval_Nomove_recall": 0.848, |
| "eval_Nomove_support": 3000, |
| "eval_PressAccuracy_f1": 0.875776397515528, |
| "eval_PressAccuracy_precision": 0.8788469029996104, |
| "eval_PressAccuracy_recall": 0.8727272727272727, |
| "eval_PressAccuracy_support": 2585, |
| "eval_PressReasoning_f1": 0.7333333333333333, |
| "eval_PressReasoning_precision": 0.6212624584717608, |
| "eval_PressReasoning_recall": 0.8947368421052632, |
| "eval_PressReasoning_support": 209, |
| "eval_Uptake (Restating or revoicing)_f1": 0.597979797979798, |
| "eval_Uptake (Restating or revoicing)_precision": 0.5025466893039049, |
| "eval_Uptake (Restating or revoicing)_recall": 0.7381546134663342, |
| "eval_Uptake (Restating or revoicing)_support": 401, |
| "eval_accuracy": 0.8313151900251768, |
| "eval_loss": 0.5038919448852539, |
| "eval_macro_f1": 0.7744391016253172, |
| "eval_macro_precision": 0.7441072454154222, |
| "eval_macro_recall": 0.8245914064239864, |
| "eval_mcc": 0.7642954946246379, |
| "eval_participation management_f1": 0.811701081612586, |
| "eval_participation management_precision": 0.8590010405827263, |
| "eval_participation management_recall": 0.7693383038210625, |
| "eval_participation management_support": 2146, |
| "eval_runtime": 7.1557, |
| "eval_samples_per_second": 1165.647, |
| "eval_steps_per_second": 18.307, |
| "eval_weighted_f1": 0.8343200776202896, |
| "eval_weighted_precision": 0.8420139024976997, |
| "eval_weighted_recall": 0.8313151900251768, |
| "step": 522 |
| }, |
| { |
| "epoch": 2.0, |
| "grad_norm": 6.410867214202881, |
| "learning_rate": 1.7782034908471692e-05, |
| "loss": 0.4319716997987009, |
| "step": 1044 |
| }, |
| { |
| "epoch": 2.0, |
| "eval_Nomove_f1": 0.8761967646087818, |
| "eval_Nomove_precision": 0.8678875081752779, |
| "eval_Nomove_recall": 0.8846666666666667, |
| "eval_Nomove_support": 3000, |
| "eval_PressAccuracy_f1": 0.8749497386409328, |
| "eval_PressAccuracy_precision": 0.9108413562159899, |
| "eval_PressAccuracy_recall": 0.8417794970986461, |
| "eval_PressAccuracy_support": 2585, |
| "eval_PressReasoning_f1": 0.7859078590785908, |
| "eval_PressReasoning_precision": 0.90625, |
| "eval_PressReasoning_recall": 0.69377990430622, |
| "eval_PressReasoning_support": 209, |
| "eval_Uptake (Restating or revoicing)_f1": 0.6924101198402132, |
| "eval_Uptake (Restating or revoicing)_precision": 0.7428571428571429, |
| "eval_Uptake (Restating or revoicing)_recall": 0.6483790523690773, |
| "eval_Uptake (Restating or revoicing)_support": 401, |
| "eval_accuracy": 0.8515765495743916, |
| "eval_loss": 0.4433172047138214, |
| "eval_macro_f1": 0.8108377087957347, |
| "eval_macro_precision": 0.8422786108456553, |
| "eval_macro_recall": 0.7878123568001445, |
| "eval_mcc": 0.7898141732587503, |
| "eval_participation management_f1": 0.8247240618101546, |
| "eval_participation management_precision": 0.7835570469798657, |
| "eval_participation management_recall": 0.8704566635601119, |
| "eval_participation management_support": 2146, |
| "eval_runtime": 7.1565, |
| "eval_samples_per_second": 1165.511, |
| "eval_steps_per_second": 18.305, |
| "eval_weighted_f1": 0.8514691770124805, |
| "eval_weighted_precision": 0.8544530412958486, |
| "eval_weighted_recall": 0.8515765495743916, |
| "step": 1044 |
| }, |
| { |
| "epoch": 3.0, |
| "grad_norm": 15.955626487731934, |
| "learning_rate": 1.555981268624947e-05, |
| "loss": 0.33474684675077826, |
| "step": 1566 |
| }, |
| { |
| "epoch": 3.0, |
| "eval_Nomove_f1": 0.8818949809508034, |
| "eval_Nomove_precision": 0.8765228844254198, |
| "eval_Nomove_recall": 0.8873333333333333, |
| "eval_Nomove_support": 3000, |
| "eval_PressAccuracy_f1": 0.895219512195122, |
| "eval_PressAccuracy_precision": 0.9031496062992126, |
| "eval_PressAccuracy_recall": 0.8874274661508704, |
| "eval_PressAccuracy_support": 2585, |
| "eval_PressReasoning_f1": 0.7851851851851851, |
| "eval_PressReasoning_precision": 0.8112244897959183, |
| "eval_PressReasoning_recall": 0.7607655502392344, |
| "eval_PressReasoning_support": 209, |
| "eval_Uptake (Restating or revoicing)_f1": 0.7187079407806191, |
| "eval_Uptake (Restating or revoicing)_precision": 0.7807017543859649, |
| "eval_Uptake (Restating or revoicing)_recall": 0.6658354114713217, |
| "eval_Uptake (Restating or revoicing)_support": 401, |
| "eval_accuracy": 0.8676417695719938, |
| "eval_loss": 0.4420914053916931, |
| "eval_macro_f1": 0.8259179007665363, |
| "eval_macro_precision": 0.8409864136479698, |
| "eval_macro_recall": 0.8131521285670041, |
| "eval_mcc": 0.8119580097491912, |
| "eval_participation management_f1": 0.8485818847209515, |
| "eval_participation management_precision": 0.8333333333333334, |
| "eval_participation management_recall": 0.8643988816402609, |
| "eval_participation management_support": 2146, |
| "eval_runtime": 7.1677, |
| "eval_samples_per_second": 1163.701, |
| "eval_steps_per_second": 18.277, |
| "eval_weighted_f1": 0.867184953176441, |
| "eval_weighted_precision": 0.8674200984017715, |
| "eval_weighted_recall": 0.8676417695719938, |
| "step": 1566 |
| }, |
| { |
| "epoch": 4.0, |
| "grad_norm": 36.6058464050293, |
| "learning_rate": 1.3337590464027246e-05, |
| "loss": 0.2601611257969648, |
| "step": 2088 |
| }, |
| { |
| "epoch": 4.0, |
| "eval_Nomove_f1": 0.881498224087827, |
| "eval_Nomove_precision": 0.8547276142767689, |
| "eval_Nomove_recall": 0.91, |
| "eval_Nomove_support": 3000, |
| "eval_PressAccuracy_f1": 0.8888455538221529, |
| "eval_PressAccuracy_precision": 0.8961856075501377, |
| "eval_PressAccuracy_recall": 0.8816247582205029, |
| "eval_PressAccuracy_support": 2585, |
| "eval_PressReasoning_f1": 0.8066037735849058, |
| "eval_PressReasoning_precision": 0.7953488372093023, |
| "eval_PressReasoning_recall": 0.8181818181818182, |
| "eval_PressReasoning_support": 209, |
| "eval_Uptake (Restating or revoicing)_f1": 0.7253613666228647, |
| "eval_Uptake (Restating or revoicing)_precision": 0.7666666666666667, |
| "eval_Uptake (Restating or revoicing)_recall": 0.6882793017456359, |
| "eval_Uptake (Restating or revoicing)_support": 401, |
| "eval_accuracy": 0.8644047476321784, |
| "eval_loss": 0.45752763748168945, |
| "eval_macro_f1": 0.8285096878151668, |
| "eval_macro_precision": 0.8354787959044984, |
| "eval_macro_recall": 0.8230840908206446, |
| "eval_mcc": 0.8074382310097558, |
| "eval_participation management_f1": 0.8402395209580839, |
| "eval_participation management_precision": 0.8644652538196156, |
| "eval_participation management_recall": 0.8173345759552656, |
| "eval_participation management_support": 2146, |
| "eval_runtime": 7.1558, |
| "eval_samples_per_second": 1165.633, |
| "eval_steps_per_second": 18.307, |
| "eval_weighted_f1": 0.8637770696037415, |
| "eval_weighted_precision": 0.8643599464517906, |
| "eval_weighted_recall": 0.8644047476321784, |
| "step": 2088 |
| } |
| ], |
| "logging_steps": 500, |
| "max_steps": 5220, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 10, |
| "save_steps": 500, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": true, |
| "should_training_stop": false |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 1.1956807869597816e+16, |
| "train_batch_size": 64, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|