| { | |
| "best_metric": 0.9321585507595793, | |
| "best_model_checkpoint": "tmp_ner_fantastic-bale-10_45/run-33/checkpoint-875", | |
| "epoch": 7.0, | |
| "eval_steps": 500, | |
| "global_step": 875, | |
| "is_hyper_param_search": true, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0, | |
| "eval_accuracy": 0.9730935342517575, | |
| "eval_loss": 0.08587262034416199, | |
| "eval_macro_f1": 0.9170047043200686, | |
| "eval_macro_precision": 0.9278276425309375, | |
| "eval_macro_recall": 0.90752738549263, | |
| "eval_runtime": 5.7832, | |
| "eval_samples_per_second": 172.914, | |
| "eval_steps_per_second": 21.614, | |
| "step": 125 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_accuracy": 0.9750480754074587, | |
| "eval_loss": 0.08141306042671204, | |
| "eval_macro_f1": 0.9264657139223695, | |
| "eval_macro_precision": 0.9157927892781152, | |
| "eval_macro_recall": 0.9377952332788448, | |
| "eval_runtime": 6.0324, | |
| "eval_samples_per_second": 165.773, | |
| "eval_steps_per_second": 20.722, | |
| "step": 250 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_accuracy": 0.9743781721887709, | |
| "eval_loss": 0.08608711510896683, | |
| "eval_macro_f1": 0.9247086477797719, | |
| "eval_macro_precision": 0.9173611315562689, | |
| "eval_macro_recall": 0.933305032585042, | |
| "eval_runtime": 6.0132, | |
| "eval_samples_per_second": 166.3, | |
| "eval_steps_per_second": 20.787, | |
| "step": 375 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "grad_norm": 0.6703500151634216, | |
| "learning_rate": 5.4624258845588244e-05, | |
| "loss": 0.1282, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_accuracy": 0.9770420226348476, | |
| "eval_loss": 0.09856158494949341, | |
| "eval_macro_f1": 0.9314150814858593, | |
| "eval_macro_precision": 0.9211465798788551, | |
| "eval_macro_recall": 0.9421883284262093, | |
| "eval_runtime": 5.932, | |
| "eval_samples_per_second": 168.577, | |
| "eval_steps_per_second": 21.072, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_accuracy": 0.9750086693357712, | |
| "eval_loss": 0.11021321266889572, | |
| "eval_macro_f1": 0.9267488028708639, | |
| "eval_macro_precision": 0.9153942226603791, | |
| "eval_macro_recall": 0.9386080517042859, | |
| "eval_runtime": 5.9689, | |
| "eval_samples_per_second": 167.536, | |
| "eval_steps_per_second": 20.942, | |
| "step": 625 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_accuracy": 0.9760253459853094, | |
| "eval_loss": 0.11098870635032654, | |
| "eval_macro_f1": 0.9287954097228024, | |
| "eval_macro_precision": 0.9205523043756338, | |
| "eval_macro_recall": 0.9374208211553338, | |
| "eval_runtime": 5.9208, | |
| "eval_samples_per_second": 168.896, | |
| "eval_steps_per_second": 21.112, | |
| "step": 750 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "eval_accuracy": 0.9773021027079852, | |
| "eval_loss": 0.11490638554096222, | |
| "eval_macro_f1": 0.9321585507595793, | |
| "eval_macro_precision": 0.9266098427277691, | |
| "eval_macro_recall": 0.9378807443139501, | |
| "eval_runtime": 6.075, | |
| "eval_samples_per_second": 164.61, | |
| "eval_steps_per_second": 20.576, | |
| "step": 875 | |
| } | |
| ], | |
| "logging_steps": 500, | |
| "max_steps": 4000, | |
| "num_input_tokens_seen": 0, | |
| "num_train_epochs": 32, | |
| "save_steps": 500, | |
| "stateful_callbacks": { | |
| "EarlyStoppingCallback": { | |
| "args": { | |
| "early_stopping_patience": 3, | |
| "early_stopping_threshold": 0.001 | |
| }, | |
| "attributes": { | |
| "early_stopping_patience_counter": 3 | |
| } | |
| }, | |
| "TrainerControl": { | |
| "args": { | |
| "should_epoch_stop": false, | |
| "should_evaluate": false, | |
| "should_log": false, | |
| "should_save": true, | |
| "should_training_stop": true | |
| }, | |
| "attributes": {} | |
| } | |
| }, | |
| "total_flos": 723885139142880.0, | |
| "train_batch_size": 8, | |
| "trial_name": null, | |
| "trial_params": { | |
| "learning_rate": 6.150691546013236e-05, | |
| "per_device_train_batch_size": 8, | |
| "warmup_ratio": 0.014555287490025246, | |
| "weight_decay": 0.02919246813677108 | |
| } | |
| } | |