| { | |
| "best_metric": 0.03481420502066612, | |
| "best_model_checkpoint": "results_bert-base-french-europeana-cased/epoch20_bs64/checkpoint-48", | |
| "epoch": 11.0, | |
| "eval_steps": 500, | |
| "global_step": 176, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0, | |
| "grad_norm": 0.47372615337371826, | |
| "learning_rate": 4.75e-05, | |
| "loss": 0.3883, | |
| "step": 16 | |
| }, | |
| { | |
| "epoch": 1.0, | |
| "eval_accurracy": { | |
| "accuracy": 0.9764285714285714 | |
| }, | |
| "eval_f1": [ | |
| 0.9799147900182593, | |
| 0.8114285714285714, | |
| 1.0 | |
| ], | |
| "eval_loss": 0.08146535605192184, | |
| "eval_precision": [ | |
| 0.971049457177322, | |
| 0.8875, | |
| 1.0 | |
| ], | |
| "eval_recall": [ | |
| 0.9889434889434889, | |
| 0.7473684210526316, | |
| 1.0 | |
| ], | |
| "eval_runtime": 4.1114, | |
| "eval_samples_per_second": 12.161, | |
| "eval_steps_per_second": 0.243, | |
| "step": 16 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "grad_norm": 0.4207443296909332, | |
| "learning_rate": 4.5e-05, | |
| "loss": 0.0566, | |
| "step": 32 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_accurracy": { | |
| "accuracy": 0.9878571428571429 | |
| }, | |
| "eval_f1": [ | |
| 0.9895641497851443, | |
| 0.91005291005291, | |
| 1.0 | |
| ], | |
| "eval_loss": 0.04085615277290344, | |
| "eval_precision": [ | |
| 0.9889570552147239, | |
| 0.9148936170212766, | |
| 1.0 | |
| ], | |
| "eval_recall": [ | |
| 0.9901719901719902, | |
| 0.9052631578947369, | |
| 1.0 | |
| ], | |
| "eval_runtime": 3.9019, | |
| "eval_samples_per_second": 12.814, | |
| "eval_steps_per_second": 0.256, | |
| "step": 32 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "grad_norm": 0.4004434049129486, | |
| "learning_rate": 4.25e-05, | |
| "loss": 0.0291, | |
| "step": 48 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_accurracy": { | |
| "accuracy": 0.99 | |
| }, | |
| "eval_f1": [ | |
| 0.991389913899139, | |
| 0.9270833333333334, | |
| 1.0 | |
| ], | |
| "eval_loss": 0.03481420502066612, | |
| "eval_precision": [ | |
| 0.9926108374384236, | |
| 0.9175257731958762, | |
| 1.0 | |
| ], | |
| "eval_recall": [ | |
| 0.9901719901719902, | |
| 0.9368421052631579, | |
| 1.0 | |
| ], | |
| "eval_runtime": 3.5383, | |
| "eval_samples_per_second": 14.131, | |
| "eval_steps_per_second": 0.283, | |
| "step": 48 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "grad_norm": 0.3703693747520447, | |
| "learning_rate": 4e-05, | |
| "loss": 0.0169, | |
| "step": 64 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_accurracy": { | |
| "accuracy": 0.9885714285714285 | |
| }, | |
| "eval_f1": [ | |
| 0.9901719901719902, | |
| 0.9157894736842105, | |
| 1.0 | |
| ], | |
| "eval_loss": 0.03665424883365631, | |
| "eval_precision": [ | |
| 0.9901719901719902, | |
| 0.9157894736842105, | |
| 1.0 | |
| ], | |
| "eval_recall": [ | |
| 0.9901719901719902, | |
| 0.9157894736842105, | |
| 1.0 | |
| ], | |
| "eval_runtime": 3.4858, | |
| "eval_samples_per_second": 14.344, | |
| "eval_steps_per_second": 0.287, | |
| "step": 64 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "grad_norm": 0.3292807936668396, | |
| "learning_rate": 3.7500000000000003e-05, | |
| "loss": 0.0109, | |
| "step": 80 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_accurracy": { | |
| "accuracy": 0.9878571428571429 | |
| }, | |
| "eval_f1": [ | |
| 0.9894867037724181, | |
| 0.9154228855721394, | |
| 1.0 | |
| ], | |
| "eval_loss": 0.03761892020702362, | |
| "eval_precision": [ | |
| 0.9962640099626401, | |
| 0.8679245283018868, | |
| 1.0 | |
| ], | |
| "eval_recall": [ | |
| 0.9828009828009828, | |
| 0.968421052631579, | |
| 1.0 | |
| ], | |
| "eval_runtime": 3.6656, | |
| "eval_samples_per_second": 13.64, | |
| "eval_steps_per_second": 0.273, | |
| "step": 80 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "grad_norm": 0.17665812373161316, | |
| "learning_rate": 3.5e-05, | |
| "loss": 0.0073, | |
| "step": 96 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_accurracy": { | |
| "accuracy": 0.9878571428571429 | |
| }, | |
| "eval_f1": [ | |
| 0.9895897121861604, | |
| 0.9081081081081082, | |
| 1.0 | |
| ], | |
| "eval_loss": 0.04045535624027252, | |
| "eval_precision": [ | |
| 0.9865689865689866, | |
| 0.9333333333333333, | |
| 1.0 | |
| ], | |
| "eval_recall": [ | |
| 0.9926289926289926, | |
| 0.8842105263157894, | |
| 1.0 | |
| ], | |
| "eval_runtime": 3.1662, | |
| "eval_samples_per_second": 15.792, | |
| "eval_steps_per_second": 0.316, | |
| "step": 96 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "grad_norm": 0.46033716201782227, | |
| "learning_rate": 3.2500000000000004e-05, | |
| "loss": 0.0043, | |
| "step": 112 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "eval_accurracy": { | |
| "accuracy": 0.9885714285714285 | |
| }, | |
| "eval_f1": [ | |
| 0.9901840490797545, | |
| 0.9148936170212766, | |
| 1.0 | |
| ], | |
| "eval_loss": 0.0450633242726326, | |
| "eval_precision": [ | |
| 0.9889705882352942, | |
| 0.9247311827956989, | |
| 1.0 | |
| ], | |
| "eval_recall": [ | |
| 0.9914004914004914, | |
| 0.9052631578947369, | |
| 1.0 | |
| ], | |
| "eval_runtime": 3.1686, | |
| "eval_samples_per_second": 15.78, | |
| "eval_steps_per_second": 0.316, | |
| "step": 112 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "grad_norm": 0.7053983807563782, | |
| "learning_rate": 3e-05, | |
| "loss": 0.0029, | |
| "step": 128 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "eval_accurracy": { | |
| "accuracy": 0.9871428571428571 | |
| }, | |
| "eval_f1": [ | |
| 0.9889570552147239, | |
| 0.9042553191489362, | |
| 1.0 | |
| ], | |
| "eval_loss": 0.055573731660842896, | |
| "eval_precision": [ | |
| 0.9877450980392157, | |
| 0.9139784946236559, | |
| 1.0 | |
| ], | |
| "eval_recall": [ | |
| 0.9901719901719902, | |
| 0.8947368421052632, | |
| 1.0 | |
| ], | |
| "eval_runtime": 3.4353, | |
| "eval_samples_per_second": 14.555, | |
| "eval_steps_per_second": 0.291, | |
| "step": 128 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "grad_norm": 0.16288042068481445, | |
| "learning_rate": 2.7500000000000004e-05, | |
| "loss": 0.0023, | |
| "step": 144 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "eval_accurracy": { | |
| "accuracy": 0.9892857142857143 | |
| }, | |
| "eval_f1": [ | |
| 0.9908144519289651, | |
| 0.918918918918919, | |
| 1.0 | |
| ], | |
| "eval_loss": 0.05289832502603531, | |
| "eval_precision": [ | |
| 0.9877899877899878, | |
| 0.9444444444444444, | |
| 1.0 | |
| ], | |
| "eval_recall": [ | |
| 0.9938574938574939, | |
| 0.8947368421052632, | |
| 1.0 | |
| ], | |
| "eval_runtime": 3.8415, | |
| "eval_samples_per_second": 13.016, | |
| "eval_steps_per_second": 0.26, | |
| "step": 144 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "grad_norm": 0.19770997762680054, | |
| "learning_rate": 2.5e-05, | |
| "loss": 0.0021, | |
| "step": 160 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "eval_accurracy": { | |
| "accuracy": 0.9892857142857143 | |
| }, | |
| "eval_f1": [ | |
| 0.990791896869245, | |
| 0.9206349206349206, | |
| 1.0 | |
| ], | |
| "eval_loss": 0.04967246204614639, | |
| "eval_precision": [ | |
| 0.9901840490797545, | |
| 0.925531914893617, | |
| 1.0 | |
| ], | |
| "eval_recall": [ | |
| 0.9914004914004914, | |
| 0.9157894736842105, | |
| 1.0 | |
| ], | |
| "eval_runtime": 3.3345, | |
| "eval_samples_per_second": 14.995, | |
| "eval_steps_per_second": 0.3, | |
| "step": 160 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "grad_norm": 0.07273274660110474, | |
| "learning_rate": 2.25e-05, | |
| "loss": 0.0013, | |
| "step": 176 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "eval_accurracy": { | |
| "accuracy": 0.9921428571428571 | |
| }, | |
| "eval_f1": [ | |
| 0.9932390903503381, | |
| 0.9424083769633508, | |
| 1.0 | |
| ], | |
| "eval_loss": 0.04350681230425835, | |
| "eval_precision": [ | |
| 0.993849938499385, | |
| 0.9375, | |
| 1.0 | |
| ], | |
| "eval_recall": [ | |
| 0.9926289926289926, | |
| 0.9473684210526315, | |
| 1.0 | |
| ], | |
| "eval_runtime": 3.3327, | |
| "eval_samples_per_second": 15.003, | |
| "eval_steps_per_second": 0.3, | |
| "step": 176 | |
| } | |
| ], | |
| "logging_steps": 500, | |
| "max_steps": 320, | |
| "num_input_tokens_seen": 0, | |
| "num_train_epochs": 20, | |
| "save_steps": 500, | |
| "stateful_callbacks": { | |
| "TrainerControl": { | |
| "args": { | |
| "should_epoch_stop": false, | |
| "should_evaluate": false, | |
| "should_log": false, | |
| "should_save": true, | |
| "should_training_stop": false | |
| }, | |
| "attributes": {} | |
| } | |
| }, | |
| "total_flos": 168415447860000.0, | |
| "train_batch_size": 64, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |