NERMODEL / trainer_state.json
Mohsen21's picture
Initial upload
3298466 verified
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 76.0,
"eval_steps": 500,
"global_step": 988,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 3.766739246202633e-05,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0758,
"eval_samples_per_second": 672.473,
"eval_steps_per_second": 52.743,
"step": 13
},
{
"epoch": 2.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.708461215661373e-05,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0739,
"eval_samples_per_second": 689.71,
"eval_steps_per_second": 54.095,
"step": 26
},
{
"epoch": 3.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.261350891785696e-05,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.075,
"eval_samples_per_second": 679.831,
"eval_steps_per_second": 53.32,
"step": 39
},
{
"epoch": 3.8461538461538463,
"grad_norm": 0.0005477790255099535,
"learning_rate": 1.924615384615385e-05,
"loss": 0.0001,
"step": 50
},
{
"epoch": 4.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 1.9983246602350846e-05,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0755,
"eval_samples_per_second": 675.625,
"eval_steps_per_second": 52.99,
"step": 52
},
{
"epoch": 5.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 1.7973663489101455e-05,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0792,
"eval_samples_per_second": 643.631,
"eval_steps_per_second": 50.481,
"step": 65
},
{
"epoch": 6.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 1.637468085391447e-05,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0782,
"eval_samples_per_second": 652.282,
"eval_steps_per_second": 51.159,
"step": 78
},
{
"epoch": 7.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 1.5053579772938974e-05,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0805,
"eval_samples_per_second": 633.305,
"eval_steps_per_second": 49.671,
"step": 91
},
{
"epoch": 7.6923076923076925,
"grad_norm": 0.0003741559630725533,
"learning_rate": 1.847692307692308e-05,
"loss": 0.0,
"step": 100
},
{
"epoch": 8.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 1.389792396366829e-05,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0742,
"eval_samples_per_second": 687.259,
"eval_steps_per_second": 53.903,
"step": 104
},
{
"epoch": 9.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 1.2904973118565977e-05,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0794,
"eval_samples_per_second": 642.487,
"eval_steps_per_second": 50.391,
"step": 117
},
{
"epoch": 10.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 1.2025779142277315e-05,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0748,
"eval_samples_per_second": 682.218,
"eval_steps_per_second": 53.507,
"step": 130
},
{
"epoch": 11.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 1.126035385823343e-05,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.076,
"eval_samples_per_second": 671.112,
"eval_steps_per_second": 52.636,
"step": 143
},
{
"epoch": 11.538461538461538,
"grad_norm": 0.00027452429640106857,
"learning_rate": 1.770769230769231e-05,
"loss": 0.0,
"step": 150
},
{
"epoch": 12.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 1.0585004929453135e-05,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0754,
"eval_samples_per_second": 676.83,
"eval_steps_per_second": 53.085,
"step": 156
},
{
"epoch": 13.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 9.961702744476497e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.2793,
"eval_samples_per_second": 182.586,
"eval_steps_per_second": 14.32,
"step": 169
},
{
"epoch": 14.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 9.413349289388862e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0764,
"eval_samples_per_second": 667.706,
"eval_steps_per_second": 52.369,
"step": 182
},
{
"epoch": 15.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 8.932946002460085e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.076,
"eval_samples_per_second": 671.445,
"eval_steps_per_second": 52.662,
"step": 195
},
{
"epoch": 15.384615384615385,
"grad_norm": 0.0002010212338063866,
"learning_rate": 1.693846153846154e-05,
"loss": 0.0,
"step": 200
},
{
"epoch": 16.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 8.463478479825426e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.076,
"eval_samples_per_second": 671.392,
"eval_steps_per_second": 52.658,
"step": 208
},
{
"epoch": 17.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 8.053830242715776e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0839,
"eval_samples_per_second": 608.167,
"eval_steps_per_second": 47.699,
"step": 221
},
{
"epoch": 18.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 7.682633622607682e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0742,
"eval_samples_per_second": 687.463,
"eval_steps_per_second": 53.919,
"step": 234
},
{
"epoch": 19.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 7.346277016040403e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0756,
"eval_samples_per_second": 674.981,
"eval_steps_per_second": 52.94,
"step": 247
},
{
"epoch": 19.23076923076923,
"grad_norm": 0.00017087982269003987,
"learning_rate": 1.6169230769230772e-05,
"loss": 0.0,
"step": 250
},
{
"epoch": 20.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 7.011135039647343e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0764,
"eval_samples_per_second": 667.716,
"eval_steps_per_second": 52.37,
"step": 260
},
{
"epoch": 21.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 6.707206921419129e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0766,
"eval_samples_per_second": 665.655,
"eval_steps_per_second": 52.208,
"step": 273
},
{
"epoch": 22.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 6.460109489125898e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0816,
"eval_samples_per_second": 624.77,
"eval_steps_per_second": 49.002,
"step": 286
},
{
"epoch": 23.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 6.168189429445192e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0788,
"eval_samples_per_second": 646.907,
"eval_steps_per_second": 50.738,
"step": 299
},
{
"epoch": 23.076923076923077,
"grad_norm": 0.0001346742210444063,
"learning_rate": 1.54e-05,
"loss": 0.0,
"step": 300
},
{
"epoch": 24.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 5.980409241601592e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.2365,
"eval_samples_per_second": 215.673,
"eval_steps_per_second": 16.916,
"step": 312
},
{
"epoch": 25.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 5.7013526202354115e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0758,
"eval_samples_per_second": 672.947,
"eval_steps_per_second": 52.78,
"step": 325
},
{
"epoch": 26.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 5.5516734391858336e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0754,
"eval_samples_per_second": 676.203,
"eval_steps_per_second": 53.036,
"step": 338
},
{
"epoch": 26.923076923076923,
"grad_norm": 0.00011714433640008792,
"learning_rate": 1.4630769230769233e-05,
"loss": 0.0,
"step": 350
},
{
"epoch": 27.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 5.349874300009105e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0772,
"eval_samples_per_second": 660.463,
"eval_steps_per_second": 51.801,
"step": 351
},
{
"epoch": 28.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 5.1536571845645085e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0774,
"eval_samples_per_second": 659.11,
"eval_steps_per_second": 51.695,
"step": 364
},
{
"epoch": 29.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 5.008918833482312e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0797,
"eval_samples_per_second": 640.166,
"eval_steps_per_second": 50.209,
"step": 377
},
{
"epoch": 30.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 4.825435553357238e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0741,
"eval_samples_per_second": 688.662,
"eval_steps_per_second": 54.013,
"step": 390
},
{
"epoch": 30.76923076923077,
"grad_norm": 0.000104076876596082,
"learning_rate": 1.3861538461538461e-05,
"loss": 0.0,
"step": 400
},
{
"epoch": 31.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 4.660724698624108e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0772,
"eval_samples_per_second": 660.52,
"eval_steps_per_second": 51.806,
"step": 403
},
{
"epoch": 32.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 4.554401130008046e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0779,
"eval_samples_per_second": 654.388,
"eval_steps_per_second": 51.325,
"step": 416
},
{
"epoch": 33.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 4.401058504299726e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.079,
"eval_samples_per_second": 645.62,
"eval_steps_per_second": 50.637,
"step": 429
},
{
"epoch": 34.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 4.281378551240778e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0747,
"eval_samples_per_second": 682.954,
"eval_steps_per_second": 53.565,
"step": 442
},
{
"epoch": 34.61538461538461,
"grad_norm": 9.115073044085875e-05,
"learning_rate": 1.3092307692307693e-05,
"loss": 0.0,
"step": 450
},
{
"epoch": 35.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 4.155664555582916e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0772,
"eval_samples_per_second": 660.928,
"eval_steps_per_second": 51.838,
"step": 455
},
{
"epoch": 36.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 4.062813331984216e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0778,
"eval_samples_per_second": 655.34,
"eval_steps_per_second": 51.399,
"step": 468
},
{
"epoch": 37.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 3.960818958148593e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0763,
"eval_samples_per_second": 668.511,
"eval_steps_per_second": 52.432,
"step": 481
},
{
"epoch": 38.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 3.86090732718003e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0754,
"eval_samples_per_second": 676.372,
"eval_steps_per_second": 53.049,
"step": 494
},
{
"epoch": 38.46153846153846,
"grad_norm": 8.525206794729456e-05,
"learning_rate": 1.2323076923076924e-05,
"loss": 0.0,
"step": 500
},
{
"epoch": 39.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 3.718094603755162e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0769,
"eval_samples_per_second": 663.353,
"eval_steps_per_second": 52.028,
"step": 507
},
{
"epoch": 40.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 3.6739313600264722e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.082,
"eval_samples_per_second": 621.958,
"eval_steps_per_second": 48.781,
"step": 520
},
{
"epoch": 41.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 3.5706143535207957e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0839,
"eval_samples_per_second": 607.589,
"eval_steps_per_second": 47.654,
"step": 533
},
{
"epoch": 42.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 3.473499873507535e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0781,
"eval_samples_per_second": 653.089,
"eval_steps_per_second": 51.223,
"step": 546
},
{
"epoch": 42.30769230769231,
"grad_norm": 7.703923620283604e-05,
"learning_rate": 1.1553846153846156e-05,
"loss": 0.0,
"step": 550
},
{
"epoch": 43.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 3.4267693536094157e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0781,
"eval_samples_per_second": 653.245,
"eval_steps_per_second": 51.235,
"step": 559
},
{
"epoch": 44.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 3.3662902296782704e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0773,
"eval_samples_per_second": 659.878,
"eval_steps_per_second": 51.755,
"step": 572
},
{
"epoch": 45.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 3.2630439363856567e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0767,
"eval_samples_per_second": 665.299,
"eval_steps_per_second": 52.18,
"step": 585
},
{
"epoch": 46.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 3.18609454552643e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0765,
"eval_samples_per_second": 666.648,
"eval_steps_per_second": 52.286,
"step": 598
},
{
"epoch": 46.15384615384615,
"grad_norm": 6.898341962369159e-05,
"learning_rate": 1.0784615384615384e-05,
"loss": 0.0,
"step": 600
},
{
"epoch": 47.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 3.125113380519906e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0802,
"eval_samples_per_second": 635.718,
"eval_steps_per_second": 49.86,
"step": 611
},
{
"epoch": 48.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 3.0880059966875706e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0811,
"eval_samples_per_second": 629.003,
"eval_steps_per_second": 49.334,
"step": 624
},
{
"epoch": 49.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 3.007978648383869e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0776,
"eval_samples_per_second": 656.906,
"eval_steps_per_second": 51.522,
"step": 637
},
{
"epoch": 50.0,
"grad_norm": 6.396565004251897e-05,
"learning_rate": 1.0015384615384615e-05,
"loss": 0.0,
"step": 650
},
{
"epoch": 50.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.9140269361960236e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0867,
"eval_samples_per_second": 588.503,
"eval_steps_per_second": 46.157,
"step": 650
},
{
"epoch": 51.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.8741619644279126e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0783,
"eval_samples_per_second": 651.157,
"eval_steps_per_second": 51.071,
"step": 663
},
{
"epoch": 52.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.8582894628925715e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0778,
"eval_samples_per_second": 655.119,
"eval_steps_per_second": 51.382,
"step": 676
},
{
"epoch": 53.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.8347033094178187e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.077,
"eval_samples_per_second": 662.076,
"eval_steps_per_second": 51.928,
"step": 689
},
{
"epoch": 53.84615384615385,
"grad_norm": 5.985860479995608e-05,
"learning_rate": 9.246153846153847e-06,
"loss": 0.0,
"step": 700
},
{
"epoch": 54.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.7935459456784884e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0847,
"eval_samples_per_second": 602.475,
"eval_steps_per_second": 47.253,
"step": 702
},
{
"epoch": 55.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.730073902057484e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0809,
"eval_samples_per_second": 630.412,
"eval_steps_per_second": 49.444,
"step": 715
},
{
"epoch": 56.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.65099970420124e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0795,
"eval_samples_per_second": 641.431,
"eval_steps_per_second": 50.308,
"step": 728
},
{
"epoch": 57.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.6181696739513427e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.079,
"eval_samples_per_second": 645.371,
"eval_steps_per_second": 50.617,
"step": 741
},
{
"epoch": 57.69230769230769,
"grad_norm": 5.6825054343789816e-05,
"learning_rate": 8.476923076923078e-06,
"loss": 0.0,
"step": 750
},
{
"epoch": 58.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.5803217340580886e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0845,
"eval_samples_per_second": 603.199,
"eval_steps_per_second": 47.31,
"step": 754
},
{
"epoch": 59.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.5398476282134652e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0818,
"eval_samples_per_second": 623.278,
"eval_steps_per_second": 48.885,
"step": 767
},
{
"epoch": 60.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.4956075321824756e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0783,
"eval_samples_per_second": 651.367,
"eval_steps_per_second": 51.088,
"step": 780
},
{
"epoch": 61.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.46099057221727e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0847,
"eval_samples_per_second": 602.231,
"eval_steps_per_second": 47.234,
"step": 793
},
{
"epoch": 61.53846153846154,
"grad_norm": 5.1071423513349146e-05,
"learning_rate": 7.707692307692308e-06,
"loss": 0.0,
"step": 800
},
{
"epoch": 62.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.4360676889045862e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0837,
"eval_samples_per_second": 609.373,
"eval_steps_per_second": 47.794,
"step": 806
},
{
"epoch": 63.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.3770801362843486e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0865,
"eval_samples_per_second": 589.861,
"eval_steps_per_second": 46.264,
"step": 819
},
{
"epoch": 64.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.331081532247481e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0785,
"eval_samples_per_second": 649.981,
"eval_steps_per_second": 50.979,
"step": 832
},
{
"epoch": 65.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.3108309505914804e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0886,
"eval_samples_per_second": 575.651,
"eval_steps_per_second": 45.149,
"step": 845
},
{
"epoch": 65.38461538461539,
"grad_norm": 5.284359576762654e-05,
"learning_rate": 6.9384615384615395e-06,
"loss": 0.0,
"step": 850
},
{
"epoch": 66.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.2956874090596102e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0804,
"eval_samples_per_second": 634.054,
"eval_steps_per_second": 49.73,
"step": 858
},
{
"epoch": 67.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.2875919967191294e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0853,
"eval_samples_per_second": 598.007,
"eval_steps_per_second": 46.903,
"step": 871
},
{
"epoch": 68.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.276377244925243e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0852,
"eval_samples_per_second": 598.276,
"eval_steps_per_second": 46.924,
"step": 884
},
{
"epoch": 69.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.2665922188025434e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0817,
"eval_samples_per_second": 624.209,
"eval_steps_per_second": 48.958,
"step": 897
},
{
"epoch": 69.23076923076923,
"grad_norm": 4.872769204666838e-05,
"learning_rate": 6.169230769230769e-06,
"loss": 0.0,
"step": 900
},
{
"epoch": 70.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.2590579646930564e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0808,
"eval_samples_per_second": 631.529,
"eval_steps_per_second": 49.532,
"step": 910
},
{
"epoch": 71.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.2511769657285186e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0846,
"eval_samples_per_second": 602.946,
"eval_steps_per_second": 47.29,
"step": 923
},
{
"epoch": 72.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.2218735011847457e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0818,
"eval_samples_per_second": 623.221,
"eval_steps_per_second": 48.88,
"step": 936
},
{
"epoch": 73.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.199440586991841e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0816,
"eval_samples_per_second": 624.999,
"eval_steps_per_second": 49.019,
"step": 949
},
{
"epoch": 73.07692307692308,
"grad_norm": 4.863178764935583e-05,
"learning_rate": 5.400000000000001e-06,
"loss": 0.0,
"step": 950
},
{
"epoch": 74.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.160148142138496e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0841,
"eval_samples_per_second": 606.643,
"eval_steps_per_second": 47.58,
"step": 962
},
{
"epoch": 75.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.1215453216427704e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0827,
"eval_samples_per_second": 616.959,
"eval_steps_per_second": 48.389,
"step": 975
},
{
"epoch": 76.0,
"eval_ECONOMIC_ACTIVITIES": {
"f1": 1.0,
"number": 51,
"precision": 1.0,
"recall": 1.0
},
"eval_MONTH": {
"f1": 1.0,
"number": 80,
"precision": 1.0,
"recall": 1.0
},
"eval_YEAR": {
"f1": 1.0,
"number": 67,
"precision": 1.0,
"recall": 1.0
},
"eval_loss": 2.0821323687414406e-06,
"eval_overall_accuracy": 1.0,
"eval_overall_f1": 1.0,
"eval_overall_precision": 1.0,
"eval_overall_recall": 1.0,
"eval_runtime": 0.0862,
"eval_samples_per_second": 591.451,
"eval_steps_per_second": 46.388,
"step": 988
}
],
"logging_steps": 50,
"max_steps": 1300,
"num_input_tokens_seen": 0,
"num_train_epochs": 100,
"save_steps": 500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 229437023509200.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}