DunnBC22's picture
All Dunn!!!
6e37896
{
"best_metric": 0.8655209539834394,
"best_model_checkpoint": "fnet-large-Financial_Sentiment_Analysis_v3/checkpoint-670",
"epoch": 10.0,
"global_step": 1340,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.01,
"learning_rate": 1.9985074626865674e-05,
"loss": 1.4558,
"step": 1
},
{
"epoch": 0.37,
"learning_rate": 1.9253731343283585e-05,
"loss": 0.81,
"step": 50
},
{
"epoch": 0.75,
"learning_rate": 1.8507462686567165e-05,
"loss": 0.6757,
"step": 100
},
{
"epoch": 1.0,
"eval_Macro F1": 0.36279759177569026,
"eval_Macro Precision": 0.5210381627879025,
"eval_Macro Recall": 0.4297578136174626,
"eval_Micro F1": 0.585480093676815,
"eval_Micro Precision": 0.585480093676815,
"eval_Micro Recall": 0.585480093676815,
"eval_Weighted F1": 0.4739290274173566,
"eval_Weighted Precision": 0.5912111905595777,
"eval_Weighted Recall": 0.585480093676815,
"eval_accuracy": 0.585480093676815,
"eval_loss": 0.5890011787414551,
"eval_runtime": 572.1521,
"eval_samples_per_second": 3.732,
"eval_steps_per_second": 0.059,
"step": 134
},
{
"epoch": 1.12,
"learning_rate": 1.7761194029850748e-05,
"loss": 0.615,
"step": 150
},
{
"epoch": 1.49,
"learning_rate": 1.701492537313433e-05,
"loss": 0.542,
"step": 200
},
{
"epoch": 1.87,
"learning_rate": 1.626865671641791e-05,
"loss": 0.4815,
"step": 250
},
{
"epoch": 2.0,
"eval_Macro F1": 0.7155645405318029,
"eval_Macro Precision": 0.7388441683808017,
"eval_Macro Recall": 0.7039245533319153,
"eval_Micro F1": 0.7826697892271662,
"eval_Micro Precision": 0.7826697892271662,
"eval_Micro Recall": 0.7826697892271662,
"eval_Weighted F1": 0.778931131467011,
"eval_Weighted Precision": 0.7878024754296866,
"eval_Weighted Recall": 0.7826697892271662,
"eval_accuracy": 0.7826697892271662,
"eval_loss": 0.3994453251361847,
"eval_runtime": 570.0533,
"eval_samples_per_second": 3.745,
"eval_steps_per_second": 0.06,
"step": 268
},
{
"epoch": 2.24,
"learning_rate": 1.5522388059701494e-05,
"loss": 0.3774,
"step": 300
},
{
"epoch": 2.61,
"learning_rate": 1.4776119402985077e-05,
"loss": 0.3366,
"step": 350
},
{
"epoch": 2.99,
"learning_rate": 1.4029850746268658e-05,
"loss": 0.314,
"step": 400
},
{
"epoch": 3.0,
"eval_Macro F1": 0.736751489500019,
"eval_Macro Precision": 0.7612057314604446,
"eval_Macro Recall": 0.7252037377440934,
"eval_Micro F1": 0.7990632318501172,
"eval_Micro Precision": 0.7990632318501171,
"eval_Micro Recall": 0.7990632318501171,
"eval_Weighted F1": 0.7977313198767033,
"eval_Weighted Precision": 0.8100534851227623,
"eval_Weighted Recall": 0.7990632318501171,
"eval_accuracy": 0.7990632318501171,
"eval_loss": 0.3560428321361542,
"eval_runtime": 581.4066,
"eval_samples_per_second": 3.672,
"eval_steps_per_second": 0.058,
"step": 402
},
{
"epoch": 3.36,
"learning_rate": 1.328358208955224e-05,
"loss": 0.2486,
"step": 450
},
{
"epoch": 3.73,
"learning_rate": 1.2537313432835823e-05,
"loss": 0.235,
"step": 500
},
{
"epoch": 4.0,
"eval_Macro F1": 0.7548578890974982,
"eval_Macro Precision": 0.7630930133664333,
"eval_Macro Recall": 0.7508943526446905,
"eval_Micro F1": 0.8201405152224824,
"eval_Micro Precision": 0.8201405152224824,
"eval_Micro Recall": 0.8201405152224824,
"eval_Weighted F1": 0.8217495227304409,
"eval_Weighted Precision": 0.8273969119402248,
"eval_Weighted Recall": 0.8201405152224824,
"eval_accuracy": 0.8201405152224824,
"eval_loss": 0.32777392864227295,
"eval_runtime": 571.7549,
"eval_samples_per_second": 3.734,
"eval_steps_per_second": 0.059,
"step": 536
},
{
"epoch": 4.1,
"learning_rate": 1.1791044776119405e-05,
"loss": 0.2309,
"step": 550
},
{
"epoch": 4.48,
"learning_rate": 1.1044776119402986e-05,
"loss": 0.188,
"step": 600
},
{
"epoch": 4.85,
"learning_rate": 1.029850746268657e-05,
"loss": 0.1986,
"step": 650
},
{
"epoch": 5.0,
"eval_Macro F1": 0.8208742913000978,
"eval_Macro Precision": 0.8083647050243598,
"eval_Macro Recall": 0.8400854990635674,
"eval_Micro F1": 0.8618266978922716,
"eval_Micro Precision": 0.8618266978922716,
"eval_Micro Recall": 0.8618266978922716,
"eval_Weighted F1": 0.8655209539834394,
"eval_Weighted Precision": 0.8723242107411118,
"eval_Weighted Recall": 0.8618266978922716,
"eval_accuracy": 0.8618266978922716,
"eval_loss": 0.3573662042617798,
"eval_runtime": 572.7753,
"eval_samples_per_second": 3.727,
"eval_steps_per_second": 0.059,
"step": 670
},
{
"epoch": 5.22,
"learning_rate": 9.552238805970149e-06,
"loss": 0.1838,
"step": 700
},
{
"epoch": 5.6,
"learning_rate": 8.805970149253732e-06,
"loss": 0.1485,
"step": 750
},
{
"epoch": 5.97,
"learning_rate": 8.059701492537314e-06,
"loss": 0.1605,
"step": 800
},
{
"epoch": 6.0,
"eval_Macro F1": 0.6588158445976257,
"eval_Macro Precision": 0.6987220074939374,
"eval_Macro Recall": 0.6469038522815648,
"eval_Micro F1": 0.7995316159250586,
"eval_Micro Precision": 0.7995316159250585,
"eval_Micro Recall": 0.7995316159250585,
"eval_Weighted F1": 0.7803428354754396,
"eval_Weighted Precision": 0.778138163263271,
"eval_Weighted Recall": 0.7995316159250585,
"eval_accuracy": 0.7995316159250585,
"eval_loss": 0.3885968029499054,
"eval_runtime": 571.7311,
"eval_samples_per_second": 3.734,
"eval_steps_per_second": 0.059,
"step": 804
},
{
"epoch": 6.34,
"learning_rate": 7.313432835820896e-06,
"loss": 0.1425,
"step": 850
},
{
"epoch": 6.72,
"learning_rate": 6.567164179104478e-06,
"loss": 0.1436,
"step": 900
},
{
"epoch": 7.0,
"eval_Macro F1": 0.7442069309467508,
"eval_Macro Precision": 0.7576208137220202,
"eval_Macro Recall": 0.7336057451045414,
"eval_Micro F1": 0.8229508196721311,
"eval_Micro Precision": 0.8229508196721311,
"eval_Micro Recall": 0.8229508196721311,
"eval_Weighted F1": 0.820676653014847,
"eval_Weighted Precision": 0.8209948655272054,
"eval_Weighted Recall": 0.8229508196721311,
"eval_accuracy": 0.8229508196721311,
"eval_loss": 0.4039975702762604,
"eval_runtime": 571.7322,
"eval_samples_per_second": 3.734,
"eval_steps_per_second": 0.059,
"step": 938
},
{
"epoch": 7.09,
"learning_rate": 5.820895522388061e-06,
"loss": 0.1368,
"step": 950
},
{
"epoch": 7.46,
"learning_rate": 5.074626865671642e-06,
"loss": 0.1253,
"step": 1000
},
{
"epoch": 7.84,
"learning_rate": 4.3283582089552236e-06,
"loss": 0.1373,
"step": 1050
},
{
"epoch": 8.0,
"eval_Macro F1": 0.7123175103612404,
"eval_Macro Precision": 0.7322548905353868,
"eval_Macro Recall": 0.7019914283796879,
"eval_Micro F1": 0.8168618266978923,
"eval_Micro Precision": 0.8168618266978923,
"eval_Micro Recall": 0.8168618266978923,
"eval_Weighted F1": 0.807557064029797,
"eval_Weighted Precision": 0.8030050439721781,
"eval_Weighted Recall": 0.8168618266978923,
"eval_accuracy": 0.8168618266978923,
"eval_loss": 0.4517393112182617,
"eval_runtime": 571.7202,
"eval_samples_per_second": 3.734,
"eval_steps_per_second": 0.059,
"step": 1072
},
{
"epoch": 8.21,
"learning_rate": 3.582089552238806e-06,
"loss": 0.1206,
"step": 1100
},
{
"epoch": 8.58,
"learning_rate": 2.835820895522388e-06,
"loss": 0.1141,
"step": 1150
},
{
"epoch": 8.96,
"learning_rate": 2.08955223880597e-06,
"loss": 0.1271,
"step": 1200
},
{
"epoch": 9.0,
"eval_Macro F1": 0.6891590047543085,
"eval_Macro Precision": 0.7169021915882458,
"eval_Macro Recall": 0.6768345177275865,
"eval_Micro F1": 0.8070257611241218,
"eval_Micro Precision": 0.8070257611241218,
"eval_Micro Recall": 0.8070257611241218,
"eval_Weighted F1": 0.7944945373911929,
"eval_Weighted Precision": 0.790593845937712,
"eval_Weighted Recall": 0.8070257611241218,
"eval_accuracy": 0.8070257611241218,
"eval_loss": 0.45325130224227905,
"eval_runtime": 593.452,
"eval_samples_per_second": 3.598,
"eval_steps_per_second": 0.057,
"step": 1206
},
{
"epoch": 9.33,
"learning_rate": 1.3432835820895524e-06,
"loss": 0.1171,
"step": 1250
},
{
"epoch": 9.7,
"learning_rate": 5.970149253731343e-07,
"loss": 0.1199,
"step": 1300
},
{
"epoch": 10.0,
"eval_Macro F1": 0.7368644623841439,
"eval_Macro Precision": 0.7514878901301887,
"eval_Macro Recall": 0.726942967276122,
"eval_Micro F1": 0.824824355971897,
"eval_Micro Precision": 0.824824355971897,
"eval_Micro Recall": 0.824824355971897,
"eval_Weighted F1": 0.8193666524247488,
"eval_Weighted Precision": 0.8163202759848958,
"eval_Weighted Recall": 0.824824355971897,
"eval_accuracy": 0.824824355971897,
"eval_loss": 0.474141001701355,
"eval_runtime": 569.2941,
"eval_samples_per_second": 3.75,
"eval_steps_per_second": 0.06,
"step": 1340
},
{
"epoch": 10.0,
"step": 1340,
"total_flos": 1.105606065652704e+16,
"train_loss": 0.26616470564657185,
"train_runtime": 95644.4856,
"train_samples_per_second": 0.892,
"train_steps_per_second": 0.014
}
],
"max_steps": 1340,
"num_train_epochs": 10,
"total_flos": 1.105606065652704e+16,
"trial_name": null,
"trial_params": null
}