{ "best_metric": 0.8655209539834394, "best_model_checkpoint": "fnet-large-Financial_Sentiment_Analysis_v3/checkpoint-670", "epoch": 10.0, "global_step": 1340, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.01, "learning_rate": 1.9985074626865674e-05, "loss": 1.4558, "step": 1 }, { "epoch": 0.37, "learning_rate": 1.9253731343283585e-05, "loss": 0.81, "step": 50 }, { "epoch": 0.75, "learning_rate": 1.8507462686567165e-05, "loss": 0.6757, "step": 100 }, { "epoch": 1.0, "eval_Macro F1": 0.36279759177569026, "eval_Macro Precision": 0.5210381627879025, "eval_Macro Recall": 0.4297578136174626, "eval_Micro F1": 0.585480093676815, "eval_Micro Precision": 0.585480093676815, "eval_Micro Recall": 0.585480093676815, "eval_Weighted F1": 0.4739290274173566, "eval_Weighted Precision": 0.5912111905595777, "eval_Weighted Recall": 0.585480093676815, "eval_accuracy": 0.585480093676815, "eval_loss": 0.5890011787414551, "eval_runtime": 572.1521, "eval_samples_per_second": 3.732, "eval_steps_per_second": 0.059, "step": 134 }, { "epoch": 1.12, "learning_rate": 1.7761194029850748e-05, "loss": 0.615, "step": 150 }, { "epoch": 1.49, "learning_rate": 1.701492537313433e-05, "loss": 0.542, "step": 200 }, { "epoch": 1.87, "learning_rate": 1.626865671641791e-05, "loss": 0.4815, "step": 250 }, { "epoch": 2.0, "eval_Macro F1": 0.7155645405318029, "eval_Macro Precision": 0.7388441683808017, "eval_Macro Recall": 0.7039245533319153, "eval_Micro F1": 0.7826697892271662, "eval_Micro Precision": 0.7826697892271662, "eval_Micro Recall": 0.7826697892271662, "eval_Weighted F1": 0.778931131467011, "eval_Weighted Precision": 0.7878024754296866, "eval_Weighted Recall": 0.7826697892271662, "eval_accuracy": 0.7826697892271662, "eval_loss": 0.3994453251361847, "eval_runtime": 570.0533, "eval_samples_per_second": 3.745, "eval_steps_per_second": 0.06, "step": 268 }, { "epoch": 2.24, "learning_rate": 1.5522388059701494e-05, "loss": 0.3774, "step": 300 }, { "epoch": 2.61, "learning_rate": 1.4776119402985077e-05, "loss": 0.3366, "step": 350 }, { "epoch": 2.99, "learning_rate": 1.4029850746268658e-05, "loss": 0.314, "step": 400 }, { "epoch": 3.0, "eval_Macro F1": 0.736751489500019, "eval_Macro Precision": 0.7612057314604446, "eval_Macro Recall": 0.7252037377440934, "eval_Micro F1": 0.7990632318501172, "eval_Micro Precision": 0.7990632318501171, "eval_Micro Recall": 0.7990632318501171, "eval_Weighted F1": 0.7977313198767033, "eval_Weighted Precision": 0.8100534851227623, "eval_Weighted Recall": 0.7990632318501171, "eval_accuracy": 0.7990632318501171, "eval_loss": 0.3560428321361542, "eval_runtime": 581.4066, "eval_samples_per_second": 3.672, "eval_steps_per_second": 0.058, "step": 402 }, { "epoch": 3.36, "learning_rate": 1.328358208955224e-05, "loss": 0.2486, "step": 450 }, { "epoch": 3.73, "learning_rate": 1.2537313432835823e-05, "loss": 0.235, "step": 500 }, { "epoch": 4.0, "eval_Macro F1": 0.7548578890974982, "eval_Macro Precision": 0.7630930133664333, "eval_Macro Recall": 0.7508943526446905, "eval_Micro F1": 0.8201405152224824, "eval_Micro Precision": 0.8201405152224824, "eval_Micro Recall": 0.8201405152224824, "eval_Weighted F1": 0.8217495227304409, "eval_Weighted Precision": 0.8273969119402248, "eval_Weighted Recall": 0.8201405152224824, "eval_accuracy": 0.8201405152224824, "eval_loss": 0.32777392864227295, "eval_runtime": 571.7549, "eval_samples_per_second": 3.734, "eval_steps_per_second": 0.059, "step": 536 }, { "epoch": 4.1, "learning_rate": 1.1791044776119405e-05, "loss": 0.2309, "step": 550 }, { "epoch": 4.48, "learning_rate": 1.1044776119402986e-05, "loss": 0.188, "step": 600 }, { "epoch": 4.85, "learning_rate": 1.029850746268657e-05, "loss": 0.1986, "step": 650 }, { "epoch": 5.0, "eval_Macro F1": 0.8208742913000978, "eval_Macro Precision": 0.8083647050243598, "eval_Macro Recall": 0.8400854990635674, "eval_Micro F1": 0.8618266978922716, "eval_Micro Precision": 0.8618266978922716, "eval_Micro Recall": 0.8618266978922716, "eval_Weighted F1": 0.8655209539834394, "eval_Weighted Precision": 0.8723242107411118, "eval_Weighted Recall": 0.8618266978922716, "eval_accuracy": 0.8618266978922716, "eval_loss": 0.3573662042617798, "eval_runtime": 572.7753, "eval_samples_per_second": 3.727, "eval_steps_per_second": 0.059, "step": 670 }, { "epoch": 5.22, "learning_rate": 9.552238805970149e-06, "loss": 0.1838, "step": 700 }, { "epoch": 5.6, "learning_rate": 8.805970149253732e-06, "loss": 0.1485, "step": 750 }, { "epoch": 5.97, "learning_rate": 8.059701492537314e-06, "loss": 0.1605, "step": 800 }, { "epoch": 6.0, "eval_Macro F1": 0.6588158445976257, "eval_Macro Precision": 0.6987220074939374, "eval_Macro Recall": 0.6469038522815648, "eval_Micro F1": 0.7995316159250586, "eval_Micro Precision": 0.7995316159250585, "eval_Micro Recall": 0.7995316159250585, "eval_Weighted F1": 0.7803428354754396, "eval_Weighted Precision": 0.778138163263271, "eval_Weighted Recall": 0.7995316159250585, "eval_accuracy": 0.7995316159250585, "eval_loss": 0.3885968029499054, "eval_runtime": 571.7311, "eval_samples_per_second": 3.734, "eval_steps_per_second": 0.059, "step": 804 }, { "epoch": 6.34, "learning_rate": 7.313432835820896e-06, "loss": 0.1425, "step": 850 }, { "epoch": 6.72, "learning_rate": 6.567164179104478e-06, "loss": 0.1436, "step": 900 }, { "epoch": 7.0, "eval_Macro F1": 0.7442069309467508, "eval_Macro Precision": 0.7576208137220202, "eval_Macro Recall": 0.7336057451045414, "eval_Micro F1": 0.8229508196721311, "eval_Micro Precision": 0.8229508196721311, "eval_Micro Recall": 0.8229508196721311, "eval_Weighted F1": 0.820676653014847, "eval_Weighted Precision": 0.8209948655272054, "eval_Weighted Recall": 0.8229508196721311, "eval_accuracy": 0.8229508196721311, "eval_loss": 0.4039975702762604, "eval_runtime": 571.7322, "eval_samples_per_second": 3.734, "eval_steps_per_second": 0.059, "step": 938 }, { "epoch": 7.09, "learning_rate": 5.820895522388061e-06, "loss": 0.1368, "step": 950 }, { "epoch": 7.46, "learning_rate": 5.074626865671642e-06, "loss": 0.1253, "step": 1000 }, { "epoch": 7.84, "learning_rate": 4.3283582089552236e-06, "loss": 0.1373, "step": 1050 }, { "epoch": 8.0, "eval_Macro F1": 0.7123175103612404, "eval_Macro Precision": 0.7322548905353868, "eval_Macro Recall": 0.7019914283796879, "eval_Micro F1": 0.8168618266978923, "eval_Micro Precision": 0.8168618266978923, "eval_Micro Recall": 0.8168618266978923, "eval_Weighted F1": 0.807557064029797, "eval_Weighted Precision": 0.8030050439721781, "eval_Weighted Recall": 0.8168618266978923, "eval_accuracy": 0.8168618266978923, "eval_loss": 0.4517393112182617, "eval_runtime": 571.7202, "eval_samples_per_second": 3.734, "eval_steps_per_second": 0.059, "step": 1072 }, { "epoch": 8.21, "learning_rate": 3.582089552238806e-06, "loss": 0.1206, "step": 1100 }, { "epoch": 8.58, "learning_rate": 2.835820895522388e-06, "loss": 0.1141, "step": 1150 }, { "epoch": 8.96, "learning_rate": 2.08955223880597e-06, "loss": 0.1271, "step": 1200 }, { "epoch": 9.0, "eval_Macro F1": 0.6891590047543085, "eval_Macro Precision": 0.7169021915882458, "eval_Macro Recall": 0.6768345177275865, "eval_Micro F1": 0.8070257611241218, "eval_Micro Precision": 0.8070257611241218, "eval_Micro Recall": 0.8070257611241218, "eval_Weighted F1": 0.7944945373911929, "eval_Weighted Precision": 0.790593845937712, "eval_Weighted Recall": 0.8070257611241218, "eval_accuracy": 0.8070257611241218, "eval_loss": 0.45325130224227905, "eval_runtime": 593.452, "eval_samples_per_second": 3.598, "eval_steps_per_second": 0.057, "step": 1206 }, { "epoch": 9.33, "learning_rate": 1.3432835820895524e-06, "loss": 0.1171, "step": 1250 }, { "epoch": 9.7, "learning_rate": 5.970149253731343e-07, "loss": 0.1199, "step": 1300 }, { "epoch": 10.0, "eval_Macro F1": 0.7368644623841439, "eval_Macro Precision": 0.7514878901301887, "eval_Macro Recall": 0.726942967276122, "eval_Micro F1": 0.824824355971897, "eval_Micro Precision": 0.824824355971897, "eval_Micro Recall": 0.824824355971897, "eval_Weighted F1": 0.8193666524247488, "eval_Weighted Precision": 0.8163202759848958, "eval_Weighted Recall": 0.824824355971897, "eval_accuracy": 0.824824355971897, "eval_loss": 0.474141001701355, "eval_runtime": 569.2941, "eval_samples_per_second": 3.75, "eval_steps_per_second": 0.06, "step": 1340 }, { "epoch": 10.0, "step": 1340, "total_flos": 1.105606065652704e+16, "train_loss": 0.26616470564657185, "train_runtime": 95644.4856, "train_samples_per_second": 0.892, "train_steps_per_second": 0.014 } ], "max_steps": 1340, "num_train_epochs": 10, "total_flos": 1.105606065652704e+16, "trial_name": null, "trial_params": null }