| { | |
| "best_metric": 0.8655209539834394, | |
| "best_model_checkpoint": "fnet-large-Financial_Sentiment_Analysis_v3/checkpoint-670", | |
| "epoch": 10.0, | |
| "global_step": 1340, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 0.01, | |
| "learning_rate": 1.9985074626865674e-05, | |
| "loss": 1.4558, | |
| "step": 1 | |
| }, | |
| { | |
| "epoch": 0.37, | |
| "learning_rate": 1.9253731343283585e-05, | |
| "loss": 0.81, | |
| "step": 50 | |
| }, | |
| { | |
| "epoch": 0.75, | |
| "learning_rate": 1.8507462686567165e-05, | |
| "loss": 0.6757, | |
| "step": 100 | |
| }, | |
| { | |
| "epoch": 1.0, | |
| "eval_Macro F1": 0.36279759177569026, | |
| "eval_Macro Precision": 0.5210381627879025, | |
| "eval_Macro Recall": 0.4297578136174626, | |
| "eval_Micro F1": 0.585480093676815, | |
| "eval_Micro Precision": 0.585480093676815, | |
| "eval_Micro Recall": 0.585480093676815, | |
| "eval_Weighted F1": 0.4739290274173566, | |
| "eval_Weighted Precision": 0.5912111905595777, | |
| "eval_Weighted Recall": 0.585480093676815, | |
| "eval_accuracy": 0.585480093676815, | |
| "eval_loss": 0.5890011787414551, | |
| "eval_runtime": 572.1521, | |
| "eval_samples_per_second": 3.732, | |
| "eval_steps_per_second": 0.059, | |
| "step": 134 | |
| }, | |
| { | |
| "epoch": 1.12, | |
| "learning_rate": 1.7761194029850748e-05, | |
| "loss": 0.615, | |
| "step": 150 | |
| }, | |
| { | |
| "epoch": 1.49, | |
| "learning_rate": 1.701492537313433e-05, | |
| "loss": 0.542, | |
| "step": 200 | |
| }, | |
| { | |
| "epoch": 1.87, | |
| "learning_rate": 1.626865671641791e-05, | |
| "loss": 0.4815, | |
| "step": 250 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_Macro F1": 0.7155645405318029, | |
| "eval_Macro Precision": 0.7388441683808017, | |
| "eval_Macro Recall": 0.7039245533319153, | |
| "eval_Micro F1": 0.7826697892271662, | |
| "eval_Micro Precision": 0.7826697892271662, | |
| "eval_Micro Recall": 0.7826697892271662, | |
| "eval_Weighted F1": 0.778931131467011, | |
| "eval_Weighted Precision": 0.7878024754296866, | |
| "eval_Weighted Recall": 0.7826697892271662, | |
| "eval_accuracy": 0.7826697892271662, | |
| "eval_loss": 0.3994453251361847, | |
| "eval_runtime": 570.0533, | |
| "eval_samples_per_second": 3.745, | |
| "eval_steps_per_second": 0.06, | |
| "step": 268 | |
| }, | |
| { | |
| "epoch": 2.24, | |
| "learning_rate": 1.5522388059701494e-05, | |
| "loss": 0.3774, | |
| "step": 300 | |
| }, | |
| { | |
| "epoch": 2.61, | |
| "learning_rate": 1.4776119402985077e-05, | |
| "loss": 0.3366, | |
| "step": 350 | |
| }, | |
| { | |
| "epoch": 2.99, | |
| "learning_rate": 1.4029850746268658e-05, | |
| "loss": 0.314, | |
| "step": 400 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_Macro F1": 0.736751489500019, | |
| "eval_Macro Precision": 0.7612057314604446, | |
| "eval_Macro Recall": 0.7252037377440934, | |
| "eval_Micro F1": 0.7990632318501172, | |
| "eval_Micro Precision": 0.7990632318501171, | |
| "eval_Micro Recall": 0.7990632318501171, | |
| "eval_Weighted F1": 0.7977313198767033, | |
| "eval_Weighted Precision": 0.8100534851227623, | |
| "eval_Weighted Recall": 0.7990632318501171, | |
| "eval_accuracy": 0.7990632318501171, | |
| "eval_loss": 0.3560428321361542, | |
| "eval_runtime": 581.4066, | |
| "eval_samples_per_second": 3.672, | |
| "eval_steps_per_second": 0.058, | |
| "step": 402 | |
| }, | |
| { | |
| "epoch": 3.36, | |
| "learning_rate": 1.328358208955224e-05, | |
| "loss": 0.2486, | |
| "step": 450 | |
| }, | |
| { | |
| "epoch": 3.73, | |
| "learning_rate": 1.2537313432835823e-05, | |
| "loss": 0.235, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_Macro F1": 0.7548578890974982, | |
| "eval_Macro Precision": 0.7630930133664333, | |
| "eval_Macro Recall": 0.7508943526446905, | |
| "eval_Micro F1": 0.8201405152224824, | |
| "eval_Micro Precision": 0.8201405152224824, | |
| "eval_Micro Recall": 0.8201405152224824, | |
| "eval_Weighted F1": 0.8217495227304409, | |
| "eval_Weighted Precision": 0.8273969119402248, | |
| "eval_Weighted Recall": 0.8201405152224824, | |
| "eval_accuracy": 0.8201405152224824, | |
| "eval_loss": 0.32777392864227295, | |
| "eval_runtime": 571.7549, | |
| "eval_samples_per_second": 3.734, | |
| "eval_steps_per_second": 0.059, | |
| "step": 536 | |
| }, | |
| { | |
| "epoch": 4.1, | |
| "learning_rate": 1.1791044776119405e-05, | |
| "loss": 0.2309, | |
| "step": 550 | |
| }, | |
| { | |
| "epoch": 4.48, | |
| "learning_rate": 1.1044776119402986e-05, | |
| "loss": 0.188, | |
| "step": 600 | |
| }, | |
| { | |
| "epoch": 4.85, | |
| "learning_rate": 1.029850746268657e-05, | |
| "loss": 0.1986, | |
| "step": 650 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_Macro F1": 0.8208742913000978, | |
| "eval_Macro Precision": 0.8083647050243598, | |
| "eval_Macro Recall": 0.8400854990635674, | |
| "eval_Micro F1": 0.8618266978922716, | |
| "eval_Micro Precision": 0.8618266978922716, | |
| "eval_Micro Recall": 0.8618266978922716, | |
| "eval_Weighted F1": 0.8655209539834394, | |
| "eval_Weighted Precision": 0.8723242107411118, | |
| "eval_Weighted Recall": 0.8618266978922716, | |
| "eval_accuracy": 0.8618266978922716, | |
| "eval_loss": 0.3573662042617798, | |
| "eval_runtime": 572.7753, | |
| "eval_samples_per_second": 3.727, | |
| "eval_steps_per_second": 0.059, | |
| "step": 670 | |
| }, | |
| { | |
| "epoch": 5.22, | |
| "learning_rate": 9.552238805970149e-06, | |
| "loss": 0.1838, | |
| "step": 700 | |
| }, | |
| { | |
| "epoch": 5.6, | |
| "learning_rate": 8.805970149253732e-06, | |
| "loss": 0.1485, | |
| "step": 750 | |
| }, | |
| { | |
| "epoch": 5.97, | |
| "learning_rate": 8.059701492537314e-06, | |
| "loss": 0.1605, | |
| "step": 800 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_Macro F1": 0.6588158445976257, | |
| "eval_Macro Precision": 0.6987220074939374, | |
| "eval_Macro Recall": 0.6469038522815648, | |
| "eval_Micro F1": 0.7995316159250586, | |
| "eval_Micro Precision": 0.7995316159250585, | |
| "eval_Micro Recall": 0.7995316159250585, | |
| "eval_Weighted F1": 0.7803428354754396, | |
| "eval_Weighted Precision": 0.778138163263271, | |
| "eval_Weighted Recall": 0.7995316159250585, | |
| "eval_accuracy": 0.7995316159250585, | |
| "eval_loss": 0.3885968029499054, | |
| "eval_runtime": 571.7311, | |
| "eval_samples_per_second": 3.734, | |
| "eval_steps_per_second": 0.059, | |
| "step": 804 | |
| }, | |
| { | |
| "epoch": 6.34, | |
| "learning_rate": 7.313432835820896e-06, | |
| "loss": 0.1425, | |
| "step": 850 | |
| }, | |
| { | |
| "epoch": 6.72, | |
| "learning_rate": 6.567164179104478e-06, | |
| "loss": 0.1436, | |
| "step": 900 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "eval_Macro F1": 0.7442069309467508, | |
| "eval_Macro Precision": 0.7576208137220202, | |
| "eval_Macro Recall": 0.7336057451045414, | |
| "eval_Micro F1": 0.8229508196721311, | |
| "eval_Micro Precision": 0.8229508196721311, | |
| "eval_Micro Recall": 0.8229508196721311, | |
| "eval_Weighted F1": 0.820676653014847, | |
| "eval_Weighted Precision": 0.8209948655272054, | |
| "eval_Weighted Recall": 0.8229508196721311, | |
| "eval_accuracy": 0.8229508196721311, | |
| "eval_loss": 0.4039975702762604, | |
| "eval_runtime": 571.7322, | |
| "eval_samples_per_second": 3.734, | |
| "eval_steps_per_second": 0.059, | |
| "step": 938 | |
| }, | |
| { | |
| "epoch": 7.09, | |
| "learning_rate": 5.820895522388061e-06, | |
| "loss": 0.1368, | |
| "step": 950 | |
| }, | |
| { | |
| "epoch": 7.46, | |
| "learning_rate": 5.074626865671642e-06, | |
| "loss": 0.1253, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 7.84, | |
| "learning_rate": 4.3283582089552236e-06, | |
| "loss": 0.1373, | |
| "step": 1050 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "eval_Macro F1": 0.7123175103612404, | |
| "eval_Macro Precision": 0.7322548905353868, | |
| "eval_Macro Recall": 0.7019914283796879, | |
| "eval_Micro F1": 0.8168618266978923, | |
| "eval_Micro Precision": 0.8168618266978923, | |
| "eval_Micro Recall": 0.8168618266978923, | |
| "eval_Weighted F1": 0.807557064029797, | |
| "eval_Weighted Precision": 0.8030050439721781, | |
| "eval_Weighted Recall": 0.8168618266978923, | |
| "eval_accuracy": 0.8168618266978923, | |
| "eval_loss": 0.4517393112182617, | |
| "eval_runtime": 571.7202, | |
| "eval_samples_per_second": 3.734, | |
| "eval_steps_per_second": 0.059, | |
| "step": 1072 | |
| }, | |
| { | |
| "epoch": 8.21, | |
| "learning_rate": 3.582089552238806e-06, | |
| "loss": 0.1206, | |
| "step": 1100 | |
| }, | |
| { | |
| "epoch": 8.58, | |
| "learning_rate": 2.835820895522388e-06, | |
| "loss": 0.1141, | |
| "step": 1150 | |
| }, | |
| { | |
| "epoch": 8.96, | |
| "learning_rate": 2.08955223880597e-06, | |
| "loss": 0.1271, | |
| "step": 1200 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "eval_Macro F1": 0.6891590047543085, | |
| "eval_Macro Precision": 0.7169021915882458, | |
| "eval_Macro Recall": 0.6768345177275865, | |
| "eval_Micro F1": 0.8070257611241218, | |
| "eval_Micro Precision": 0.8070257611241218, | |
| "eval_Micro Recall": 0.8070257611241218, | |
| "eval_Weighted F1": 0.7944945373911929, | |
| "eval_Weighted Precision": 0.790593845937712, | |
| "eval_Weighted Recall": 0.8070257611241218, | |
| "eval_accuracy": 0.8070257611241218, | |
| "eval_loss": 0.45325130224227905, | |
| "eval_runtime": 593.452, | |
| "eval_samples_per_second": 3.598, | |
| "eval_steps_per_second": 0.057, | |
| "step": 1206 | |
| }, | |
| { | |
| "epoch": 9.33, | |
| "learning_rate": 1.3432835820895524e-06, | |
| "loss": 0.1171, | |
| "step": 1250 | |
| }, | |
| { | |
| "epoch": 9.7, | |
| "learning_rate": 5.970149253731343e-07, | |
| "loss": 0.1199, | |
| "step": 1300 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "eval_Macro F1": 0.7368644623841439, | |
| "eval_Macro Precision": 0.7514878901301887, | |
| "eval_Macro Recall": 0.726942967276122, | |
| "eval_Micro F1": 0.824824355971897, | |
| "eval_Micro Precision": 0.824824355971897, | |
| "eval_Micro Recall": 0.824824355971897, | |
| "eval_Weighted F1": 0.8193666524247488, | |
| "eval_Weighted Precision": 0.8163202759848958, | |
| "eval_Weighted Recall": 0.824824355971897, | |
| "eval_accuracy": 0.824824355971897, | |
| "eval_loss": 0.474141001701355, | |
| "eval_runtime": 569.2941, | |
| "eval_samples_per_second": 3.75, | |
| "eval_steps_per_second": 0.06, | |
| "step": 1340 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "step": 1340, | |
| "total_flos": 1.105606065652704e+16, | |
| "train_loss": 0.26616470564657185, | |
| "train_runtime": 95644.4856, | |
| "train_samples_per_second": 0.892, | |
| "train_steps_per_second": 0.014 | |
| } | |
| ], | |
| "max_steps": 1340, | |
| "num_train_epochs": 10, | |
| "total_flos": 1.105606065652704e+16, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |