🔄 Incremental importance | Acc: 0.762, F1: 0.499

Browse files

Files changed (10) hide show

README.md +9 -9
{checkpoint-38 → checkpoint-70}/config.json +0 -0
{checkpoint-38 → checkpoint-70}/model.safetensors +1 -1
{checkpoint-38 → checkpoint-70}/special_tokens_map.json +0 -0
{checkpoint-38 → checkpoint-70}/tokenizer.json +0 -0
{checkpoint-38 → checkpoint-70}/tokenizer_config.json +0 -0
{checkpoint-38 → checkpoint-70}/trainer_state.json +74 -31
{checkpoint-38 → checkpoint-70}/vocab.txt +0 -0
model.safetensors +1 -1
training_args.bin +1 -1

README.md CHANGED Viewed

@@ -21,19 +21,19 @@ Fine-tuned FinBERT model for financial importance analysis in TradePulse.
 ## Performance
-*Last training: 2025-07-25 15:44*
-*Dataset: `news_20250725.csv` (202 samples)*
 | Metric | Value |
 |--------|-------|
-| Loss | 1.7456 |
-| Accuracy | 0.7451 |
-| F1 Score | 0.7395 |
-| F1 Macro | 0.7395 |
-| Precision | 0.7354 |
-| Recall | 0.7451 |
 ## Training Details
@@ -65,4 +65,4 @@ predictions = outputs.logits.softmax(dim=-1)
 ## Model Card Authors
 - TradePulse ML Team
-- Auto-generated on 2025-07-25 15:44:54

 ## Performance
+*Last training: 2025-07-26 17:59*
+*Dataset: `news_20250726.csv` (186 samples)*
 | Metric | Value |
 |--------|-------|
+| Loss | 1.1184 |
+| Accuracy | 0.7021 |
+| F1 Score | 0.6383 |
+| F1 Macro | 0.3615 |
+| Precision | 0.6169 |
+| Recall | 0.7021 |
 ## Training Details
 ## Model Card Authors
 - TradePulse ML Team
+- Auto-generated on 2025-07-26 17:59:14

{checkpoint-38 → checkpoint-70}/config.json RENAMED Viewed

File without changes

{checkpoint-38 → checkpoint-70}/model.safetensors RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e797b4cfa01182c3d339ebe75e46e9f81dd739c15a145eef2574a40e5e702688
 size 439039996

 version https://git-lfs.github.com/spec/v1
+oid sha256:a4087bd081287dc33455f8706cdab2450b8a56b2fbbe6d1535ab736e2d2e4d5b
 size 439039996

{checkpoint-38 → checkpoint-70}/special_tokens_map.json RENAMED Viewed

File without changes

{checkpoint-38 → checkpoint-70}/tokenizer.json RENAMED Viewed

File without changes

{checkpoint-38 → checkpoint-70}/tokenizer_config.json RENAMED Viewed

File without changes

{checkpoint-38 → checkpoint-70}/trainer_state.json RENAMED Viewed

@@ -1,52 +1,95 @@
 {
-  "best_metric": 0.7394630366766589,
-  "best_model_checkpoint": "hf-importance-production/checkpoint-38",
-  "epoch": 1.0,
   "eval_steps": 500,
-  "global_step": 38,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
-      "epoch": 0.2631578947368421,
-      "grad_norm": 55.620182037353516,
-      "learning_rate": 2.702702702702703e-06,
-      "loss": 2.4772,
       "step": 10
     },
     {
-      "epoch": 0.5263157894736842,
-      "grad_norm": 77.68924713134766,
-      "learning_rate": 5.405405405405406e-06,
-      "loss": 2.5891,
       "step": 20
     },
     {
-      "epoch": 0.7894736842105263,
-      "grad_norm": 60.01732635498047,
-      "learning_rate": 8.108108108108109e-06,
-      "loss": 2.7644,
       "step": 30
     },
     {
       "epoch": 1.0,
-      "eval_accuracy": 0.7450980392156863,
-      "eval_f1": 0.7394630366766589,
-      "eval_f1_macro": 0.492620439988861,
-      "eval_loss": 1.7456282377243042,
-      "eval_precision": 0.7354206198608476,
-      "eval_precision_macro": 0.485483870967742,
-      "eval_recall": 0.7450980392156863,
-      "eval_recall_macro": 0.5011574074074074,
-      "eval_runtime": 28.4033,
-      "eval_samples_per_second": 1.796,
-      "eval_steps_per_second": 0.458,
-      "step": 38
     }
   ],
   "logging_steps": 10,
-  "max_steps": 76,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 2,
   "save_steps": 500,
@@ -66,12 +109,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }
   },
-  "total_flos": 39730126076928.0,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null

 {
+  "best_metric": 0.6383321617775644,
+  "best_model_checkpoint": "hf-importance-production/checkpoint-70",
+  "epoch": 2.0,
   "eval_steps": 500,
+  "global_step": 70,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
+      "epoch": 0.2857142857142857,
+      "grad_norm": 107.85406494140625,
+      "learning_rate": 2.9411764705882355e-06,
+      "loss": 3.316,
       "step": 10
     },
     {
+      "epoch": 0.5714285714285714,
+      "grad_norm": 41.05527877807617,
+      "learning_rate": 5.882352941176471e-06,
+      "loss": 2.2774,
       "step": 20
     },
     {
+      "epoch": 0.8571428571428571,
+      "grad_norm": 58.872947692871094,
+      "learning_rate": 8.823529411764707e-06,
+      "loss": 1.1755,
       "step": 30
     },
     {
       "epoch": 1.0,
+      "eval_accuracy": 0.6808510638297872,
+      "eval_f1": 0.5894736842105264,
+      "eval_f1_macro": 0.3163742690058479,
+      "eval_loss": 1.8137695789337158,
+      "eval_precision": 0.5647969052224372,
+      "eval_precision_macro": 0.34595959595959597,
+      "eval_recall": 0.6808510638297872,
+      "eval_recall_macro": 0.3506944444444444,
+      "eval_runtime": 26.1342,
+      "eval_samples_per_second": 1.798,
+      "eval_steps_per_second": 0.459,
+      "step": 35
+    },
+    {
+      "epoch": 1.1428571428571428,
+      "grad_norm": 62.1671142578125,
+      "learning_rate": 8.333333333333334e-06,
+      "loss": 2.2904,
+      "step": 40
+    },
+    {
+      "epoch": 1.4285714285714286,
+      "grad_norm": 87.3003921508789,
+      "learning_rate": 5.555555555555557e-06,
+      "loss": 0.7705,
+      "step": 50
+    },
+    {
+      "epoch": 1.7142857142857144,
+      "grad_norm": 58.54560470581055,
+      "learning_rate": 2.7777777777777783e-06,
+      "loss": 0.6563,
+      "step": 60
+    },
+    {
+      "epoch": 2.0,
+      "grad_norm": 4.384439468383789,
+      "learning_rate": 0.0,
+      "loss": 0.9612,
+      "step": 70
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.7021276595744681,
+      "eval_f1": 0.6383321617775644,
+      "eval_f1_macro": 0.3615363953800698,
+      "eval_loss": 1.1184031963348389,
+      "eval_precision": 0.6169174883238194,
+      "eval_precision_macro": 0.38536585365853665,
+      "eval_recall": 0.7021276595744681,
+      "eval_recall_macro": 0.37847222222222227,
+      "eval_runtime": 26.1131,
+      "eval_samples_per_second": 1.8,
+      "eval_steps_per_second": 0.46,
+      "step": 70
     }
   ],
   "logging_steps": 10,
+  "max_steps": 70,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 2,
   "save_steps": 500,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }
   },
+  "total_flos": 73145530128384.0,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null

{checkpoint-38 → checkpoint-70}/vocab.txt RENAMED Viewed

File without changes

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e797b4cfa01182c3d339ebe75e46e9f81dd739c15a145eef2574a40e5e702688
 size 439039996

 version https://git-lfs.github.com/spec/v1
+oid sha256:a4087bd081287dc33455f8706cdab2450b8a56b2fbbe6d1535ab736e2d2e4d5b
 size 439039996

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3b061dbe96085bccc3c91f3751222bd984561b8f688f02aae26349205f0e29f8
 size 5521

 version https://git-lfs.github.com/spec/v1
+oid sha256:194a232eff0c1caf9732b79147ab47826ba935238e565d577007a4ee5ffdaec7
 size 5521