🔄 Incremental importance | Acc: 0.750, F1: 0.468

Browse files

Files changed (10) hide show

README.md +9 -9
{checkpoint-40 → checkpoint-54}/config.json +0 -0
{checkpoint-40 → checkpoint-54}/model.safetensors +1 -1
{checkpoint-40 → checkpoint-54}/special_tokens_map.json +0 -0
{checkpoint-40 → checkpoint-54}/tokenizer.json +0 -0
{checkpoint-40 → checkpoint-54}/tokenizer_config.json +0 -0
{checkpoint-40 → checkpoint-54}/trainer_state.json +58 -36
{checkpoint-40 → checkpoint-54}/vocab.txt +0 -0
model.safetensors +1 -1
training_args.bin +1 -1

README.md CHANGED Viewed

@@ -20,17 +20,17 @@ Fine-tuned FinBERT model for financial importance analysis in TradePulse.
 ## Performance
-*Last training: 2025-07-16 06:55*
-*Dataset: `news_20250716.csv` (214 samples)*
 | Metric | Value |
 |--------|-------|
-| Loss | 1.9563 |
-| Accuracy | 0.6481 |
-| F1 Score | 0.6376 |
-| F1 Macro | 0.4353 |
-| Precision | 0.6685 |
-| Recall | 0.6481 |
 ## Training Details
@@ -59,4 +59,4 @@ predictions = outputs.logits.softmax(dim=-1)
 ## Model Card Authors
 - TradePulse ML Team
-- Auto-generated on 2025-07-16 06:55:39

 ## Performance
+*Last training: 2025-07-17 13:34*
+*Dataset: `news_20250717.csv` (142 samples)*
 | Metric | Value |
 |--------|-------|
+| Loss | 0.8034 |
+| Accuracy | 0.7222 |
+| F1 Score | 0.6776 |
+| F1 Macro | 0.7024 |
+| Precision | 0.6819 |
+| Recall | 0.7222 |
 ## Training Details
 ## Model Card Authors
 - TradePulse ML Team
+- Auto-generated on 2025-07-17 13:34:20

{checkpoint-40 → checkpoint-54}/config.json RENAMED Viewed

File without changes

{checkpoint-40 → checkpoint-54}/model.safetensors RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c7317c601691b02a030c5214c45334acbe36778068e0340cfe791923d599c2c2
 size 439039996

 version https://git-lfs.github.com/spec/v1
+oid sha256:c5f69416f12d48d75db96ab4b07e52fe52522972d4bd436defe00a32efe7e4c0
 size 439039996

{checkpoint-40 → checkpoint-54}/special_tokens_map.json RENAMED Viewed

File without changes

{checkpoint-40 → checkpoint-54}/tokenizer.json RENAMED Viewed

File without changes

{checkpoint-40 → checkpoint-54}/tokenizer_config.json RENAMED Viewed

File without changes

{checkpoint-40 → checkpoint-54}/trainer_state.json RENAMED Viewed

@@ -1,59 +1,81 @@
 {
-  "best_metric": 0.6376050420168068,
-  "best_model_checkpoint": "hf-importance-production/checkpoint-40",
-  "epoch": 1.0,
   "eval_steps": 500,
-  "global_step": 40,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
-      "epoch": 0.25,
-      "grad_norm": 35.63239288330078,
-      "learning_rate": 2.5e-06,
-      "loss": 1.8605,
       "step": 10
     },
     {
-      "epoch": 0.5,
-      "grad_norm": 27.44408416748047,
-      "learning_rate": 5e-06,
-      "loss": 1.5892,
       "step": 20
     },
     {
-      "epoch": 0.75,
-      "grad_norm": 34.42560958862305,
-      "learning_rate": 7.500000000000001e-06,
-      "loss": 1.3163,
       "step": 30
     },
     {
-      "epoch": 1.0,
-      "grad_norm": 78.49942016601562,
-      "learning_rate": 1e-05,
-      "loss": 2.0013,
       "step": 40
     },
     {
-      "epoch": 1.0,
-      "eval_accuracy": 0.6481481481481481,
-      "eval_f1": 0.6376050420168068,
-      "eval_f1_macro": 0.4353408029878618,
-      "eval_loss": 1.9562698602676392,
-      "eval_precision": 0.6685105018438351,
-      "eval_precision_macro": 0.44588744588744583,
-      "eval_recall": 0.6481481481481481,
-      "eval_recall_macro": 0.45314009661835747,
-      "eval_runtime": 30.1459,
-      "eval_samples_per_second": 1.791,
-      "eval_steps_per_second": 0.464,
-      "step": 40
     }
   ],
   "logging_steps": 10,
-  "max_steps": 80,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 2,
   "save_steps": 500,
@@ -73,12 +95,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }
   },
-  "total_flos": 42098146836480.0,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null

 {
+  "best_metric": 0.6775793650793651,
+  "best_model_checkpoint": "hf-importance-production/checkpoint-54",
+  "epoch": 2.0,
   "eval_steps": 500,
+  "global_step": 54,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
+      "epoch": 0.37037037037037035,
+      "grad_norm": 43.338623046875,
+      "learning_rate": 3.846153846153847e-06,
+      "loss": 1.1141,
       "step": 10
     },
     {
+      "epoch": 0.7407407407407407,
+      "grad_norm": 5.277134895324707,
+      "learning_rate": 7.692307692307694e-06,
+      "loss": 1.1598,
       "step": 20
     },
     {
+      "epoch": 1.0,
+      "eval_accuracy": 0.6944444444444444,
+      "eval_f1": 0.6309416704153546,
+      "eval_f1_macro": 0.6536212325686009,
+      "eval_loss": 1.1927357912063599,
+      "eval_precision": 0.6195023148148148,
+      "eval_precision_macro": 0.6840277777777777,
+      "eval_recall": 0.6944444444444444,
+      "eval_recall_macro": 0.6733333333333333,
+      "eval_runtime": 20.0468,
+      "eval_samples_per_second": 1.796,
+      "eval_steps_per_second": 0.449,
+      "step": 27
+    },
+    {
+      "epoch": 1.1111111111111112,
+      "grad_norm": 4.237745761871338,
+      "learning_rate": 8.571428571428571e-06,
+      "loss": 1.0568,
       "step": 30
     },
     {
+      "epoch": 1.4814814814814814,
+      "grad_norm": 1.0734100341796875,
+      "learning_rate": 5e-06,
+      "loss": 0.4549,
       "step": 40
     },
     {
+      "epoch": 1.8518518518518519,
+      "grad_norm": 17.751998901367188,
+      "learning_rate": 1.4285714285714286e-06,
+      "loss": 0.9042,
+      "step": 50
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.7222222222222222,
+      "eval_f1": 0.6775793650793651,
+      "eval_f1_macro": 0.7023809523809524,
+      "eval_loss": 0.8034341335296631,
+      "eval_precision": 0.6818996415770608,
+      "eval_precision_macro": 0.7473118279569894,
+      "eval_recall": 0.7222222222222222,
+      "eval_recall_macro": 0.7066666666666667,
+      "eval_runtime": 20.008,
+      "eval_samples_per_second": 1.799,
+      "eval_steps_per_second": 0.45,
+      "step": 54
     }
   ],
   "logging_steps": 10,
+  "max_steps": 54,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 2,
   "save_steps": 500,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }
   },
+  "total_flos": 55780044558336.0,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null

{checkpoint-40 → checkpoint-54}/vocab.txt RENAMED Viewed

File without changes

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c7317c601691b02a030c5214c45334acbe36778068e0340cfe791923d599c2c2
 size 439039996

 version https://git-lfs.github.com/spec/v1
+oid sha256:c5f69416f12d48d75db96ab4b07e52fe52522972d4bd436defe00a32efe7e4c0
 size 439039996

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2f15beae061f900df55a72593a0d6e94a0aa87b4abafd58adf1bf7ac2a4b64f9
 size 5521

 version https://git-lfs.github.com/spec/v1
+oid sha256:b6bbac70dcc30ea2489bf42b0b6da04b30b625b4819082efc3a718b014a9e877
 size 5521