🔄 Incremental importance | Acc: 0.812, F1: 0.560

Browse files

Files changed (10) hide show

README.md +9 -9
{checkpoint-18 → checkpoint-52}/config.json +0 -0
{checkpoint-18 → checkpoint-52}/model.safetensors +1 -1
{checkpoint-18 → checkpoint-52}/special_tokens_map.json +0 -0
{checkpoint-18 → checkpoint-52}/tokenizer.json +0 -0
{checkpoint-18 → checkpoint-52}/tokenizer_config.json +0 -0
{checkpoint-18 → checkpoint-52}/trainer_state.json +62 -34
{checkpoint-18 → checkpoint-52}/vocab.txt +0 -0
model.safetensors +1 -1
training_args.bin +1 -1

README.md CHANGED Viewed

@@ -20,17 +20,17 @@ Fine-tuned FinBERT model for financial importance analysis in TradePulse.
 ## Performance
-*Last training: 2025-07-09 16:17*
-*Dataset: `news_20250709.csv` (46 samples)*
 | Metric | Value |
 |--------|-------|
-| Loss | 1.6092 |
-| Accuracy | 0.8333 |
-| F1 Score | 0.7989 |
-| F1 Macro | 0.7989 |
-| Precision | 0.7917 |
-| Recall | 0.8333 |
 ## Training Details
@@ -59,4 +59,4 @@ predictions = outputs.logits.softmax(dim=-1)
 ## Model Card Authors
 - TradePulse ML Team
-- Auto-generated on 2025-07-09 16:17:17

 ## Performance
+*Last training: 2025-07-10 09:11*
+*Dataset: `news_20250710.csv` (138 samples)*
 | Metric | Value |
 |--------|-------|
+| Loss | 0.0703 |
+| Accuracy | 0.9714 |
+| F1 Score | 0.9758 |
+| F1 Macro | 0.8794 |
+| Precision | 0.9857 |
+| Recall | 0.9714 |
 ## Training Details
 ## Model Card Authors
 - TradePulse ML Team
+- Auto-generated on 2025-07-10 09:11:15

{checkpoint-18 → checkpoint-52}/config.json RENAMED Viewed

File without changes

{checkpoint-18 → checkpoint-52}/model.safetensors RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1b3dabca8d8e63ed66cfb9eb1910581f8f656f01b7cba193238cfe67ce50d181
 size 439039996

 version https://git-lfs.github.com/spec/v1
+oid sha256:ae4c5c9032b9108afe5cd8569212b5eee6a8bc68a8b592e27c95b758887b4834
 size 439039996

{checkpoint-18 → checkpoint-52}/special_tokens_map.json RENAMED Viewed

File without changes

{checkpoint-18 → checkpoint-52}/tokenizer.json RENAMED Viewed

File without changes

{checkpoint-18 → checkpoint-52}/tokenizer_config.json RENAMED Viewed

File without changes

{checkpoint-18 → checkpoint-52}/trainer_state.json RENAMED Viewed

@@ -1,53 +1,81 @@
 {
-  "best_metric": 0.798941798941799,
-  "best_model_checkpoint": "hf-importance-production/checkpoint-18",
   "epoch": 2.0,
   "eval_steps": 500,
-  "global_step": 18,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
-      "epoch": 1.0,
-      "eval_accuracy": 0.75,
-      "eval_f1": 0.7125,
-      "eval_f1_macro": 0.5166666666666667,
-      "eval_loss": 2.042041540145874,
-      "eval_precision": 0.75,
-      "eval_precision_macro": 0.5555555555555555,
-      "eval_recall": 0.75,
-      "eval_recall_macro": 0.5333333333333333,
-      "eval_runtime": 6.64,
-      "eval_samples_per_second": 1.807,
-      "eval_steps_per_second": 0.452,
-      "step": 9
     },
     {
-      "epoch": 1.1111111111111112,
-      "grad_norm": 0.657223641872406,
       "learning_rate": 8.000000000000001e-06,
-      "loss": 1.2448,
-      "step": 10
     },
     {
       "epoch": 2.0,
-      "eval_accuracy": 0.8333333333333334,
-      "eval_f1": 0.798941798941799,
-      "eval_f1_macro": 0.582010582010582,
-      "eval_loss": 1.6091957092285156,
-      "eval_precision": 0.7916666666666666,
-      "eval_precision_macro": 0.5833333333333334,
-      "eval_recall": 0.8333333333333334,
-      "eval_recall_macro": 0.6,
-      "eval_runtime": 6.6395,
-      "eval_samples_per_second": 1.807,
-      "eval_steps_per_second": 0.452,
-      "step": 18
     }
   ],
   "logging_steps": 10,
-  "max_steps": 18,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 2,
   "save_steps": 500,
@@ -72,7 +100,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 17891712405504.0,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null

 {
+  "best_metric": 0.9757823129251698,
+  "best_model_checkpoint": "hf-importance-production/checkpoint-52",
   "epoch": 2.0,
   "eval_steps": 500,
+  "global_step": 52,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
+      "epoch": 0.38461538461538464,
+      "grad_norm": 0.08406942337751389,
+      "learning_rate": 4.000000000000001e-06,
+      "loss": 0.1652,
+      "step": 10
     },
     {
+      "epoch": 0.7692307692307693,
+      "grad_norm": 44.237098693847656,
       "learning_rate": 8.000000000000001e-06,
+      "loss": 0.2935,
+      "step": 20
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.9714285714285714,
+      "eval_f1": 0.9757296466973886,
+      "eval_f1_macro": 0.8781362007168458,
+      "eval_loss": 0.0774894431233406,
+      "eval_precision": 0.9857142857142858,
+      "eval_precision_macro": 0.8333333333333334,
+      "eval_recall": 0.9714285714285714,
+      "eval_recall_macro": 0.9791666666666666,
+      "eval_runtime": 19.4749,
+      "eval_samples_per_second": 1.797,
+      "eval_steps_per_second": 0.462,
+      "step": 26
+    },
+    {
+      "epoch": 1.1538461538461537,
+      "grad_norm": 0.001178277307190001,
+      "learning_rate": 8.148148148148148e-06,
+      "loss": 0.1045,
+      "step": 30
+    },
+    {
+      "epoch": 1.5384615384615383,
+      "grad_norm": 52.080684661865234,
+      "learning_rate": 4.444444444444444e-06,
+      "loss": 0.2248,
+      "step": 40
+    },
+    {
+      "epoch": 1.9230769230769231,
+      "grad_norm": 0.37515753507614136,
+      "learning_rate": 7.407407407407407e-07,
+      "loss": 0.1178,
+      "step": 50
     },
     {
       "epoch": 2.0,
+      "eval_accuracy": 0.9714285714285714,
+      "eval_f1": 0.9757823129251698,
+      "eval_f1_macro": 0.8793650793650793,
+      "eval_loss": 0.07033431529998779,
+      "eval_precision": 0.9857142857142858,
+      "eval_precision_macro": 0.8333333333333334,
+      "eval_recall": 0.9714285714285714,
+      "eval_recall_macro": 0.9814814814814815,
+      "eval_runtime": 19.6277,
+      "eval_samples_per_second": 1.783,
+      "eval_steps_per_second": 0.459,
+      "step": 52
     }
   ],
   "logging_steps": 10,
+  "max_steps": 52,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 2,
   "save_steps": 500,
       "attributes": {}
     }
   },
+  "total_flos": 54201364051968.0,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null

{checkpoint-18 → checkpoint-52}/vocab.txt RENAMED Viewed

File without changes

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1b3dabca8d8e63ed66cfb9eb1910581f8f656f01b7cba193238cfe67ce50d181
 size 439039996

 version https://git-lfs.github.com/spec/v1
+oid sha256:ae4c5c9032b9108afe5cd8569212b5eee6a8bc68a8b592e27c95b758887b4834
 size 439039996

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a3c99de83de5f22fdddae294ce3c58b232ced45309611f6aca8ad972a4b071c7
 size 5521

 version https://git-lfs.github.com/spec/v1
+oid sha256:46014ae489d03a5169b574c28a7d88c2ad6dab9de05cdb9d53a95b988c48d865
 size 5521