Bencode92 committed on
Commit
0ce764b
·
1 Parent(s): 139952c

🔄 Incremental importance | Acc: 0.762, F1: 0.499

Browse files
README.md CHANGED
@@ -21,19 +21,19 @@ Fine-tuned FinBERT model for financial importance analysis in TradePulse.
21
 
22
  ## Performance
23
 
24
- *Last training: 2025-07-25 15:44*
25
- *Dataset: `news_20250725.csv` (202 samples)*
26
 
27
  | Metric | Value |
28
  |--------|-------|
29
- | Loss | 1.7456 |
30
- | Accuracy | 0.7451 |
31
- | F1 Score | 0.7395 |
32
 
33
- | F1 Macro | 0.7395 |
34
 
35
- | Precision | 0.7354 |
36
- | Recall | 0.7451 |
37
 
38
  ## Training Details
39
 
@@ -65,4 +65,4 @@ predictions = outputs.logits.softmax(dim=-1)
65
  ## Model Card Authors
66
 
67
  - TradePulse ML Team
68
- - Auto-generated on 2025-07-25 15:44:54
 
21
 
22
  ## Performance
23
 
24
+ *Last training: 2025-07-26 17:59*
25
+ *Dataset: `news_20250726.csv` (186 samples)*
26
 
27
  | Metric | Value |
28
  |--------|-------|
29
+ | Loss | 1.1184 |
30
+ | Accuracy | 0.7021 |
31
+ | F1 Score | 0.6383 |
32
 
33
+ | F1 Macro | 0.3615 |
34
 
35
+ | Precision | 0.6169 |
36
+ | Recall | 0.7021 |
37
 
38
  ## Training Details
39
 
 
65
  ## Model Card Authors
66
 
67
  - TradePulse ML Team
68
+ - Auto-generated on 2025-07-26 17:59:14
{checkpoint-38 → checkpoint-70}/config.json RENAMED
File without changes
{checkpoint-38 → checkpoint-70}/model.safetensors RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e797b4cfa01182c3d339ebe75e46e9f81dd739c15a145eef2574a40e5e702688
3
  size 439039996
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4087bd081287dc33455f8706cdab2450b8a56b2fbbe6d1535ab736e2d2e4d5b
3
  size 439039996
{checkpoint-38 → checkpoint-70}/special_tokens_map.json RENAMED
File without changes
{checkpoint-38 → checkpoint-70}/tokenizer.json RENAMED
File without changes
{checkpoint-38 → checkpoint-70}/tokenizer_config.json RENAMED
File without changes
{checkpoint-38 → checkpoint-70}/trainer_state.json RENAMED
@@ -1,52 +1,95 @@
1
  {
2
- "best_metric": 0.7394630366766589,
3
- "best_model_checkpoint": "hf-importance-production/checkpoint-38",
4
- "epoch": 1.0,
5
  "eval_steps": 500,
6
- "global_step": 38,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.2631578947368421,
13
- "grad_norm": 55.620182037353516,
14
- "learning_rate": 2.702702702702703e-06,
15
- "loss": 2.4772,
16
  "step": 10
17
  },
18
  {
19
- "epoch": 0.5263157894736842,
20
- "grad_norm": 77.68924713134766,
21
- "learning_rate": 5.405405405405406e-06,
22
- "loss": 2.5891,
23
  "step": 20
24
  },
25
  {
26
- "epoch": 0.7894736842105263,
27
- "grad_norm": 60.01732635498047,
28
- "learning_rate": 8.108108108108109e-06,
29
- "loss": 2.7644,
30
  "step": 30
31
  },
32
  {
33
  "epoch": 1.0,
34
- "eval_accuracy": 0.7450980392156863,
35
- "eval_f1": 0.7394630366766589,
36
- "eval_f1_macro": 0.492620439988861,
37
- "eval_loss": 1.7456282377243042,
38
- "eval_precision": 0.7354206198608476,
39
- "eval_precision_macro": 0.485483870967742,
40
- "eval_recall": 0.7450980392156863,
41
- "eval_recall_macro": 0.5011574074074074,
42
- "eval_runtime": 28.4033,
43
- "eval_samples_per_second": 1.796,
44
- "eval_steps_per_second": 0.458,
45
- "step": 38
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
46
  }
47
  ],
48
  "logging_steps": 10,
49
- "max_steps": 76,
50
  "num_input_tokens_seen": 0,
51
  "num_train_epochs": 2,
52
  "save_steps": 500,
@@ -66,12 +109,12 @@
66
  "should_evaluate": false,
67
  "should_log": false,
68
  "should_save": true,
69
- "should_training_stop": false
70
  },
71
  "attributes": {}
72
  }
73
  },
74
- "total_flos": 39730126076928.0,
75
  "train_batch_size": 4,
76
  "trial_name": null,
77
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.6383321617775644,
3
+ "best_model_checkpoint": "hf-importance-production/checkpoint-70",
4
+ "epoch": 2.0,
5
  "eval_steps": 500,
6
+ "global_step": 70,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.2857142857142857,
13
+ "grad_norm": 107.85406494140625,
14
+ "learning_rate": 2.9411764705882355e-06,
15
+ "loss": 3.316,
16
  "step": 10
17
  },
18
  {
19
+ "epoch": 0.5714285714285714,
20
+ "grad_norm": 41.05527877807617,
21
+ "learning_rate": 5.882352941176471e-06,
22
+ "loss": 2.2774,
23
  "step": 20
24
  },
25
  {
26
+ "epoch": 0.8571428571428571,
27
+ "grad_norm": 58.872947692871094,
28
+ "learning_rate": 8.823529411764707e-06,
29
+ "loss": 1.1755,
30
  "step": 30
31
  },
32
  {
33
  "epoch": 1.0,
34
+ "eval_accuracy": 0.6808510638297872,
35
+ "eval_f1": 0.5894736842105264,
36
+ "eval_f1_macro": 0.3163742690058479,
37
+ "eval_loss": 1.8137695789337158,
38
+ "eval_precision": 0.5647969052224372,
39
+ "eval_precision_macro": 0.34595959595959597,
40
+ "eval_recall": 0.6808510638297872,
41
+ "eval_recall_macro": 0.3506944444444444,
42
+ "eval_runtime": 26.1342,
43
+ "eval_samples_per_second": 1.798,
44
+ "eval_steps_per_second": 0.459,
45
+ "step": 35
46
+ },
47
+ {
48
+ "epoch": 1.1428571428571428,
49
+ "grad_norm": 62.1671142578125,
50
+ "learning_rate": 8.333333333333334e-06,
51
+ "loss": 2.2904,
52
+ "step": 40
53
+ },
54
+ {
55
+ "epoch": 1.4285714285714286,
56
+ "grad_norm": 87.3003921508789,
57
+ "learning_rate": 5.555555555555557e-06,
58
+ "loss": 0.7705,
59
+ "step": 50
60
+ },
61
+ {
62
+ "epoch": 1.7142857142857144,
63
+ "grad_norm": 58.54560470581055,
64
+ "learning_rate": 2.7777777777777783e-06,
65
+ "loss": 0.6563,
66
+ "step": 60
67
+ },
68
+ {
69
+ "epoch": 2.0,
70
+ "grad_norm": 4.384439468383789,
71
+ "learning_rate": 0.0,
72
+ "loss": 0.9612,
73
+ "step": 70
74
+ },
75
+ {
76
+ "epoch": 2.0,
77
+ "eval_accuracy": 0.7021276595744681,
78
+ "eval_f1": 0.6383321617775644,
79
+ "eval_f1_macro": 0.3615363953800698,
80
+ "eval_loss": 1.1184031963348389,
81
+ "eval_precision": 0.6169174883238194,
82
+ "eval_precision_macro": 0.38536585365853665,
83
+ "eval_recall": 0.7021276595744681,
84
+ "eval_recall_macro": 0.37847222222222227,
85
+ "eval_runtime": 26.1131,
86
+ "eval_samples_per_second": 1.8,
87
+ "eval_steps_per_second": 0.46,
88
+ "step": 70
89
  }
90
  ],
91
  "logging_steps": 10,
92
+ "max_steps": 70,
93
  "num_input_tokens_seen": 0,
94
  "num_train_epochs": 2,
95
  "save_steps": 500,
 
109
  "should_evaluate": false,
110
  "should_log": false,
111
  "should_save": true,
112
+ "should_training_stop": true
113
  },
114
  "attributes": {}
115
  }
116
  },
117
+ "total_flos": 73145530128384.0,
118
  "train_batch_size": 4,
119
  "trial_name": null,
120
  "trial_params": null
{checkpoint-38 → checkpoint-70}/vocab.txt RENAMED
File without changes
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e797b4cfa01182c3d339ebe75e46e9f81dd739c15a145eef2574a40e5e702688
3
  size 439039996
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4087bd081287dc33455f8706cdab2450b8a56b2fbbe6d1535ab736e2d2e4d5b
3
  size 439039996
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3b061dbe96085bccc3c91f3751222bd984561b8f688f02aae26349205f0e29f8
3
  size 5521
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:194a232eff0c1caf9732b79147ab47826ba935238e565d577007a4ee5ffdaec7
3
  size 5521