Bencode92 committed on
Commit
ffb163c
·
1 Parent(s): 7e76a53

🔄 Incremental importance | Acc: 0.803, F1: 0.662

Browse files
README.md CHANGED
@@ -21,19 +21,19 @@ Fine-tuned FinBERT model for financial importance analysis in TradePulse.
21
 
22
  ## Performance
23
 
24
- *Last training: 2025-07-29 09:32*
25
- *Dataset: `news_20250729.csv` (53 samples)*
26
 
27
  | Metric | Value |
28
  |--------|-------|
29
- | Loss | 2.5392 |
30
- | Accuracy | 0.6429 |
31
- | F1 Score | 0.5031 |
32
 
33
- | F1 Macro | 0.5031 |
34
 
35
- | Precision | 0.4133 |
36
- | Recall | 0.6429 |
37
 
38
  ## Training Details
39
 
@@ -65,4 +65,4 @@ predictions = outputs.logits.softmax(dim=-1)
65
  ## Model Card Authors
66
 
67
  - TradePulse ML Team
68
- - Auto-generated on 2025-07-29 09:32:10
 
21
 
22
  ## Performance
23
 
24
+ *Last training: 2025-07-29 13:33*
25
+ *Dataset: `base_reference.csv` (637 samples)*
26
 
27
  | Metric | Value |
28
  |--------|-------|
29
+ | Loss | 0.6551 |
30
+ | Accuracy | 0.8125 |
31
+ | F1 Score | 0.8127 |
32
 
33
+ | F1 Macro | 0.6772 |
34
 
35
+ | Precision | 0.8140 |
36
+ | Recall | 0.8125 |
37
 
38
  ## Training Details
39
 
 
65
  ## Model Card Authors
66
 
67
  - TradePulse ML Team
68
+ - Auto-generated on 2025-07-29 13:33:51
checkpoint-20/trainer_state.json DELETED
@@ -1,86 +0,0 @@
1
- {
2
- "best_metric": 0.5031055900621119,
3
- "best_model_checkpoint": "hf-importance-production/checkpoint-20",
4
- "epoch": 2.0,
5
- "eval_steps": 500,
6
- "global_step": 20,
7
- "is_hyper_param_search": false,
8
- "is_local_process_zero": true,
9
- "is_world_process_zero": true,
10
- "log_history": [
11
- {
12
- "epoch": 1.0,
13
- "grad_norm": 181.4758758544922,
14
- "learning_rate": 9.090909090909091e-06,
15
- "loss": 3.3705,
16
- "step": 10
17
- },
18
- {
19
- "epoch": 1.0,
20
- "eval_accuracy": 0.35714285714285715,
21
- "eval_f1": 0.3383458646616541,
22
- "eval_f1_macro": 0.17543859649122806,
23
- "eval_loss": 1.8454712629318237,
24
- "eval_precision": 0.32142857142857145,
25
- "eval_precision_macro": 0.16666666666666666,
26
- "eval_recall": 0.35714285714285715,
27
- "eval_recall_macro": 0.1851851851851852,
28
- "eval_runtime": 7.7174,
29
- "eval_samples_per_second": 1.814,
30
- "eval_steps_per_second": 0.518,
31
- "step": 10
32
- },
33
- {
34
- "epoch": 2.0,
35
- "grad_norm": 83.5034408569336,
36
- "learning_rate": 0.0,
37
- "loss": 1.439,
38
- "step": 20
39
- },
40
- {
41
- "epoch": 2.0,
42
- "eval_accuracy": 0.6428571428571429,
43
- "eval_f1": 0.5031055900621119,
44
- "eval_f1_macro": 0.2608695652173913,
45
- "eval_loss": 2.539227247238159,
46
- "eval_precision": 0.41326530612244905,
47
- "eval_precision_macro": 0.2142857142857143,
48
- "eval_recall": 0.6428571428571429,
49
- "eval_recall_macro": 0.3333333333333333,
50
- "eval_runtime": 7.725,
51
- "eval_samples_per_second": 1.812,
52
- "eval_steps_per_second": 0.518,
53
- "step": 20
54
- }
55
- ],
56
- "logging_steps": 10,
57
- "max_steps": 20,
58
- "num_input_tokens_seen": 0,
59
- "num_train_epochs": 2,
60
- "save_steps": 500,
61
- "stateful_callbacks": {
62
- "EarlyStoppingCallback": {
63
- "args": {
64
- "early_stopping_patience": 1,
65
- "early_stopping_threshold": 0.0
66
- },
67
- "attributes": {
68
- "early_stopping_patience_counter": 0
69
- }
70
- },
71
- "TrainerControl": {
72
- "args": {
73
- "should_epoch_stop": false,
74
- "should_evaluate": false,
75
- "should_log": false,
76
- "should_save": true,
77
- "should_training_stop": true
78
- },
79
- "attributes": {}
80
- }
81
- },
82
- "total_flos": 20522846582784.0,
83
- "train_batch_size": 4,
84
- "trial_name": null,
85
- "trial_params": null
86
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
{checkpoint-20 → checkpoint-240}/config.json RENAMED
File without changes
{checkpoint-20 → checkpoint-240}/model.safetensors RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9451c2dc524d02e41d47d82c6085a255f1022b0b351a2d0a6fb9dd8386e8ff77
3
  size 439039996
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5adf2aaa4fe85784e8bc042af10862ff3a302c4a368f116c0a5f33220511fc72
3
  size 439039996
{checkpoint-20 → checkpoint-240}/special_tokens_map.json RENAMED
File without changes
{checkpoint-20 → checkpoint-240}/tokenizer.json RENAMED
File without changes
{checkpoint-20 → checkpoint-240}/tokenizer_config.json RENAMED
File without changes
checkpoint-240/trainer_state.json ADDED
@@ -0,0 +1,240 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.8126807447116778,
3
+ "best_model_checkpoint": "hf-importance-production/checkpoint-240",
4
+ "epoch": 2.0,
5
+ "eval_steps": 500,
6
+ "global_step": 240,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.08333333333333333,
13
+ "grad_norm": 70.0009765625,
14
+ "learning_rate": 8.403361344537816e-07,
15
+ "loss": 0.7483,
16
+ "step": 10
17
+ },
18
+ {
19
+ "epoch": 0.16666666666666666,
20
+ "grad_norm": 24.547622680664062,
21
+ "learning_rate": 1.6806722689075632e-06,
22
+ "loss": 0.9913,
23
+ "step": 20
24
+ },
25
+ {
26
+ "epoch": 0.25,
27
+ "grad_norm": 57.52896499633789,
28
+ "learning_rate": 2.521008403361345e-06,
29
+ "loss": 0.6966,
30
+ "step": 30
31
+ },
32
+ {
33
+ "epoch": 0.3333333333333333,
34
+ "grad_norm": 74.12036895751953,
35
+ "learning_rate": 3.3613445378151265e-06,
36
+ "loss": 0.6548,
37
+ "step": 40
38
+ },
39
+ {
40
+ "epoch": 0.4166666666666667,
41
+ "grad_norm": 9.066349983215332,
42
+ "learning_rate": 4.201680672268908e-06,
43
+ "loss": 0.3729,
44
+ "step": 50
45
+ },
46
+ {
47
+ "epoch": 0.5,
48
+ "grad_norm": 50.364627838134766,
49
+ "learning_rate": 5.04201680672269e-06,
50
+ "loss": 0.6898,
51
+ "step": 60
52
+ },
53
+ {
54
+ "epoch": 0.5833333333333334,
55
+ "grad_norm": 78.47008514404297,
56
+ "learning_rate": 5.882352941176471e-06,
57
+ "loss": 0.7254,
58
+ "step": 70
59
+ },
60
+ {
61
+ "epoch": 0.6666666666666666,
62
+ "grad_norm": 0.9752311706542969,
63
+ "learning_rate": 6.722689075630253e-06,
64
+ "loss": 0.6388,
65
+ "step": 80
66
+ },
67
+ {
68
+ "epoch": 0.75,
69
+ "grad_norm": 12.438714027404785,
70
+ "learning_rate": 7.563025210084034e-06,
71
+ "loss": 0.5719,
72
+ "step": 90
73
+ },
74
+ {
75
+ "epoch": 0.8333333333333334,
76
+ "grad_norm": 70.23839569091797,
77
+ "learning_rate": 8.403361344537815e-06,
78
+ "loss": 0.7578,
79
+ "step": 100
80
+ },
81
+ {
82
+ "epoch": 0.9166666666666666,
83
+ "grad_norm": 85.30646514892578,
84
+ "learning_rate": 9.243697478991598e-06,
85
+ "loss": 1.2087,
86
+ "step": 110
87
+ },
88
+ {
89
+ "epoch": 1.0,
90
+ "grad_norm": 1.3721972703933716,
91
+ "learning_rate": 9.917355371900828e-06,
92
+ "loss": 0.7927,
93
+ "step": 120
94
+ },
95
+ {
96
+ "epoch": 1.0,
97
+ "eval_accuracy": 0.8125,
98
+ "eval_f1": 0.8083101323053494,
99
+ "eval_f1_macro": 0.6997588679484738,
100
+ "eval_loss": 0.6532053351402283,
101
+ "eval_precision": 0.8070379283788987,
102
+ "eval_precision_macro": 0.7347195481966371,
103
+ "eval_recall": 0.8125,
104
+ "eval_recall_macro": 0.6755615453728661,
105
+ "eval_runtime": 88.1395,
106
+ "eval_samples_per_second": 1.815,
107
+ "eval_steps_per_second": 0.454,
108
+ "step": 120
109
+ },
110
+ {
111
+ "epoch": 1.0833333333333333,
112
+ "grad_norm": 53.19272232055664,
113
+ "learning_rate": 9.090909090909091e-06,
114
+ "loss": 0.347,
115
+ "step": 130
116
+ },
117
+ {
118
+ "epoch": 1.1666666666666667,
119
+ "grad_norm": 130.35791015625,
120
+ "learning_rate": 8.264462809917356e-06,
121
+ "loss": 0.6841,
122
+ "step": 140
123
+ },
124
+ {
125
+ "epoch": 1.25,
126
+ "grad_norm": 24.545459747314453,
127
+ "learning_rate": 7.43801652892562e-06,
128
+ "loss": 0.5361,
129
+ "step": 150
130
+ },
131
+ {
132
+ "epoch": 1.3333333333333333,
133
+ "grad_norm": 11.489201545715332,
134
+ "learning_rate": 6.611570247933885e-06,
135
+ "loss": 0.1774,
136
+ "step": 160
137
+ },
138
+ {
139
+ "epoch": 1.4166666666666667,
140
+ "grad_norm": 7.724330902099609,
141
+ "learning_rate": 5.785123966942149e-06,
142
+ "loss": 0.1986,
143
+ "step": 170
144
+ },
145
+ {
146
+ "epoch": 1.5,
147
+ "grad_norm": 51.44404602050781,
148
+ "learning_rate": 4.958677685950414e-06,
149
+ "loss": 0.2807,
150
+ "step": 180
151
+ },
152
+ {
153
+ "epoch": 1.5833333333333335,
154
+ "grad_norm": 58.367225646972656,
155
+ "learning_rate": 4.132231404958678e-06,
156
+ "loss": 0.5279,
157
+ "step": 190
158
+ },
159
+ {
160
+ "epoch": 1.6666666666666665,
161
+ "grad_norm": 0.692018985748291,
162
+ "learning_rate": 3.3057851239669424e-06,
163
+ "loss": 0.3302,
164
+ "step": 200
165
+ },
166
+ {
167
+ "epoch": 1.75,
168
+ "grad_norm": 39.534156799316406,
169
+ "learning_rate": 2.479338842975207e-06,
170
+ "loss": 1.0246,
171
+ "step": 210
172
+ },
173
+ {
174
+ "epoch": 1.8333333333333335,
175
+ "grad_norm": 45.754249572753906,
176
+ "learning_rate": 1.6528925619834712e-06,
177
+ "loss": 0.6398,
178
+ "step": 220
179
+ },
180
+ {
181
+ "epoch": 1.9166666666666665,
182
+ "grad_norm": 55.728824615478516,
183
+ "learning_rate": 8.264462809917356e-07,
184
+ "loss": 0.3741,
185
+ "step": 230
186
+ },
187
+ {
188
+ "epoch": 2.0,
189
+ "grad_norm": 0.00028416712302714586,
190
+ "learning_rate": 0.0,
191
+ "loss": 0.4744,
192
+ "step": 240
193
+ },
194
+ {
195
+ "epoch": 2.0,
196
+ "eval_accuracy": 0.8125,
197
+ "eval_f1": 0.8126807447116778,
198
+ "eval_f1_macro": 0.6772336520815223,
199
+ "eval_loss": 0.6551325917243958,
200
+ "eval_precision": 0.8140347917079452,
201
+ "eval_precision_macro": 0.6750957664619245,
202
+ "eval_recall": 0.8125,
203
+ "eval_recall_macro": 0.6814734950584006,
204
+ "eval_runtime": 88.2081,
205
+ "eval_samples_per_second": 1.814,
206
+ "eval_steps_per_second": 0.453,
207
+ "step": 240
208
+ }
209
+ ],
210
+ "logging_steps": 10,
211
+ "max_steps": 240,
212
+ "num_input_tokens_seen": 0,
213
+ "num_train_epochs": 2,
214
+ "save_steps": 500,
215
+ "stateful_callbacks": {
216
+ "EarlyStoppingCallback": {
217
+ "args": {
218
+ "early_stopping_patience": 1,
219
+ "early_stopping_threshold": 0.0
220
+ },
221
+ "attributes": {
222
+ "early_stopping_patience_counter": 0
223
+ }
224
+ },
225
+ "TrainerControl": {
226
+ "args": {
227
+ "should_epoch_stop": false,
228
+ "should_evaluate": false,
229
+ "should_log": false,
230
+ "should_save": true,
231
+ "should_training_stop": true
232
+ },
233
+ "attributes": {}
234
+ }
235
+ },
236
+ "total_flos": 251010200512512.0,
237
+ "train_batch_size": 4,
238
+ "trial_name": null,
239
+ "trial_params": null
240
+ }
{checkpoint-20 → checkpoint-240}/vocab.txt RENAMED
File without changes
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9451c2dc524d02e41d47d82c6085a255f1022b0b351a2d0a6fb9dd8386e8ff77
3
  size 439039996
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5adf2aaa4fe85784e8bc042af10862ff3a302c4a368f116c0a5f33220511fc72
3
  size 439039996
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4d854fcf3b8b50fb52ab209646977147211be9331153446e6dbf38c9cb0bb27f
3
  size 5521
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e92fee1fb04aadd9214a2ac739f02f3f2f13b9a2c138bafa3f4c239de58adc1b
3
  size 5521