Bencode92 committed on
Commit
7e9103f
·
1 Parent(s): ffb163c

🔄 Incremental importance | Acc: 0.775, F1: 0.644

Browse files
README.md CHANGED
@@ -21,19 +21,19 @@ Fine-tuned FinBERT model for financial importance analysis in TradePulse.
21
 
22
  ## Performance
23
 
24
- *Last training: 2025-07-29 13:33*
25
  *Dataset: `base_reference.csv` (637 samples)*
26
 
27
  | Metric | Value |
28
  |--------|-------|
29
- | Loss | 0.6551 |
30
- | Accuracy | 0.8125 |
31
- | F1 Score | 0.8127 |
32
 
33
- | F1 Macro | 0.8127 |
34
 
35
- | Precision | 0.8140 |
36
- | Recall | 0.8125 |
37
 
38
  ## Training Details
39
 
@@ -65,4 +65,4 @@ predictions = outputs.logits.softmax(dim=-1)
65
  ## Model Card Authors
66
 
67
  - TradePulse ML Team
68
- - Auto-generated on 2025-07-29 13:33:51
 
21
 
22
  ## Performance
23
 
24
+ *Last training: 2025-07-29 15:39*
25
  *Dataset: `base_reference.csv` (637 samples)*
26
 
27
  | Metric | Value |
28
  |--------|-------|
29
+ | Loss | 0.8320 |
30
+ | Accuracy | 0.8063 |
31
+ | F1 Score | 0.8051 |
32
 
33
+ | F1 Macro | 0.8051 |
34
 
35
+ | Precision | 0.8047 |
36
+ | Recall | 0.8063 |
37
 
38
  ## Training Details
39
 
 
65
  ## Model Card Authors
66
 
67
  - TradePulse ML Team
68
+ - Auto-generated on 2025-07-29 15:39:17
checkpoint-240/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5adf2aaa4fe85784e8bc042af10862ff3a302c4a368f116c0a5f33220511fc72
3
  size 439039996
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fdc01d91706d553799d11f3cb8130f8e1b17d70daf22d597f48fcefb01b77f14
3
  size 439039996
checkpoint-240/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.8126807447116778,
3
  "best_model_checkpoint": "hf-importance-production/checkpoint-240",
4
  "epoch": 2.0,
5
  "eval_steps": 500,
@@ -10,200 +10,200 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.08333333333333333,
13
- "grad_norm": 70.0009765625,
14
  "learning_rate": 8.403361344537816e-07,
15
- "loss": 0.7483,
16
  "step": 10
17
  },
18
  {
19
  "epoch": 0.16666666666666666,
20
- "grad_norm": 24.547622680664062,
21
  "learning_rate": 1.6806722689075632e-06,
22
- "loss": 0.9913,
23
  "step": 20
24
  },
25
  {
26
  "epoch": 0.25,
27
- "grad_norm": 57.52896499633789,
28
  "learning_rate": 2.521008403361345e-06,
29
- "loss": 0.6966,
30
  "step": 30
31
  },
32
  {
33
  "epoch": 0.3333333333333333,
34
- "grad_norm": 74.12036895751953,
35
  "learning_rate": 3.3613445378151265e-06,
36
- "loss": 0.6548,
37
  "step": 40
38
  },
39
  {
40
  "epoch": 0.4166666666666667,
41
- "grad_norm": 9.066349983215332,
42
  "learning_rate": 4.201680672268908e-06,
43
- "loss": 0.3729,
44
  "step": 50
45
  },
46
  {
47
  "epoch": 0.5,
48
- "grad_norm": 50.364627838134766,
49
  "learning_rate": 5.04201680672269e-06,
50
- "loss": 0.6898,
51
  "step": 60
52
  },
53
  {
54
  "epoch": 0.5833333333333334,
55
- "grad_norm": 78.47008514404297,
56
  "learning_rate": 5.882352941176471e-06,
57
- "loss": 0.7254,
58
  "step": 70
59
  },
60
  {
61
  "epoch": 0.6666666666666666,
62
- "grad_norm": 0.9752311706542969,
63
  "learning_rate": 6.722689075630253e-06,
64
- "loss": 0.6388,
65
  "step": 80
66
  },
67
  {
68
  "epoch": 0.75,
69
- "grad_norm": 12.438714027404785,
70
  "learning_rate": 7.563025210084034e-06,
71
- "loss": 0.5719,
72
  "step": 90
73
  },
74
  {
75
  "epoch": 0.8333333333333334,
76
- "grad_norm": 70.23839569091797,
77
  "learning_rate": 8.403361344537815e-06,
78
- "loss": 0.7578,
79
  "step": 100
80
  },
81
  {
82
  "epoch": 0.9166666666666666,
83
- "grad_norm": 85.30646514892578,
84
  "learning_rate": 9.243697478991598e-06,
85
- "loss": 1.2087,
86
  "step": 110
87
  },
88
  {
89
  "epoch": 1.0,
90
- "grad_norm": 1.3721972703933716,
91
  "learning_rate": 9.917355371900828e-06,
92
- "loss": 0.7927,
93
  "step": 120
94
  },
95
  {
96
  "epoch": 1.0,
97
- "eval_accuracy": 0.8125,
98
- "eval_f1": 0.8083101323053494,
99
- "eval_f1_macro": 0.6997588679484738,
100
- "eval_loss": 0.6532053351402283,
101
- "eval_precision": 0.8070379283788987,
102
- "eval_precision_macro": 0.7347195481966371,
103
- "eval_recall": 0.8125,
104
- "eval_recall_macro": 0.6755615453728661,
105
- "eval_runtime": 88.1395,
106
- "eval_samples_per_second": 1.815,
107
- "eval_steps_per_second": 0.454,
108
  "step": 120
109
  },
110
  {
111
  "epoch": 1.0833333333333333,
112
- "grad_norm": 53.19272232055664,
113
  "learning_rate": 9.090909090909091e-06,
114
- "loss": 0.347,
115
  "step": 130
116
  },
117
  {
118
  "epoch": 1.1666666666666667,
119
- "grad_norm": 130.35791015625,
120
  "learning_rate": 8.264462809917356e-06,
121
- "loss": 0.6841,
122
  "step": 140
123
  },
124
  {
125
  "epoch": 1.25,
126
- "grad_norm": 24.545459747314453,
127
  "learning_rate": 7.43801652892562e-06,
128
- "loss": 0.5361,
129
  "step": 150
130
  },
131
  {
132
  "epoch": 1.3333333333333333,
133
- "grad_norm": 11.489201545715332,
134
  "learning_rate": 6.611570247933885e-06,
135
- "loss": 0.1774,
136
  "step": 160
137
  },
138
  {
139
  "epoch": 1.4166666666666667,
140
- "grad_norm": 7.724330902099609,
141
  "learning_rate": 5.785123966942149e-06,
142
- "loss": 0.1986,
143
  "step": 170
144
  },
145
  {
146
  "epoch": 1.5,
147
- "grad_norm": 51.44404602050781,
148
  "learning_rate": 4.958677685950414e-06,
149
- "loss": 0.2807,
150
  "step": 180
151
  },
152
  {
153
  "epoch": 1.5833333333333335,
154
- "grad_norm": 58.367225646972656,
155
  "learning_rate": 4.132231404958678e-06,
156
- "loss": 0.5279,
157
  "step": 190
158
  },
159
  {
160
  "epoch": 1.6666666666666665,
161
- "grad_norm": 0.692018985748291,
162
  "learning_rate": 3.3057851239669424e-06,
163
- "loss": 0.3302,
164
  "step": 200
165
  },
166
  {
167
  "epoch": 1.75,
168
- "grad_norm": 39.534156799316406,
169
  "learning_rate": 2.479338842975207e-06,
170
- "loss": 1.0246,
171
  "step": 210
172
  },
173
  {
174
  "epoch": 1.8333333333333335,
175
- "grad_norm": 45.754249572753906,
176
  "learning_rate": 1.6528925619834712e-06,
177
- "loss": 0.6398,
178
  "step": 220
179
  },
180
  {
181
  "epoch": 1.9166666666666665,
182
- "grad_norm": 55.728824615478516,
183
  "learning_rate": 8.264462809917356e-07,
184
- "loss": 0.3741,
185
  "step": 230
186
  },
187
  {
188
  "epoch": 2.0,
189
- "grad_norm": 0.00028416712302714586,
190
  "learning_rate": 0.0,
191
- "loss": 0.4744,
192
  "step": 240
193
  },
194
  {
195
  "epoch": 2.0,
196
- "eval_accuracy": 0.8125,
197
- "eval_f1": 0.8126807447116778,
198
- "eval_f1_macro": 0.6772336520815223,
199
- "eval_loss": 0.6551325917243958,
200
- "eval_precision": 0.8140347917079452,
201
- "eval_precision_macro": 0.6750957664619245,
202
- "eval_recall": 0.8125,
203
- "eval_recall_macro": 0.6814734950584006,
204
- "eval_runtime": 88.2081,
205
- "eval_samples_per_second": 1.814,
206
- "eval_steps_per_second": 0.453,
207
  "step": 240
208
  }
209
  ],
 
1
  {
2
+ "best_metric": 0.8051317614424409,
3
  "best_model_checkpoint": "hf-importance-production/checkpoint-240",
4
  "epoch": 2.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.08333333333333333,
13
+ "grad_norm": 1.5605429410934448,
14
  "learning_rate": 8.403361344537816e-07,
15
+ "loss": 0.2922,
16
  "step": 10
17
  },
18
  {
19
  "epoch": 0.16666666666666666,
20
+ "grad_norm": 2.0631015300750732,
21
  "learning_rate": 1.6806722689075632e-06,
22
+ "loss": 0.2751,
23
  "step": 20
24
  },
25
  {
26
  "epoch": 0.25,
27
+ "grad_norm": 26.44710350036621,
28
  "learning_rate": 2.521008403361345e-06,
29
+ "loss": 0.1431,
30
  "step": 30
31
  },
32
  {
33
  "epoch": 0.3333333333333333,
34
+ "grad_norm": 15.7521390914917,
35
  "learning_rate": 3.3613445378151265e-06,
36
+ "loss": 0.1394,
37
  "step": 40
38
  },
39
  {
40
  "epoch": 0.4166666666666667,
41
+ "grad_norm": 0.29773807525634766,
42
  "learning_rate": 4.201680672268908e-06,
43
+ "loss": 0.0197,
44
  "step": 50
45
  },
46
  {
47
  "epoch": 0.5,
48
+ "grad_norm": 22.171756744384766,
49
  "learning_rate": 5.04201680672269e-06,
50
+ "loss": 0.0483,
51
  "step": 60
52
  },
53
  {
54
  "epoch": 0.5833333333333334,
55
+ "grad_norm": 19.108678817749023,
56
  "learning_rate": 5.882352941176471e-06,
57
+ "loss": 0.1641,
58
  "step": 70
59
  },
60
  {
61
  "epoch": 0.6666666666666666,
62
+ "grad_norm": 0.05635490268468857,
63
  "learning_rate": 6.722689075630253e-06,
64
+ "loss": 0.0468,
65
  "step": 80
66
  },
67
  {
68
  "epoch": 0.75,
69
+ "grad_norm": 0.11963564902544022,
70
  "learning_rate": 7.563025210084034e-06,
71
+ "loss": 0.009,
72
  "step": 90
73
  },
74
  {
75
  "epoch": 0.8333333333333334,
76
+ "grad_norm": 42.91386413574219,
77
  "learning_rate": 8.403361344537815e-06,
78
+ "loss": 0.0908,
79
  "step": 100
80
  },
81
  {
82
  "epoch": 0.9166666666666666,
83
+ "grad_norm": 1.6929007768630981,
84
  "learning_rate": 9.243697478991598e-06,
85
+ "loss": 0.1529,
86
  "step": 110
87
  },
88
  {
89
  "epoch": 1.0,
90
+ "grad_norm": 9.662502270657569e-05,
91
  "learning_rate": 9.917355371900828e-06,
92
+ "loss": 0.0054,
93
  "step": 120
94
  },
95
  {
96
  "epoch": 1.0,
97
+ "eval_accuracy": 0.8,
98
+ "eval_f1": 0.7951267793019712,
99
+ "eval_f1_macro": 0.7037467600127446,
100
+ "eval_loss": 0.8872003555297852,
101
+ "eval_precision": 0.7960396600228876,
102
+ "eval_precision_macro": 0.7721565261618667,
103
+ "eval_recall": 0.8,
104
+ "eval_recall_macro": 0.6659389038634321,
105
+ "eval_runtime": 90.131,
106
+ "eval_samples_per_second": 1.775,
107
+ "eval_steps_per_second": 0.444,
108
  "step": 120
109
  },
110
  {
111
  "epoch": 1.0833333333333333,
112
+ "grad_norm": 7.114067077636719,
113
  "learning_rate": 9.090909090909091e-06,
114
+ "loss": 0.0037,
115
  "step": 130
116
  },
117
  {
118
  "epoch": 1.1666666666666667,
119
+ "grad_norm": 3.9886481761932373,
120
  "learning_rate": 8.264462809917356e-06,
121
+ "loss": 0.014,
122
  "step": 140
123
  },
124
  {
125
  "epoch": 1.25,
126
+ "grad_norm": 2.7626068592071533,
127
  "learning_rate": 7.43801652892562e-06,
128
+ "loss": 0.1729,
129
  "step": 150
130
  },
131
  {
132
  "epoch": 1.3333333333333333,
133
+ "grad_norm": 0.5616143345832825,
134
  "learning_rate": 6.611570247933885e-06,
135
+ "loss": 0.0071,
136
  "step": 160
137
  },
138
  {
139
  "epoch": 1.4166666666666667,
140
+ "grad_norm": 1.5667345523834229,
141
  "learning_rate": 5.785123966942149e-06,
142
+ "loss": 0.0452,
143
  "step": 170
144
  },
145
  {
146
  "epoch": 1.5,
147
+ "grad_norm": 9.732388496398926,
148
  "learning_rate": 4.958677685950414e-06,
149
+ "loss": 0.0161,
150
  "step": 180
151
  },
152
  {
153
  "epoch": 1.5833333333333335,
154
+ "grad_norm": 1.119588851928711,
155
  "learning_rate": 4.132231404958678e-06,
156
+ "loss": 0.0546,
157
  "step": 190
158
  },
159
  {
160
  "epoch": 1.6666666666666665,
161
+ "grad_norm": 0.037918105721473694,
162
  "learning_rate": 3.3057851239669424e-06,
163
+ "loss": 0.1803,
164
  "step": 200
165
  },
166
  {
167
  "epoch": 1.75,
168
+ "grad_norm": 2.7715115547180176,
169
  "learning_rate": 2.479338842975207e-06,
170
+ "loss": 0.4811,
171
  "step": 210
172
  },
173
  {
174
  "epoch": 1.8333333333333335,
175
+ "grad_norm": 68.59700775146484,
176
  "learning_rate": 1.6528925619834712e-06,
177
+ "loss": 0.191,
178
  "step": 220
179
  },
180
  {
181
  "epoch": 1.9166666666666665,
182
+ "grad_norm": 9.923303604125977,
183
  "learning_rate": 8.264462809917356e-07,
184
+ "loss": 0.157,
185
  "step": 230
186
  },
187
  {
188
  "epoch": 2.0,
189
+ "grad_norm": 4.033025470562279e-05,
190
  "learning_rate": 0.0,
191
+ "loss": 0.2956,
192
  "step": 240
193
  },
194
  {
195
  "epoch": 2.0,
196
+ "eval_accuracy": 0.80625,
197
+ "eval_f1": 0.8051317614424409,
198
+ "eval_f1_macro": 0.7221451687471104,
199
+ "eval_loss": 0.8320282101631165,
200
+ "eval_precision": 0.8046626213592234,
201
+ "eval_precision_macro": 0.7253629218677761,
202
+ "eval_recall": 0.80625,
203
+ "eval_recall_macro": 0.7194699011680145,
204
+ "eval_runtime": 90.1147,
205
+ "eval_samples_per_second": 1.776,
206
+ "eval_steps_per_second": 0.444,
207
  "step": 240
208
  }
209
  ],
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5adf2aaa4fe85784e8bc042af10862ff3a302c4a368f116c0a5f33220511fc72
3
  size 439039996
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fdc01d91706d553799d11f3cb8130f8e1b17d70daf22d597f48fcefb01b77f14
3
  size 439039996