Bencode92 committed on
Commit
ef62e20
·
1 Parent(s): 6a87ec8

🔄 Incremental label | Acc: 0.831, F1: 0.825

Browse files
README.md CHANGED
@@ -21,19 +21,19 @@ Fine-tuned FinBERT model for financial sentiment analysis in TradePulse.
21
 
22
  ## Performance
23
 
24
- *Last training: 2025-07-29 12:46*
25
  *Dataset: `base_reference.csv` (637 samples)*
26
 
27
  | Metric | Value |
28
  |--------|-------|
29
- | Loss | 0.9526 |
30
- | Accuracy | 0.8250 |
31
- | F1 Score | 0.8217 |
32
 
33
- | F1 Macro | 0.8217 |
34
 
35
- | Precision | 0.8277 |
36
- | Recall | 0.8250 |
37
 
38
  ## Training Details
39
 
@@ -65,4 +65,4 @@ predictions = outputs.logits.softmax(dim=-1)
65
  ## Model Card Authors
66
 
67
  - TradePulse ML Team
68
- - Auto-generated on 2025-07-29 12:46:43
 
21
 
22
  ## Performance
23
 
24
+ *Last training: 2025-07-29 14:55*
25
  *Dataset: `base_reference.csv` (637 samples)*
26
 
27
  | Metric | Value |
28
  |--------|-------|
29
+ | Loss | 1.1338 |
30
+ | Accuracy | 0.8187 |
31
+ | F1 Score | 0.8160 |
32
 
33
+ | F1 Macro | 0.8160 |
34
 
35
+ | Precision | 0.8227 |
36
+ | Recall | 0.8187 |
37
 
38
  ## Training Details
39
 
 
65
  ## Model Card Authors
66
 
67
  - TradePulse ML Team
68
+ - Auto-generated on 2025-07-29 14:55:29
checkpoint-240/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f2b8d9dbc3c718fdf0698f3013f7f79c7162a22a441338d87fa34509632536c6
3
  size 439039996
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3086611e9d798eb5c227056fa1df462ffab398880a94c55f85c7417182546d44
3
  size 439039996
checkpoint-240/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.8217223565907776,
3
  "best_model_checkpoint": "hf-sentiment-production/checkpoint-240",
4
  "epoch": 2.0,
5
  "eval_steps": 500,
@@ -10,200 +10,200 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.08333333333333333,
13
- "grad_norm": 32.42210006713867,
14
  "learning_rate": 8.403361344537816e-07,
15
- "loss": 0.5341,
16
  "step": 10
17
  },
18
  {
19
  "epoch": 0.16666666666666666,
20
- "grad_norm": 32.30667495727539,
21
  "learning_rate": 1.6806722689075632e-06,
22
- "loss": 0.2982,
23
  "step": 20
24
  },
25
  {
26
  "epoch": 0.25,
27
- "grad_norm": 65.03559112548828,
28
  "learning_rate": 2.521008403361345e-06,
29
- "loss": 0.4933,
30
  "step": 30
31
  },
32
  {
33
  "epoch": 0.3333333333333333,
34
- "grad_norm": 11.74012565612793,
35
  "learning_rate": 3.3613445378151265e-06,
36
- "loss": 0.3533,
37
  "step": 40
38
  },
39
  {
40
  "epoch": 0.4166666666666667,
41
- "grad_norm": 88.07356262207031,
42
  "learning_rate": 4.201680672268908e-06,
43
- "loss": 0.9541,
44
  "step": 50
45
  },
46
  {
47
  "epoch": 0.5,
48
- "grad_norm": 56.444908142089844,
49
  "learning_rate": 5.04201680672269e-06,
50
- "loss": 0.857,
51
  "step": 60
52
  },
53
  {
54
  "epoch": 0.5833333333333334,
55
- "grad_norm": 7.758561611175537,
56
  "learning_rate": 5.882352941176471e-06,
57
- "loss": 0.8653,
58
  "step": 70
59
  },
60
  {
61
  "epoch": 0.6666666666666666,
62
- "grad_norm": 2.285611629486084,
63
  "learning_rate": 6.722689075630253e-06,
64
- "loss": 1.3253,
65
  "step": 80
66
  },
67
  {
68
  "epoch": 0.75,
69
- "grad_norm": 51.23533630371094,
70
  "learning_rate": 7.563025210084034e-06,
71
- "loss": 0.6127,
72
  "step": 90
73
  },
74
  {
75
  "epoch": 0.8333333333333334,
76
- "grad_norm": 79.65983581542969,
77
  "learning_rate": 8.403361344537815e-06,
78
- "loss": 0.6925,
79
  "step": 100
80
  },
81
  {
82
  "epoch": 0.9166666666666666,
83
- "grad_norm": 98.18861389160156,
84
  "learning_rate": 9.243697478991598e-06,
85
- "loss": 0.7733,
86
  "step": 110
87
  },
88
  {
89
  "epoch": 1.0,
90
- "grad_norm": 0.007537131663411856,
91
  "learning_rate": 9.917355371900828e-06,
92
- "loss": 0.3243,
93
  "step": 120
94
  },
95
  {
96
  "epoch": 1.0,
97
- "eval_accuracy": 0.81875,
98
- "eval_f1": 0.8149920382165605,
99
- "eval_f1_macro": 0.8011677282377919,
100
- "eval_loss": 0.8371865153312683,
101
- "eval_precision": 0.8279807278208441,
102
- "eval_precision_macro": 0.8436405397645709,
103
- "eval_recall": 0.81875,
104
- "eval_recall_macro": 0.7802058251146221,
105
- "eval_runtime": 88.4094,
106
- "eval_samples_per_second": 1.81,
107
- "eval_steps_per_second": 0.452,
108
  "step": 120
109
  },
110
  {
111
  "epoch": 1.0833333333333333,
112
- "grad_norm": 77.50802612304688,
113
  "learning_rate": 9.090909090909091e-06,
114
- "loss": 0.4296,
115
  "step": 130
116
  },
117
  {
118
  "epoch": 1.1666666666666667,
119
- "grad_norm": 15.326767921447754,
120
  "learning_rate": 8.264462809917356e-06,
121
- "loss": 0.1833,
122
  "step": 140
123
  },
124
  {
125
  "epoch": 1.25,
126
- "grad_norm": 91.35188293457031,
127
  "learning_rate": 7.43801652892562e-06,
128
- "loss": 0.3804,
129
  "step": 150
130
  },
131
  {
132
  "epoch": 1.3333333333333333,
133
- "grad_norm": 88.58149719238281,
134
  "learning_rate": 6.611570247933885e-06,
135
- "loss": 0.5602,
136
  "step": 160
137
  },
138
  {
139
  "epoch": 1.4166666666666667,
140
- "grad_norm": 44.488040924072266,
141
  "learning_rate": 5.785123966942149e-06,
142
- "loss": 0.1753,
143
  "step": 170
144
  },
145
  {
146
  "epoch": 1.5,
147
- "grad_norm": 71.1673583984375,
148
  "learning_rate": 4.958677685950414e-06,
149
- "loss": 0.2846,
150
  "step": 180
151
  },
152
  {
153
  "epoch": 1.5833333333333335,
154
- "grad_norm": 68.90252685546875,
155
  "learning_rate": 4.132231404958678e-06,
156
- "loss": 0.3893,
157
  "step": 190
158
  },
159
  {
160
  "epoch": 1.6666666666666665,
161
- "grad_norm": 9.828429222106934,
162
  "learning_rate": 3.3057851239669424e-06,
163
- "loss": 0.2814,
164
  "step": 200
165
  },
166
  {
167
  "epoch": 1.75,
168
- "grad_norm": 29.61725616455078,
169
  "learning_rate": 2.479338842975207e-06,
170
- "loss": 0.3129,
171
  "step": 210
172
  },
173
  {
174
  "epoch": 1.8333333333333335,
175
- "grad_norm": 108.5630111694336,
176
  "learning_rate": 1.6528925619834712e-06,
177
- "loss": 0.3268,
178
  "step": 220
179
  },
180
  {
181
  "epoch": 1.9166666666666665,
182
- "grad_norm": 21.261966705322266,
183
  "learning_rate": 8.264462809917356e-07,
184
- "loss": 0.8541,
185
  "step": 230
186
  },
187
  {
188
  "epoch": 2.0,
189
- "grad_norm": 0.0011018794029951096,
190
  "learning_rate": 0.0,
191
- "loss": 0.8383,
192
  "step": 240
193
  },
194
  {
195
  "epoch": 2.0,
196
- "eval_accuracy": 0.825,
197
- "eval_f1": 0.8217223565907776,
198
- "eval_f1_macro": 0.8096114411903885,
199
- "eval_loss": 0.9526222348213196,
200
- "eval_precision": 0.8277439948473138,
201
- "eval_precision_macro": 0.8298729509231896,
202
- "eval_recall": 0.825,
203
- "eval_recall_macro": 0.798550868049829,
204
- "eval_runtime": 88.1644,
205
- "eval_samples_per_second": 1.815,
206
- "eval_steps_per_second": 0.454,
207
  "step": 240
208
  }
209
  ],
 
1
  {
2
+ "best_metric": 0.8159816100353184,
3
  "best_model_checkpoint": "hf-sentiment-production/checkpoint-240",
4
  "epoch": 2.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.08333333333333333,
13
+ "grad_norm": 1.4732459783554077,
14
  "learning_rate": 8.403361344537816e-07,
15
+ "loss": 0.2538,
16
  "step": 10
17
  },
18
  {
19
  "epoch": 0.16666666666666666,
20
+ "grad_norm": 15.764479637145996,
21
  "learning_rate": 1.6806722689075632e-06,
22
+ "loss": 0.2491,
23
  "step": 20
24
  },
25
  {
26
  "epoch": 0.25,
27
+ "grad_norm": 0.6188515424728394,
28
  "learning_rate": 2.521008403361345e-06,
29
+ "loss": 0.0484,
30
  "step": 30
31
  },
32
  {
33
  "epoch": 0.3333333333333333,
34
+ "grad_norm": 5.2134857177734375,
35
  "learning_rate": 3.3613445378151265e-06,
36
+ "loss": 0.0038,
37
  "step": 40
38
  },
39
  {
40
  "epoch": 0.4166666666666667,
41
+ "grad_norm": 67.50135803222656,
42
  "learning_rate": 4.201680672268908e-06,
43
+ "loss": 0.2405,
44
  "step": 50
45
  },
46
  {
47
  "epoch": 0.5,
48
+ "grad_norm": 1.7730236053466797,
49
  "learning_rate": 5.04201680672269e-06,
50
+ "loss": 0.0307,
51
  "step": 60
52
  },
53
  {
54
  "epoch": 0.5833333333333334,
55
+ "grad_norm": 0.07660957425832748,
56
  "learning_rate": 5.882352941176471e-06,
57
+ "loss": 0.0168,
58
  "step": 70
59
  },
60
  {
61
  "epoch": 0.6666666666666666,
62
+ "grad_norm": 0.02174329198896885,
63
  "learning_rate": 6.722689075630253e-06,
64
+ "loss": 0.1938,
65
  "step": 80
66
  },
67
  {
68
  "epoch": 0.75,
69
+ "grad_norm": 2.6392903327941895,
70
  "learning_rate": 7.563025210084034e-06,
71
+ "loss": 0.0109,
72
  "step": 90
73
  },
74
  {
75
  "epoch": 0.8333333333333334,
76
+ "grad_norm": 0.5411686897277832,
77
  "learning_rate": 8.403361344537815e-06,
78
+ "loss": 0.0039,
79
  "step": 100
80
  },
81
  {
82
  "epoch": 0.9166666666666666,
83
+ "grad_norm": 0.4245348274707794,
84
  "learning_rate": 9.243697478991598e-06,
85
+ "loss": 0.0448,
86
  "step": 110
87
  },
88
  {
89
  "epoch": 1.0,
90
+ "grad_norm": 0.00010414929420221597,
91
  "learning_rate": 9.917355371900828e-06,
92
+ "loss": 0.0007,
93
  "step": 120
94
  },
95
  {
96
  "epoch": 1.0,
97
+ "eval_accuracy": 0.80625,
98
+ "eval_f1": 0.8014322617130588,
99
+ "eval_f1_macro": 0.7881169644454667,
100
+ "eval_loss": 1.2546101808547974,
101
+ "eval_precision": 0.8257927529986354,
102
+ "eval_precision_macro": 0.8514807632454691,
103
+ "eval_recall": 0.80625,
104
+ "eval_recall_macro": 0.7620669371419776,
105
+ "eval_runtime": 89.5753,
106
+ "eval_samples_per_second": 1.786,
107
+ "eval_steps_per_second": 0.447,
108
  "step": 120
109
  },
110
  {
111
  "epoch": 1.0833333333333333,
112
+ "grad_norm": 1.6099791526794434,
113
  "learning_rate": 9.090909090909091e-06,
114
+ "loss": 0.0035,
115
  "step": 130
116
  },
117
  {
118
  "epoch": 1.1666666666666667,
119
+ "grad_norm": 125.70403289794922,
120
  "learning_rate": 8.264462809917356e-06,
121
+ "loss": 0.0688,
122
  "step": 140
123
  },
124
  {
125
  "epoch": 1.25,
126
+ "grad_norm": 0.19366542994976044,
127
  "learning_rate": 7.43801652892562e-06,
128
+ "loss": 0.0129,
129
  "step": 150
130
  },
131
  {
132
  "epoch": 1.3333333333333333,
133
+ "grad_norm": 0.0414673388004303,
134
  "learning_rate": 6.611570247933885e-06,
135
+ "loss": 0.0142,
136
  "step": 160
137
  },
138
  {
139
  "epoch": 1.4166666666666667,
140
+ "grad_norm": 0.003162428503856063,
141
  "learning_rate": 5.785123966942149e-06,
142
+ "loss": 0.0044,
143
  "step": 170
144
  },
145
  {
146
  "epoch": 1.5,
147
+ "grad_norm": 29.15802574157715,
148
  "learning_rate": 4.958677685950414e-06,
149
+ "loss": 0.0142,
150
  "step": 180
151
  },
152
  {
153
  "epoch": 1.5833333333333335,
154
+ "grad_norm": 1.950109601020813,
155
  "learning_rate": 4.132231404958678e-06,
156
+ "loss": 0.011,
157
  "step": 190
158
  },
159
  {
160
  "epoch": 1.6666666666666665,
161
+ "grad_norm": 0.06768287718296051,
162
  "learning_rate": 3.3057851239669424e-06,
163
+ "loss": 0.0288,
164
  "step": 200
165
  },
166
  {
167
  "epoch": 1.75,
168
+ "grad_norm": 0.052531249821186066,
169
  "learning_rate": 2.479338842975207e-06,
170
+ "loss": 0.1647,
171
  "step": 210
172
  },
173
  {
174
  "epoch": 1.8333333333333335,
175
+ "grad_norm": 17.331710815429688,
176
  "learning_rate": 1.6528925619834712e-06,
177
+ "loss": 0.0113,
178
  "step": 220
179
  },
180
  {
181
  "epoch": 1.9166666666666665,
182
+ "grad_norm": 0.38937193155288696,
183
  "learning_rate": 8.264462809917356e-07,
184
+ "loss": 0.3054,
185
  "step": 230
186
  },
187
  {
188
  "epoch": 2.0,
189
+ "grad_norm": 5.238432277110405e-05,
190
  "learning_rate": 0.0,
191
+ "loss": 0.5109,
192
  "step": 240
193
  },
194
  {
195
  "epoch": 2.0,
196
+ "eval_accuracy": 0.81875,
197
+ "eval_f1": 0.8159816100353184,
198
+ "eval_f1_macro": 0.808021759428409,
199
+ "eval_loss": 1.1338030099868774,
200
+ "eval_precision": 0.8227436921599441,
201
+ "eval_precision_macro": 0.8326930912054014,
202
+ "eval_recall": 0.81875,
203
+ "eval_recall_macro": 0.7938560323690779,
204
+ "eval_runtime": 90.3771,
205
+ "eval_samples_per_second": 1.77,
206
+ "eval_steps_per_second": 0.443,
207
  "step": 240
208
  }
209
  ],
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f2b8d9dbc3c718fdf0698f3013f7f79c7162a22a441338d87fa34509632536c6
3
  size 439039996
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3086611e9d798eb5c227056fa1df462ffab398880a94c55f85c7417182546d44
3
  size 439039996