Alasil committed on
Commit
6e4e84e
·
verified ·
1 Parent(s): 36cbc2c

[Run 20260606_161024] Log metrics

Browse files
metrics/run_20260606_161024_metrics.json ADDED
@@ -0,0 +1,250 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "run_id": "20260606_161024",
3
+ "hyperparameters": {
4
+ "model_architecture": "UBC-NLP/MARBERT",
5
+ "task": "sequence-classification",
6
+ "dataset": "Nexus-Analytics/multilingual-hate-detection-dataset_v2",
7
+ "learning_rate": 3e-05,
8
+ "batch_size": 64,
9
+ "num_epochs": 5,
10
+ "max_seq_length": 128,
11
+ "early_stopping_patience": 2,
12
+ "optimizer": "AdamW",
13
+ "seed": 42
14
+ },
15
+ "per_epoch_results": [
16
+ {
17
+ "epoch": 1,
18
+ "train_loss": 0.1463778932577299,
19
+ "val_loss": 0.11948525108891772,
20
+ "val_accuracy": 0.9739877300613496,
21
+ "val_f1_weighted": 0.9739560473009347,
22
+ "val_f1_macro": 0.9738772572783241,
23
+ "val_precision_macro": 0.975375976145564,
24
+ "val_recall_macro": 0.973064780580503,
25
+ "hate_recall": 0.9531652084405559,
26
+ "hate_f1": 0.9721784776902888,
27
+ "classification_report": {
28
+ "Hate": {
29
+ "precision": 0.9919657204070702,
30
+ "recall": 0.9531652084405559,
31
+ "f1-score": 0.9721784776902888,
32
+ "support": 1943.0
33
+ },
34
+ "Normal": {
35
+ "precision": 0.958786231884058,
36
+ "recall": 0.9929643527204502,
37
+ "f1-score": 0.9755760368663594,
38
+ "support": 2132.0
39
+ },
40
+ "accuracy": 0.9739877300613496,
41
+ "macro avg": {
42
+ "precision": 0.975375976145564,
43
+ "recall": 0.973064780580503,
44
+ "f1-score": 0.9738772572783241,
45
+ "support": 4075.0
46
+ },
47
+ "weighted avg": {
48
+ "precision": 0.974606537700061,
49
+ "recall": 0.9739877300613496,
50
+ "f1-score": 0.9739560473009347,
51
+ "support": 4075.0
52
+ }
53
+ }
54
+ },
55
+ {
56
+ "epoch": 2,
57
+ "train_loss": 0.062295065309083554,
58
+ "val_loss": 0.25368876694119535,
59
+ "val_accuracy": 0.9423312883435583,
60
+ "val_f1_weighted": 0.9419861159442119,
61
+ "val_f1_macro": 0.9417061263155575,
62
+ "val_precision_macro": 0.950236143565397,
63
+ "val_recall_macro": 0.9395493178475869,
64
+ "hate_recall": 0.8795676788471436,
65
+ "hate_f1": 0.9356693128935122,
66
+ "classification_report": {
67
+ "Hate": {
68
+ "precision": 0.9994152046783625,
69
+ "recall": 0.8795676788471436,
70
+ "f1-score": 0.9356693128935122,
71
+ "support": 1943.0
72
+ },
73
+ "Normal": {
74
+ "precision": 0.9010570824524313,
75
+ "recall": 0.9995309568480301,
76
+ "f1-score": 0.9477429397376028,
77
+ "support": 2132.0
78
+ },
79
+ "accuracy": 0.9423312883435583,
80
+ "macro avg": {
81
+ "precision": 0.950236143565397,
82
+ "recall": 0.9395493178475869,
83
+ "f1-score": 0.9417061263155575,
84
+ "support": 4075.0
85
+ },
86
+ "weighted avg": {
87
+ "precision": 0.9479552006082557,
88
+ "recall": 0.9423312883435583,
89
+ "f1-score": 0.9419861159442119,
90
+ "support": 4075.0
91
+ }
92
+ }
93
+ },
94
+ {
95
+ "epoch": 3,
96
+ "train_loss": 0.042429992100227805,
97
+ "val_loss": 0.08841686587220465,
98
+ "val_accuracy": 0.9815950920245399,
99
+ "val_f1_weighted": 0.9815846068456822,
100
+ "val_f1_macro": 0.9815362727285084,
101
+ "val_precision_macro": 0.9821854148248047,
102
+ "val_recall_macro": 0.9810877600739268,
103
+ "hate_recall": 0.9701492537313433,
104
+ "hate_f1": 0.9804941482444733,
105
+ "classification_report": {
106
+ "Hate": {
107
+ "precision": 0.991062039957939,
108
+ "recall": 0.9701492537313433,
109
+ "f1-score": 0.9804941482444733,
110
+ "support": 1943.0
111
+ },
112
+ "Normal": {
113
+ "precision": 0.9733087896916705,
114
+ "recall": 0.9920262664165104,
115
+ "f1-score": 0.9825783972125436,
116
+ "support": 2132.0
117
+ },
118
+ "accuracy": 0.9815950920245399,
119
+ "macro avg": {
120
+ "precision": 0.9821854148248047,
121
+ "recall": 0.9810877600739268,
122
+ "f1-score": 0.9815362727285084,
123
+ "support": 4075.0
124
+ },
125
+ "weighted avg": {
126
+ "precision": 0.9817737136836604,
127
+ "recall": 0.9815950920245399,
128
+ "f1-score": 0.9815846068456822,
129
+ "support": 4075.0
130
+ }
131
+ }
132
+ },
133
+ {
134
+ "epoch": 4,
135
+ "train_loss": 0.02510130808260151,
136
+ "val_loss": 0.0717304450595293,
137
+ "val_accuracy": 0.9852760736196319,
138
+ "val_f1_weighted": 0.9852723575092364,
139
+ "val_f1_macro": 0.9852372402659978,
140
+ "val_precision_macro": 0.9855061116942819,
141
+ "val_recall_macro": 0.9850162076980047,
142
+ "hate_recall": 0.9794132784354092,
143
+ "hate_f1": 0.9844800827728919,
144
+ "classification_report": {
145
+ "Hate": {
146
+ "precision": 0.9895995839833593,
147
+ "recall": 0.9794132784354092,
148
+ "f1-score": 0.9844800827728919,
149
+ "support": 1943.0
150
+ },
151
+ "Normal": {
152
+ "precision": 0.9814126394052045,
153
+ "recall": 0.9906191369606003,
154
+ "f1-score": 0.9859943977591037,
155
+ "support": 2132.0
156
+ },
157
+ "accuracy": 0.9852760736196319,
158
+ "macro avg": {
159
+ "precision": 0.9855061116942819,
160
+ "recall": 0.9850162076980047,
161
+ "f1-score": 0.9852372402659978,
162
+ "support": 4075.0
163
+ },
164
+ "weighted avg": {
165
+ "precision": 0.9853162549427149,
166
+ "recall": 0.9852760736196319,
167
+ "f1-score": 0.9852723575092364,
168
+ "support": 4075.0
169
+ }
170
+ }
171
+ },
172
+ {
173
+ "epoch": 5,
174
+ "train_loss": 0.020272867037444343,
175
+ "val_loss": 0.10328626508123762,
176
+ "val_accuracy": 0.9850306748466258,
177
+ "val_f1_weighted": 0.9850294351740828,
178
+ "val_f1_macro": 0.9849959640154234,
179
+ "val_precision_macro": 0.9850792204204483,
180
+ "val_recall_macro": 0.9849185607834542,
181
+ "hate_recall": 0.9825012866700978,
182
+ "hate_f1": 0.9842742974993555,
183
+ "classification_report": {
184
+ "Hate": {
185
+ "precision": 0.9860537190082644,
186
+ "recall": 0.9825012866700978,
187
+ "f1-score": 0.9842742974993555,
188
+ "support": 1943.0
189
+ },
190
+ "Normal": {
191
+ "precision": 0.9841047218326321,
192
+ "recall": 0.9873358348968105,
193
+ "f1-score": 0.9857176305314914,
194
+ "support": 2132.0
195
+ },
196
+ "accuracy": 0.9850306748466258,
197
+ "macro avg": {
198
+ "precision": 0.9850792204204483,
199
+ "recall": 0.9849185607834542,
200
+ "f1-score": 0.9849959640154234,
201
+ "support": 4075.0
202
+ },
203
+ "weighted avg": {
204
+ "precision": 0.9850340228172343,
205
+ "recall": 0.9850306748466258,
206
+ "f1-score": 0.9850294351740828,
207
+ "support": 4075.0
208
+ }
209
+ }
210
+ }
211
+ ],
212
+ "best_val_macro_f1": 0.9852372402659978,
213
+ "best_val_weighted_f1": 0.9852723575092364,
214
+ "best_epoch": 4,
215
+ "test_metrics": {
216
+ "test_accuracy": 0.9850306748466258,
217
+ "test_f1_macro": 0.9849884977742274,
218
+ "test_f1_weighted": 0.9850254027125759,
219
+ "test_precision_macro": 0.9853737715887565,
220
+ "test_recall_macro": 0.9846904363477302,
221
+ "classification_report": {
222
+ "Hate": {
223
+ "precision": 0.9911273486430062,
224
+ "recall": 0.9773546062789501,
225
+ "f1-score": 0.9841927960611557,
226
+ "support": 1943.0
227
+ },
228
+ "Normal": {
229
+ "precision": 0.9796201945345067,
230
+ "recall": 0.9920262664165104,
231
+ "f1-score": 0.985784199487299,
232
+ "support": 2132.0
233
+ },
234
+ "accuracy": 0.9850306748466258,
235
+ "macro avg": {
236
+ "precision": 0.9853737715887565,
237
+ "recall": 0.9846904363477302,
238
+ "f1-score": 0.9849884977742274,
239
+ "support": 4075.0
240
+ },
241
+ "weighted avg": {
242
+ "precision": 0.9851069185670992,
243
+ "recall": 0.9850306748466258,
244
+ "f1-score": 0.9850254027125759,
245
+ "support": 4075.0
246
+ }
247
+ }
248
+ },
249
+ "notes": "MARBERT sweep. LR=3e-05, Batch=64. Early stopping based on validation macro F1."
250
+ }