Alasil commited on
Commit
60002d9
·
verified ·
1 Parent(s): 0062063

[Run 20260606_151208] Log metrics

Browse files
metrics/run_20260606_151208_metrics.json ADDED
@@ -0,0 +1,250 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "run_id": "20260606_151208",
3
+ "hyperparameters": {
4
+ "model_architecture": "UBC-NLP/MARBERT",
5
+ "task": "sequence-classification",
6
+ "dataset": "Nexus-Analytics/multilingual-hate-detection-dataset_v2",
7
+ "learning_rate": 2e-05,
8
+ "batch_size": 32,
9
+ "num_epochs": 5,
10
+ "max_seq_length": 128,
11
+ "early_stopping_patience": 2,
12
+ "optimizer": "AdamW",
13
+ "seed": 42
14
+ },
15
+ "per_epoch_results": [
16
+ {
17
+ "epoch": 1,
18
+ "train_loss": 0.1552482957959551,
19
+ "val_loss": 0.06442766166583169,
20
+ "val_accuracy": 0.9776687116564418,
21
+ "val_f1_weighted": 0.9776713498136897,
22
+ "val_f1_macro": 0.9776260214755199,
23
+ "val_precision_macro": 0.9775203320887725,
24
+ "val_recall_macro": 0.9777460388424701,
25
+ "hate_recall": 0.9794132784354092,
26
+ "hate_f1": 0.9766487041313832,
27
+ "classification_report": {
28
+ "Hate": {
29
+ "precision": 0.973899692937564,
30
+ "recall": 0.9794132784354092,
31
+ "f1-score": 0.9766487041313832,
32
+ "support": 1943.0
33
+ },
34
+ "Normal": {
35
+ "precision": 0.9811409712399811,
36
+ "recall": 0.976078799249531,
37
+ "f1-score": 0.9786033388196567,
38
+ "support": 2132.0
39
+ },
40
+ "accuracy": 0.9776687116564418,
41
+ "macro avg": {
42
+ "precision": 0.9775203320887725,
43
+ "recall": 0.9777460388424701,
44
+ "f1-score": 0.9776260214755199,
45
+ "support": 4075.0
46
+ },
47
+ "weighted avg": {
48
+ "precision": 0.9776882586653561,
49
+ "recall": 0.9776687116564418,
50
+ "f1-score": 0.9776713498136897,
51
+ "support": 4075.0
52
+ }
53
+ }
54
+ },
55
+ {
56
+ "epoch": 2,
57
+ "train_loss": 0.06698464741152634,
58
+ "val_loss": 0.08235648793765904,
59
+ "val_accuracy": 0.979877300613497,
60
+ "val_f1_weighted": 0.9798606143986976,
61
+ "val_f1_macro": 0.97980429842375,
62
+ "val_precision_macro": 0.9807875544110622,
63
+ "val_recall_macro": 0.9791951721627354,
64
+ "hate_recall": 0.9644879053010808,
65
+ "hate_f1": 0.9785900783289817,
66
+ "classification_report": {
67
+ "Hate": {
68
+ "precision": 0.9931107578166402,
69
+ "recall": 0.9644879053010808,
70
+ "f1-score": 0.9785900783289817,
71
+ "support": 1943.0
72
+ },
73
+ "Normal": {
74
+ "precision": 0.9684643510054844,
75
+ "recall": 0.9939024390243902,
76
+ "f1-score": 0.9810185185185185,
77
+ "support": 2132.0
78
+ },
79
+ "accuracy": 0.979877300613497,
80
+ "macro avg": {
81
+ "precision": 0.9807875544110622,
82
+ "recall": 0.9791951721627354,
83
+ "f1-score": 0.97980429842375,
84
+ "support": 4075.0
85
+ },
86
+ "weighted avg": {
87
+ "precision": 0.9802159997009631,
88
+ "recall": 0.979877300613497,
89
+ "f1-score": 0.9798606143986976,
90
+ "support": 4075.0
91
+ }
92
+ }
93
+ },
94
+ {
95
+ "epoch": 3,
96
+ "train_loss": 0.04852369342719796,
97
+ "val_loss": 0.07133448649710772,
98
+ "val_accuracy": 0.9825766871165644,
99
+ "val_f1_weighted": 0.9825678862883249,
100
+ "val_f1_macro": 0.9825229307062366,
101
+ "val_precision_macro": 0.9830922659607355,
102
+ "val_recall_macro": 0.9821170961521564,
103
+ "hate_recall": 0.9722079258878024,
104
+ "hate_f1": 0.981553650298779,
105
+ "classification_report": {
106
+ "Hate": {
107
+ "precision": 0.9910807974816369,
108
+ "recall": 0.9722079258878024,
109
+ "f1-score": 0.981553650298779,
110
+ "support": 1943.0
111
+ },
112
+ "Normal": {
113
+ "precision": 0.975103734439834,
114
+ "recall": 0.9920262664165104,
115
+ "f1-score": 0.9834922111136944,
116
+ "support": 2132.0
117
+ },
118
+ "accuracy": 0.9825766871165644,
119
+ "macro avg": {
120
+ "precision": 0.9830922659607355,
121
+ "recall": 0.9821170961521564,
122
+ "f1-score": 0.9825229307062366,
123
+ "support": 4075.0
124
+ },
125
+ "weighted avg": {
126
+ "precision": 0.9827217549282322,
127
+ "recall": 0.9825766871165644,
128
+ "f1-score": 0.9825678862883249,
129
+ "support": 4075.0
130
+ }
131
+ }
132
+ },
133
+ {
134
+ "epoch": 4,
135
+ "train_loss": 0.03323969159869843,
136
+ "val_loss": 0.09886962652149123,
137
+ "val_accuracy": 0.9791411042944785,
138
+ "val_f1_weighted": 0.9791271243631345,
139
+ "val_f1_macro": 0.9790709071924115,
140
+ "val_precision_macro": 0.9798448897512311,
141
+ "val_recall_macro": 0.9785600447654977,
142
+ "hate_recall": 0.9660319094184251,
143
+ "hate_f1": 0.9778588174003647,
144
+ "classification_report": {
145
+ "Hate": {
146
+ "precision": 0.9899789029535865,
147
+ "recall": 0.9660319094184251,
148
+ "f1-score": 0.9778588174003647,
149
+ "support": 1943.0
150
+ },
151
+ "Normal": {
152
+ "precision": 0.9697108765488757,
153
+ "recall": 0.9910881801125704,
154
+ "f1-score": 0.9802829969844583,
155
+ "support": 2132.0
156
+ },
157
+ "accuracy": 0.9791411042944785,
158
+ "macro avg": {
159
+ "precision": 0.9798448897512311,
160
+ "recall": 0.9785600447654977,
161
+ "f1-score": 0.9790709071924115,
162
+ "support": 4075.0
163
+ },
164
+ "weighted avg": {
165
+ "precision": 0.9793748704885943,
166
+ "recall": 0.9791411042944785,
167
+ "f1-score": 0.9791271243631345,
168
+ "support": 4075.0
169
+ }
170
+ }
171
+ },
172
+ {
173
+ "epoch": 5,
174
+ "train_loss": 0.021192557967108717,
175
+ "val_loss": 0.10540853567454178,
176
+ "val_accuracy": 0.9838036809815951,
177
+ "val_f1_weighted": 0.9837967629491983,
178
+ "val_f1_macro": 0.9837559033203549,
179
+ "val_precision_macro": 0.9842304403632631,
180
+ "val_recall_macro": 0.9834037662499433,
181
+ "hate_recall": 0.9747812660833762,
182
+ "hate_f1": 0.98287493513233,
183
+ "classification_report": {
184
+ "Hate": {
185
+ "precision": 0.9911041339612768,
186
+ "recall": 0.9747812660833762,
187
+ "f1-score": 0.98287493513233,
188
+ "support": 1943.0
189
+ },
190
+ "Normal": {
191
+ "precision": 0.9773567467652495,
192
+ "recall": 0.9920262664165104,
193
+ "f1-score": 0.9846368715083799,
194
+ "support": 2132.0
195
+ },
196
+ "accuracy": 0.9838036809815951,
197
+ "macro avg": {
198
+ "precision": 0.9842304403632631,
199
+ "recall": 0.9834037662499433,
200
+ "f1-score": 0.9837559033203549,
201
+ "support": 4075.0
202
+ },
203
+ "weighted avg": {
204
+ "precision": 0.9839116359239933,
205
+ "recall": 0.9838036809815951,
206
+ "f1-score": 0.9837967629491983,
207
+ "support": 4075.0
208
+ }
209
+ }
210
+ }
211
+ ],
212
+ "best_val_macro_f1": 0.9837559033203549,
213
+ "best_val_weighted_f1": 0.9837967629491983,
214
+ "best_epoch": 5,
215
+ "test_metrics": {
216
+ "test_accuracy": 0.9811042944785276,
217
+ "test_f1_macro": 0.9810417809481786,
218
+ "test_f1_weighted": 0.9810922726457683,
219
+ "test_precision_macro": 0.9817749312309503,
220
+ "test_recall_macro": 0.9805502795912396,
221
+ "classification_report": {
222
+ "Hate": {
223
+ "precision": 0.9915700737618546,
224
+ "recall": 0.968605249613999,
225
+ "f1-score": 0.9799531372038531,
226
+ "support": 1943.0
227
+ },
228
+ "Normal": {
229
+ "precision": 0.971979788700046,
230
+ "recall": 0.9924953095684803,
231
+ "f1-score": 0.9821304246925041,
232
+ "support": 2132.0
233
+ },
234
+ "accuracy": 0.9811042944785276,
235
+ "macro avg": {
236
+ "precision": 0.9817749312309503,
237
+ "recall": 0.9805502795912396,
238
+ "f1-score": 0.9810417809481786,
239
+ "support": 4075.0
240
+ },
241
+ "weighted avg": {
242
+ "precision": 0.981320628914793,
243
+ "recall": 0.9811042944785276,
244
+ "f1-score": 0.9810922726457683,
245
+ "support": 4075.0
246
+ }
247
+ }
248
+ },
249
+ "notes": "MARBERT sweep. LR=2e-05, Batch=32. Early stopping based on validation macro F1."
250
+ }