Alasil committed on
Commit
9e5a921
·
verified ·
1 Parent(s): bf50f18

[Run 20260606_135237] Log metrics

Browse files
metrics/run_20260606_135237_metrics.json ADDED
@@ -0,0 +1,250 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "run_id": "20260606_135237",
3
+ "hyperparameters": {
4
+ "model_architecture": "UBC-NLP/MARBERT",
5
+ "task": "sequence-classification",
6
+ "dataset": "Nexus-Analytics/multilingual-hate-detection-dataset_v2",
7
+ "learning_rate": 2e-05,
8
+ "batch_size": 16,
9
+ "num_epochs": 5,
10
+ "max_seq_length": 128,
11
+ "early_stopping_patience": 2,
12
+ "optimizer": "AdamW",
13
+ "seed": 42
14
+ },
15
+ "per_epoch_results": [
16
+ {
17
+ "epoch": 1,
18
+ "train_loss": 0.17704563700628081,
19
+ "val_loss": 0.08185144391769142,
20
+ "val_accuracy": 0.9764417177914111,
21
+ "val_f1_weighted": 0.9764376758355681,
22
+ "val_f1_macro": 0.9763831094316877,
23
+ "val_precision_macro": 0.976558193308877,
24
+ "val_recall_macro": 0.9762312443089591,
25
+ "hate_recall": 0.9716932578486875,
26
+ "hate_f1": 0.9752066115702479,
27
+ "classification_report": {
28
+ "Hate": {
29
+ "precision": 0.9787454639709694,
30
+ "recall": 0.9716932578486875,
31
+ "f1-score": 0.9752066115702479,
32
+ "support": 1943.0
33
+ },
34
+ "Normal": {
35
+ "precision": 0.9743709226467847,
36
+ "recall": 0.9807692307692307,
37
+ "f1-score": 0.9775596072931276,
38
+ "support": 2132.0
39
+ },
40
+ "accuracy": 0.9764417177914111,
41
+ "macro avg": {
42
+ "precision": 0.976558193308877,
43
+ "recall": 0.9762312443089591,
44
+ "f1-score": 0.9763831094316877,
45
+ "support": 4075.0
46
+ },
47
+ "weighted avg": {
48
+ "precision": 0.9764567468904389,
49
+ "recall": 0.9764417177914111,
50
+ "f1-score": 0.9764376758355681,
51
+ "support": 4075.0
52
+ }
53
+ }
54
+ },
55
+ {
56
+ "epoch": 2,
57
+ "train_loss": 0.08605310319347592,
58
+ "val_loss": 0.08948595821321029,
59
+ "val_accuracy": 0.9784049079754601,
60
+ "val_f1_weighted": 0.9783943419684894,
61
+ "val_f1_macro": 0.9783388704318936,
62
+ "val_precision_macro": 0.9788841169743632,
63
+ "val_recall_macro": 0.9779477298118323,
64
+ "hate_recall": 0.9680905815748841,
65
+ "hate_f1": 0.9771428571428571,
66
+ "classification_report": {
67
+ "Hate": {
68
+ "precision": 0.9863660199265862,
69
+ "recall": 0.9680905815748841,
70
+ "f1-score": 0.9771428571428571,
71
+ "support": 1943.0
72
+ },
73
+ "Normal": {
74
+ "precision": 0.9714022140221402,
75
+ "recall": 0.9878048780487805,
76
+ "f1-score": 0.9795348837209302,
77
+ "support": 2132.0
78
+ },
79
+ "accuracy": 0.9784049079754601,
80
+ "macro avg": {
81
+ "precision": 0.9788841169743632,
82
+ "recall": 0.9779477298118323,
83
+ "f1-score": 0.9783388704318936,
84
+ "support": 4075.0
85
+ },
86
+ "weighted avg": {
87
+ "precision": 0.9785371035613645,
88
+ "recall": 0.9784049079754601,
89
+ "f1-score": 0.9783943419684894,
90
+ "support": 4075.0
91
+ }
92
+ }
93
+ },
94
+ {
95
+ "epoch": 3,
96
+ "train_loss": 0.0567464292272778,
97
+ "val_loss": 0.09008082439386807,
98
+ "val_accuracy": 0.9820858895705521,
99
+ "val_f1_weighted": 0.982085266800533,
100
+ "val_f1_macro": 0.9820460322893185,
101
+ "val_precision_macro": 0.9820800840194114,
102
+ "val_recall_macro": 0.9820130520973447,
103
+ "hate_recall": 0.9804426145136387,
104
+ "hate_f1": 0.9812001030131342,
105
+ "classification_report": {
106
+ "Hate": {
107
+ "precision": 0.9819587628865979,
108
+ "recall": 0.9804426145136387,
109
+ "f1-score": 0.9812001030131342,
110
+ "support": 1943.0
111
+ },
112
+ "Normal": {
113
+ "precision": 0.9822014051522249,
114
+ "recall": 0.9835834896810507,
115
+ "f1-score": 0.9828919615655027,
116
+ "support": 2132.0
117
+ },
118
+ "accuracy": 0.9820858895705521,
119
+ "macro avg": {
120
+ "precision": 0.9820800840194114,
121
+ "recall": 0.9820130520973447,
122
+ "f1-score": 0.9820460322893185,
123
+ "support": 4075.0
124
+ },
125
+ "weighted avg": {
126
+ "precision": 0.9820857109382093,
127
+ "recall": 0.9820858895705521,
128
+ "f1-score": 0.982085266800533,
129
+ "support": 4075.0
130
+ }
131
+ }
132
+ },
133
+ {
134
+ "epoch": 4,
135
+ "train_loss": 0.03903503223161502,
136
+ "val_loss": 0.10641252933005578,
137
+ "val_accuracy": 0.978159509202454,
138
+ "val_f1_weighted": 0.9781645391606395,
139
+ "val_f1_macro": 0.9781232060259852,
140
+ "val_precision_macro": 0.9779342709417133,
141
+ "val_recall_macro": 0.9783747690994469,
142
+ "hate_recall": 0.9830159547092125,
143
+ "hate_f1": 0.9772320286518291,
144
+ "classification_report": {
145
+ "Hate": {
146
+ "precision": 0.9715157680569685,
147
+ "recall": 0.9830159547092125,
148
+ "f1-score": 0.9772320286518291,
149
+ "support": 1943.0
150
+ },
151
+ "Normal": {
152
+ "precision": 0.984352773826458,
153
+ "recall": 0.9737335834896811,
154
+ "f1-score": 0.9790143834001415,
155
+ "support": 2132.0
156
+ },
157
+ "accuracy": 0.978159509202454,
158
+ "macro avg": {
159
+ "precision": 0.9779342709417133,
160
+ "recall": 0.9783747690994469,
161
+ "f1-score": 0.9781232060259852,
162
+ "support": 4075.0
163
+ },
164
+ "weighted avg": {
165
+ "precision": 0.9782319634681468,
166
+ "recall": 0.978159509202454,
167
+ "f1-score": 0.9781645391606395,
168
+ "support": 4075.0
169
+ }
170
+ }
171
+ },
172
+ {
173
+ "epoch": 5,
174
+ "train_loss": 0.0320917765745486,
175
+ "val_loss": 0.11052904996936644,
176
+ "val_accuracy": 0.9825766871165644,
177
+ "val_f1_weighted": 0.9825730032582375,
178
+ "val_f1_macro": 0.9825320474215442,
179
+ "val_precision_macro": 0.9827533345220337,
180
+ "val_recall_macro": 0.9823452205878803,
181
+ "hate_recall": 0.9773546062789501,
182
+ "hate_f1": 0.9816490049108296,
183
+ "classification_report": {
184
+ "Hate": {
185
+ "precision": 0.985981308411215,
186
+ "recall": 0.9773546062789501,
187
+ "f1-score": 0.9816490049108296,
188
+ "support": 1943.0
189
+ },
190
+ "Normal": {
191
+ "precision": 0.9795253606328524,
192
+ "recall": 0.9873358348968105,
193
+ "f1-score": 0.9834150899322588,
194
+ "support": 2132.0
195
+ },
196
+ "accuracy": 0.9825766871165644,
197
+ "macro avg": {
198
+ "precision": 0.9827533345220337,
199
+ "recall": 0.9823452205878803,
200
+ "f1-score": 0.9825320474215442,
201
+ "support": 4075.0
202
+ },
203
+ "weighted avg": {
204
+ "precision": 0.9826036199048424,
205
+ "recall": 0.9825766871165644,
206
+ "f1-score": 0.9825730032582375,
207
+ "support": 4075.0
208
+ }
209
+ }
210
+ }
211
+ ],
212
+ "best_val_macro_f1": 0.9825320474215442,
213
+ "best_val_weighted_f1": 0.9825730032582375,
214
+ "best_epoch": 5,
215
+ "test_metrics": {
216
+ "test_accuracy": 0.9803680981595092,
217
+ "test_f1_macro": 0.980321168193406,
218
+ "test_f1_weighted": 0.9803657398697553,
219
+ "test_precision_macro": 0.9804425132701813,
220
+ "test_recall_macro": 0.9802117139604429,
221
+ "classification_report": {
222
+ "Hate": {
223
+ "precision": 0.9818934299017071,
224
+ "recall": 0.9768399382398353,
225
+ "f1-score": 0.9793601651186791,
226
+ "support": 1943.0
227
+ },
228
+ "Normal": {
229
+ "precision": 0.9789915966386554,
230
+ "recall": 0.9835834896810507,
231
+ "f1-score": 0.9812821712681329,
232
+ "support": 2132.0
233
+ },
234
+ "accuracy": 0.9803680981595092,
235
+ "macro avg": {
236
+ "precision": 0.9804425132701813,
237
+ "recall": 0.9802117139604429,
238
+ "f1-score": 0.980321168193406,
239
+ "support": 4075.0
240
+ },
241
+ "weighted avg": {
242
+ "precision": 0.9803752192227314,
243
+ "recall": 0.9803680981595092,
244
+ "f1-score": 0.9803657398697553,
245
+ "support": 4075.0
246
+ }
247
+ }
248
+ },
249
+ "notes": "MARBERT sweep. LR=2e-05, Batch=16. Early stopping based on validation macro F1."
250
+ }