Alasil commited on
Commit
dc63f38
·
verified ·
1 Parent(s): e6085cb

[Run 20260606_154823] Log metrics

Browse files
metrics/run_20260606_154823_metrics.json ADDED
@@ -0,0 +1,172 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "run_id": "20260606_154823",
3
+ "hyperparameters": {
4
+ "model_architecture": "UBC-NLP/MARBERT",
5
+ "task": "sequence-classification",
6
+ "dataset": "Nexus-Analytics/multilingual-hate-detection-dataset_v2",
7
+ "learning_rate": 3e-05,
8
+ "batch_size": 32,
9
+ "num_epochs": 6,
10
+ "max_seq_length": 128,
11
+ "early_stopping_patience": 2,
12
+ "optimizer": "AdamW",
13
+ "seed": 42
14
+ },
15
+ "per_epoch_results": [
16
+ {
17
+ "epoch": 1,
18
+ "train_loss": 0.16837380265410082,
19
+ "val_loss": 0.10614141499172547,
20
+ "val_accuracy": 0.9752147239263804,
21
+ "val_f1_weighted": 0.9751963911175322,
22
+ "val_f1_macro": 0.9751284518847415,
23
+ "val_precision_macro": 0.9759859969260837,
24
+ "val_recall_macro": 0.9745795751140138,
25
+ "hate_recall": 0.9608852290272774,
26
+ "hate_f1": 0.9736636245110821,
27
+ "classification_report": {
28
+ "Hate": {
29
+ "precision": 0.9867864693446089,
30
+ "recall": 0.9608852290272774,
31
+ "f1-score": 0.9736636245110821,
32
+ "support": 1943.0
33
+ },
34
+ "Normal": {
35
+ "precision": 0.9651855245075585,
36
+ "recall": 0.9882739212007504,
37
+ "f1-score": 0.9765932792584009,
38
+ "support": 2132.0
39
+ },
40
+ "accuracy": 0.9752147239263804,
41
+ "macro avg": {
42
+ "precision": 0.9759859969260837,
43
+ "recall": 0.9745795751140138,
44
+ "f1-score": 0.9751284518847415,
45
+ "support": 4075.0
46
+ },
47
+ "weighted avg": {
48
+ "precision": 0.9754850670396784,
49
+ "recall": 0.9752147239263804,
50
+ "f1-score": 0.9751963911175322,
51
+ "support": 4075.0
52
+ }
53
+ }
54
+ },
55
+ {
56
+ "epoch": 2,
57
+ "train_loss": 0.07127080849091084,
58
+ "val_loss": 0.10314771042203574,
59
+ "val_accuracy": 0.9700613496932515,
60
+ "val_f1_weighted": 0.970077383915934,
61
+ "val_f1_macro": 0.9700429467785818,
62
+ "val_precision_macro": 0.9699921519770369,
63
+ "val_recall_macro": 0.9710005561891004,
64
+ "hate_recall": 0.9912506433350489,
65
+ "hate_f1": 0.9693004529441369,
66
+ "classification_report": {
67
+ "Hate": {
68
+ "precision": 0.948301329394387,
69
+ "recall": 0.9912506433350489,
70
+ "f1-score": 0.9693004529441369,
71
+ "support": 1943.0
72
+ },
73
+ "Normal": {
74
+ "precision": 0.9916829745596869,
75
+ "recall": 0.950750469043152,
76
+ "f1-score": 0.9707854406130269,
77
+ "support": 2132.0
78
+ },
79
+ "accuracy": 0.9700613496932515,
80
+ "macro avg": {
81
+ "precision": 0.9699921519770369,
82
+ "recall": 0.9710005561891004,
83
+ "f1-score": 0.9700429467785818,
84
+ "support": 4075.0
85
+ },
86
+ "weighted avg": {
87
+ "precision": 0.9709981803127723,
88
+ "recall": 0.9700613496932515,
89
+ "f1-score": 0.970077383915934,
90
+ "support": 4075.0
91
+ }
92
+ }
93
+ },
94
+ {
95
+ "epoch": 3,
96
+ "train_loss": 0.04779951434363337,
97
+ "val_loss": 0.16167892069449863,
98
+ "val_accuracy": 0.9739877300613496,
99
+ "val_f1_weighted": 0.973977408520008,
100
+ "val_f1_macro": 0.9739123828095557,
101
+ "val_precision_macro": 0.9743417766264514,
102
+ "val_recall_macro": 0.9735894667826681,
103
+ "hate_recall": 0.9650025733401956,
104
+ "hate_f1": 0.9725103734439834,
105
+ "classification_report": {
106
+ "Hate": {
107
+ "precision": 0.9801359121798223,
108
+ "recall": 0.9650025733401956,
109
+ "f1-score": 0.9725103734439834,
110
+ "support": 1943.0
111
+ },
112
+ "Normal": {
113
+ "precision": 0.9685476410730804,
114
+ "recall": 0.9821763602251408,
115
+ "f1-score": 0.975314392175128,
116
+ "support": 2132.0
117
+ },
118
+ "accuracy": 0.9739877300613496,
119
+ "macro avg": {
120
+ "precision": 0.9743417766264514,
121
+ "recall": 0.9735894667826681,
122
+ "f1-score": 0.9739123828095557,
123
+ "support": 4075.0
124
+ },
125
+ "weighted avg": {
126
+ "precision": 0.9740730424866755,
127
+ "recall": 0.9739877300613496,
128
+ "f1-score": 0.973977408520008,
129
+ "support": 4075.0
130
+ }
131
+ }
132
+ }
133
+ ],
134
+ "best_val_macro_f1": 0.9751284518847415,
135
+ "best_val_weighted_f1": 0.9751963911175322,
136
+ "best_epoch": 1,
137
+ "test_metrics": {
138
+ "test_accuracy": 0.9749693251533742,
139
+ "test_f1_macro": 0.974890027199601,
140
+ "test_f1_weighted": 0.9749554739824096,
141
+ "test_precision_macro": 0.9755105827863149,
142
+ "test_recall_macro": 0.9744591157558908,
143
+ "classification_report": {
144
+ "Hate": {
145
+ "precision": 0.9837099316868103,
146
+ "recall": 0.9634585692228512,
147
+ "f1-score": 0.9734789391575663,
148
+ "support": 1943.0
149
+ },
150
+ "Normal": {
151
+ "precision": 0.9673112338858195,
152
+ "recall": 0.9854596622889306,
153
+ "f1-score": 0.9763011152416357,
154
+ "support": 2132.0
155
+ },
156
+ "accuracy": 0.9749693251533742,
157
+ "macro avg": {
158
+ "precision": 0.9755105827863149,
159
+ "recall": 0.9744591157558908,
160
+ "f1-score": 0.974890027199601,
161
+ "support": 4075.0
162
+ },
163
+ "weighted avg": {
164
+ "precision": 0.9751302939661447,
165
+ "recall": 0.9749693251533742,
166
+ "f1-score": 0.9749554739824096,
167
+ "support": 4075.0
168
+ }
169
+ }
170
+ },
171
+ "notes": "MARBERT sweep. LR=3e-05, Batch=32. Early stopping based on validation macro F1."
172
+ }