takedarn commited on
Commit
7aad682
·
verified ·
1 Parent(s): 1a19863

Upload folder using huggingface_hub

Browse files
Files changed (5) hide show
  1. best_eval_results.txt +7 -0
  2. config.json +28 -0
  3. eval_results.txt +1379 -0
  4. pytorch_model.bin +3 -0
  5. vocab.txt +0 -0
best_eval_results.txt ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ att_loss = 0.0
2
+ cls_loss = 0.2774283394823569
3
+ eval_loss = 0.4494276660861391
4
+ global_step = 12299
5
+ loss = 0.2774283394823569
6
+ mcc = 0.5547015581596438
7
+ rep_loss = 0.0
config.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "BertForSequenceClassification"
4
+ ],
5
+ "attention_probs_dropout_prob": 0.1,
6
+ "cell": {},
7
+ "classifier_dropout": null,
8
+ "dtype": "float32",
9
+ "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.1,
11
+ "hidden_size": 768,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 3072,
14
+ "layer_norm_eps": 1e-12,
15
+ "max_position_embeddings": 512,
16
+ "model_type": "bert",
17
+ "num_attention_heads": 12,
18
+ "num_hidden_layers": 6,
19
+ "pad_token_id": 0,
20
+ "position_embedding_type": "absolute",
21
+ "pre_trained": "",
22
+ "structure": [],
23
+ "training": "",
24
+ "transformers_version": "4.57.0",
25
+ "type_vocab_size": 2,
26
+ "use_cache": true,
27
+ "vocab_size": 30522
28
+ }
eval_results.txt ADDED
@@ -0,0 +1,1379 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ att_loss = 0.0
2
+ cls_loss = 0.3314089049594571
3
+ eval_loss = 0.558346668879191
4
+ global_step = 99
5
+ loss = 0.3314089049594571
6
+ mcc = 0.5379646517492308
7
+ rep_loss = 0.0
8
+ att_loss = 0.0
9
+ cls_loss = 0.30922394601543945
10
+ eval_loss = 0.4729316487456813
11
+ global_step = 199
12
+ loss = 0.30922394601543945
13
+ mcc = 0.53908953967947
14
+ rep_loss = 0.0
15
+ att_loss = 0.0
16
+ cls_loss = 0.29862612834742236
17
+ eval_loss = 0.4591611668919072
18
+ global_step = 299
19
+ loss = 0.29862612834742236
20
+ mcc = 0.5174363323196072
21
+ rep_loss = 0.0
22
+ att_loss = 0.0
23
+ cls_loss = 0.2936462070559499
24
+ eval_loss = 0.46544614389087213
25
+ global_step = 399
26
+ loss = 0.2936462070559499
27
+ mcc = 0.5129362341229983
28
+ rep_loss = 0.0
29
+ att_loss = 0.0
30
+ cls_loss = 0.2904629405729756
31
+ eval_loss = 0.4587692695133614
32
+ global_step = 499
33
+ loss = 0.2904629405729756
34
+ mcc = 0.5024595293214101
35
+ rep_loss = 0.0
36
+ att_loss = 0.0
37
+ cls_loss = 0.28836528601152867
38
+ eval_loss = 0.46001112099849817
39
+ global_step = 599
40
+ loss = 0.28836528601152867
41
+ mcc = 0.5243240799797736
42
+ rep_loss = 0.0
43
+ att_loss = 0.0
44
+ cls_loss = 0.28679145567748
45
+ eval_loss = 0.4705536166826884
46
+ global_step = 699
47
+ loss = 0.28679145567748
48
+ mcc = 0.5083737693895587
49
+ rep_loss = 0.0
50
+ att_loss = 0.0
51
+ cls_loss = 0.28570082403243857
52
+ eval_loss = 0.457729236646132
53
+ global_step = 799
54
+ loss = 0.28570082403243857
55
+ mcc = 0.5195210533288269
56
+ rep_loss = 0.0
57
+ att_loss = 0.0
58
+ cls_loss = 0.2847436185474523
59
+ eval_loss = 0.46017983917034033
60
+ global_step = 899
61
+ loss = 0.2847436185474523
62
+ mcc = 0.5148043176747271
63
+ rep_loss = 0.0
64
+ att_loss = 0.0
65
+ cls_loss = 0.2840113452783934
66
+ eval_loss = 0.4604815100178574
67
+ global_step = 999
68
+ loss = 0.2840113452783934
69
+ mcc = 0.5137144786818878
70
+ rep_loss = 0.0
71
+ att_loss = 0.0
72
+ cls_loss = 0.2833313442176857
73
+ eval_loss = 0.45605057297330914
74
+ global_step = 1099
75
+ loss = 0.2833313442176857
76
+ mcc = 0.5086434504606193
77
+ rep_loss = 0.0
78
+ att_loss = 0.0
79
+ cls_loss = 0.28292435375325775
80
+ eval_loss = 0.4674258195992672
81
+ global_step = 1199
82
+ loss = 0.28292435375325775
83
+ mcc = 0.5023013330243151
84
+ rep_loss = 0.0
85
+ att_loss = 0.0
86
+ cls_loss = 0.28249076254281563
87
+ eval_loss = 0.4585440529115272
88
+ global_step = 1299
89
+ loss = 0.28249076254281563
90
+ mcc = 0.49769781134092017
91
+ rep_loss = 0.0
92
+ att_loss = 0.0
93
+ cls_loss = 0.28220195374887613
94
+ eval_loss = 0.46350200248487067
95
+ global_step = 1399
96
+ loss = 0.28220195374887613
97
+ mcc = 0.5022737075453998
98
+ rep_loss = 0.0
99
+ att_loss = 0.0
100
+ cls_loss = 0.2818971301333915
101
+ eval_loss = 0.45705517133076984
102
+ global_step = 1499
103
+ loss = 0.2818971301333915
104
+ mcc = 0.5090466963654656
105
+ rep_loss = 0.0
106
+ att_loss = 0.0
107
+ cls_loss = 0.28161911792200456
108
+ eval_loss = 0.45958378640088166
109
+ global_step = 1599
110
+ loss = 0.28161911792200456
111
+ mcc = 0.5301258210741284
112
+ rep_loss = 0.0
113
+ att_loss = 0.0
114
+ cls_loss = 0.2813657304341124
115
+ eval_loss = 0.45043707210006134
116
+ global_step = 1699
117
+ loss = 0.2813657304341124
118
+ mcc = 0.5258777693272533
119
+ rep_loss = 0.0
120
+ att_loss = 0.0
121
+ cls_loss = 0.2812084330658968
122
+ eval_loss = 0.458847572406133
123
+ global_step = 1799
124
+ loss = 0.2812084330658968
125
+ mcc = 0.49912748891398284
126
+ rep_loss = 0.0
127
+ att_loss = 0.0
128
+ cls_loss = 0.28113282589990257
129
+ eval_loss = 0.4568930548248869
130
+ global_step = 1899
131
+ loss = 0.28113282589990257
132
+ mcc = 0.5136924627518875
133
+ rep_loss = 0.0
134
+ att_loss = 0.0
135
+ cls_loss = 0.2810653937852878
136
+ eval_loss = 0.460727898460446
137
+ global_step = 1999
138
+ loss = 0.2810653937852878
139
+ mcc = 0.5083396333380269
140
+ rep_loss = 0.0
141
+ att_loss = 0.0
142
+ cls_loss = 0.2809604485086625
143
+ eval_loss = 0.4551165293563496
144
+ global_step = 2099
145
+ loss = 0.2809604485086625
146
+ mcc = 0.5094661687755515
147
+ rep_loss = 0.0
148
+ att_loss = 0.0
149
+ cls_loss = 0.2808897217101214
150
+ eval_loss = 0.4542377916249362
151
+ global_step = 2199
152
+ loss = 0.2808897217101214
153
+ mcc = 0.5216771032432638
154
+ rep_loss = 0.0
155
+ att_loss = 0.0
156
+ cls_loss = 0.2808540752591025
157
+ eval_loss = 0.4551556787707589
158
+ global_step = 2299
159
+ loss = 0.2808540752591025
160
+ mcc = 0.5030366431605939
161
+ rep_loss = 0.0
162
+ att_loss = 0.0
163
+ cls_loss = 0.280771658892878
164
+ eval_loss = 0.4529932525121804
165
+ global_step = 2399
166
+ loss = 0.280771658892878
167
+ mcc = 0.4992436500882773
168
+ rep_loss = 0.0
169
+ att_loss = 0.0
170
+ cls_loss = 0.2806162594997582
171
+ eval_loss = 0.4564899161006465
172
+ global_step = 2499
173
+ loss = 0.2806162594997582
174
+ mcc = 0.5258663312307151
175
+ rep_loss = 0.0
176
+ att_loss = 0.0
177
+ cls_loss = 0.2805227454280156
178
+ eval_loss = 0.45711556709173956
179
+ global_step = 2599
180
+ loss = 0.2805227454280156
181
+ mcc = 0.5083396333380269
182
+ rep_loss = 0.0
183
+ att_loss = 0.0
184
+ cls_loss = 0.2804428632831785
185
+ eval_loss = 0.46782211011106317
186
+ global_step = 2699
187
+ loss = 0.2804428632831785
188
+ mcc = 0.5130268868060578
189
+ rep_loss = 0.0
190
+ att_loss = 0.0
191
+ cls_loss = 0.28033756286640515
192
+ eval_loss = 0.46800248821576435
193
+ global_step = 2799
194
+ loss = 0.28033756286640515
195
+ mcc = 0.5107299372054125
196
+ rep_loss = 0.0
197
+ att_loss = 0.0
198
+ cls_loss = 0.2802383803517377
199
+ eval_loss = 0.45390655145500647
200
+ global_step = 2899
201
+ loss = 0.2802383803517377
202
+ mcc = 0.5290369945616428
203
+ rep_loss = 0.0
204
+ att_loss = 0.0
205
+ cls_loss = 0.28015635979199416
206
+ eval_loss = 0.45774519172581757
207
+ global_step = 2999
208
+ loss = 0.28015635979199416
209
+ mcc = 0.5171981604121658
210
+ rep_loss = 0.0
211
+ att_loss = 0.0
212
+ cls_loss = 0.280116079530819
213
+ eval_loss = 0.46175673965251807
214
+ global_step = 3099
215
+ loss = 0.280116079530819
216
+ mcc = 0.5292575156160738
217
+ rep_loss = 0.0
218
+ att_loss = 0.0
219
+ cls_loss = 0.28002789718596477
220
+ eval_loss = 0.4570824693549763
221
+ global_step = 3199
222
+ loss = 0.28002789718596477
223
+ mcc = 0.5102742207491978
224
+ rep_loss = 0.0
225
+ att_loss = 0.0
226
+ cls_loss = 0.27996111961793596
227
+ eval_loss = 0.4685366289182143
228
+ global_step = 3299
229
+ loss = 0.27996111961793596
230
+ mcc = 0.5075323666037682
231
+ rep_loss = 0.0
232
+ att_loss = 0.0
233
+ cls_loss = 0.2799214343133482
234
+ eval_loss = 0.46386505076379486
235
+ global_step = 3399
236
+ loss = 0.2799214343133482
237
+ mcc = 0.49818194163113544
238
+ rep_loss = 0.0
239
+ att_loss = 0.0
240
+ cls_loss = 0.27988882744421306
241
+ eval_loss = 0.46293420683253894
242
+ global_step = 3499
243
+ loss = 0.27988882744421306
244
+ mcc = 0.5157729880756086
245
+ rep_loss = 0.0
246
+ att_loss = 0.0
247
+ cls_loss = 0.2798519777643843
248
+ eval_loss = 0.46502567240686127
249
+ global_step = 3599
250
+ loss = 0.2798519777643843
251
+ mcc = 0.5141951979542654
252
+ rep_loss = 0.0
253
+ att_loss = 0.0
254
+ cls_loss = 0.27981998667294156
255
+ eval_loss = 0.47166980215997406
256
+ global_step = 3699
257
+ loss = 0.27981998667294156
258
+ mcc = 0.5080191328496129
259
+ rep_loss = 0.0
260
+ att_loss = 0.0
261
+ cls_loss = 0.2798082064047836
262
+ eval_loss = 0.4631090304165175
263
+ global_step = 3799
264
+ loss = 0.2798082064047836
265
+ mcc = 0.5080191328496129
266
+ rep_loss = 0.0
267
+ att_loss = 0.0
268
+ cls_loss = 0.2797351769795324
269
+ eval_loss = 0.46201050462144794
270
+ global_step = 3899
271
+ loss = 0.2797351769795324
272
+ mcc = 0.5050401952530084
273
+ rep_loss = 0.0
274
+ att_loss = 0.0
275
+ cls_loss = 0.279704924630922
276
+ eval_loss = 0.458680326739947
277
+ global_step = 3999
278
+ loss = 0.279704924630922
279
+ mcc = 0.5201497752653439
280
+ rep_loss = 0.0
281
+ att_loss = 0.0
282
+ cls_loss = 0.2796514375954612
283
+ eval_loss = 0.46237338853604865
284
+ global_step = 4099
285
+ loss = 0.2796514375954612
286
+ mcc = 0.49253624505108995
287
+ rep_loss = 0.0
288
+ att_loss = 0.0
289
+ cls_loss = 0.27964162459953196
290
+ eval_loss = 0.4619031963926373
291
+ global_step = 4199
292
+ loss = 0.27964162459953196
293
+ mcc = 0.5229745445290679
294
+ rep_loss = 0.0
295
+ att_loss = 0.0
296
+ cls_loss = 0.27961426247175586
297
+ eval_loss = 0.45615032495874347
298
+ global_step = 4299
299
+ loss = 0.27961426247175586
300
+ mcc = 0.5365264430934975
301
+ rep_loss = 0.0
302
+ att_loss = 0.0
303
+ cls_loss = 0.2795747756165357
304
+ eval_loss = 0.46128532922629156
305
+ global_step = 4399
306
+ loss = 0.2795747756165357
307
+ mcc = 0.5041823056504463
308
+ rep_loss = 0.0
309
+ att_loss = 0.0
310
+ cls_loss = 0.2795220803760057
311
+ eval_loss = 0.4602658495758519
312
+ global_step = 4499
313
+ loss = 0.2795220803760057
314
+ mcc = 0.5375605063482544
315
+ rep_loss = 0.0
316
+ att_loss = 0.0
317
+ cls_loss = 0.27950176937822724
318
+ eval_loss = 0.4619640265450333
319
+ global_step = 4599
320
+ loss = 0.27950176937822724
321
+ mcc = 0.5124562838813566
322
+ rep_loss = 0.0
323
+ att_loss = 0.0
324
+ cls_loss = 0.27945331381810273
325
+ eval_loss = 0.4646099471684658
326
+ global_step = 4699
327
+ loss = 0.27945331381810273
328
+ mcc = 0.5169077666628997
329
+ rep_loss = 0.0
330
+ att_loss = 0.0
331
+ cls_loss = 0.27942949730012534
332
+ eval_loss = 0.45465407678575226
333
+ global_step = 4799
334
+ loss = 0.27942949730012534
335
+ mcc = 0.5177285176003892
336
+ rep_loss = 0.0
337
+ att_loss = 0.0
338
+ cls_loss = 0.27937435647265524
339
+ eval_loss = 0.46109452843666077
340
+ global_step = 4899
341
+ loss = 0.27937435647265524
342
+ mcc = 0.5100445720965326
343
+ rep_loss = 0.0
344
+ att_loss = 0.0
345
+ cls_loss = 0.27937307727589655
346
+ eval_loss = 0.4682340549700188
347
+ global_step = 4999
348
+ loss = 0.27937307727589655
349
+ mcc = 0.5113098668014724
350
+ rep_loss = 0.0
351
+ att_loss = 0.0
352
+ cls_loss = 0.27931859925941616
353
+ eval_loss = 0.4559897735263362
354
+ global_step = 5099
355
+ loss = 0.27931859925941616
356
+ mcc = 0.4956987863834426
357
+ rep_loss = 0.0
358
+ att_loss = 0.0
359
+ cls_loss = 0.2792279692418668
360
+ eval_loss = 0.46568602684772376
361
+ global_step = 5199
362
+ loss = 0.2792279692418668
363
+ mcc = 0.5037325824551425
364
+ rep_loss = 0.0
365
+ att_loss = 0.0
366
+ cls_loss = 0.27921356061681935
367
+ eval_loss = 0.4651721232768261
368
+ global_step = 5299
369
+ loss = 0.27921356061681935
370
+ mcc = 0.5043359873367174
371
+ rep_loss = 0.0
372
+ att_loss = 0.0
373
+ cls_loss = 0.27919509032905754
374
+ eval_loss = 0.4558627451911117
375
+ global_step = 5399
376
+ loss = 0.27919509032905754
377
+ mcc = 0.5203811415338604
378
+ rep_loss = 0.0
379
+ att_loss = 0.0
380
+ cls_loss = 0.2791919815044963
381
+ eval_loss = 0.47234560684724286
382
+ global_step = 5499
383
+ loss = 0.2791919815044963
384
+ mcc = 0.5050318665715698
385
+ rep_loss = 0.0
386
+ att_loss = 0.0
387
+ cls_loss = 0.27913230621648655
388
+ eval_loss = 0.4647821206035036
389
+ global_step = 5599
390
+ loss = 0.27913230621648655
391
+ mcc = 0.5309667017559951
392
+ rep_loss = 0.0
393
+ att_loss = 0.0
394
+ cls_loss = 0.2790925793400729
395
+ eval_loss = 0.46153073238604
396
+ global_step = 5699
397
+ loss = 0.2790925793400729
398
+ mcc = 0.5190273679468184
399
+ rep_loss = 0.0
400
+ att_loss = 0.0
401
+ cls_loss = 0.27906418180471865
402
+ eval_loss = 0.4553970116557497
403
+ global_step = 5799
404
+ loss = 0.27906418180471865
405
+ mcc = 0.5290221303314049
406
+ rep_loss = 0.0
407
+ att_loss = 0.0
408
+ cls_loss = 0.2789917427703554
409
+ eval_loss = 0.46314272465127887
410
+ global_step = 5899
411
+ loss = 0.2789917427703554
412
+ mcc = 0.5279776596624234
413
+ rep_loss = 0.0
414
+ att_loss = 0.0
415
+ cls_loss = 0.278957199890885
416
+ eval_loss = 0.45775021115938824
417
+ global_step = 5999
418
+ loss = 0.278957199890885
419
+ mcc = 0.518420673903781
420
+ rep_loss = 0.0
421
+ att_loss = 0.0
422
+ cls_loss = 0.2789460385597266
423
+ eval_loss = 0.45754783352216083
424
+ global_step = 6099
425
+ loss = 0.2789460385597266
426
+ mcc = 0.5120097095655185
427
+ rep_loss = 0.0
428
+ att_loss = 0.0
429
+ cls_loss = 0.27893527109097194
430
+ eval_loss = 0.4572519813523148
431
+ global_step = 6199
432
+ loss = 0.27893527109097194
433
+ mcc = 0.5067159264085137
434
+ rep_loss = 0.0
435
+ att_loss = 0.0
436
+ cls_loss = 0.27890371736703856
437
+ eval_loss = 0.4562020681121133
438
+ global_step = 6299
439
+ loss = 0.27890371736703856
440
+ mcc = 0.5159467834583324
441
+ rep_loss = 0.0
442
+ att_loss = 0.0
443
+ cls_loss = 0.27888854389163475
444
+ eval_loss = 0.4561521221290935
445
+ global_step = 6399
446
+ loss = 0.27888854389163475
447
+ mcc = 0.5068496037498794
448
+ rep_loss = 0.0
449
+ att_loss = 0.0
450
+ cls_loss = 0.2788673949335186
451
+ eval_loss = 0.45499569538867835
452
+ global_step = 6499
453
+ loss = 0.2788673949335186
454
+ mcc = 0.5248136238117787
455
+ rep_loss = 0.0
456
+ att_loss = 0.0
457
+ cls_loss = 0.2757796198129654
458
+ eval_loss = 0.4573383358391849
459
+ global_step = 6599
460
+ loss = 0.2757796198129654
461
+ mcc = 0.526358024246533
462
+ rep_loss = 0.0
463
+ att_loss = 0.0
464
+ cls_loss = 0.27811965489616763
465
+ eval_loss = 0.464380630941102
466
+ global_step = 6699
467
+ loss = 0.27811965489616763
468
+ mcc = 0.5061972812614249
469
+ rep_loss = 0.0
470
+ att_loss = 0.0
471
+ cls_loss = 0.27816279437027724
472
+ eval_loss = 0.45742737885677454
473
+ global_step = 6799
474
+ loss = 0.27816279437027724
475
+ mcc = 0.5094661687755515
476
+ rep_loss = 0.0
477
+ att_loss = 0.0
478
+ cls_loss = 0.27831977841101196
479
+ eval_loss = 0.4616742395993435
480
+ global_step = 6899
481
+ loss = 0.27831977841101196
482
+ mcc = 0.5168700801849877
483
+ rep_loss = 0.0
484
+ att_loss = 0.0
485
+ cls_loss = 0.2787469409332417
486
+ eval_loss = 0.46456035791021405
487
+ global_step = 6999
488
+ loss = 0.2787469409332417
489
+ mcc = 0.5087627070614528
490
+ rep_loss = 0.0
491
+ att_loss = 0.0
492
+ cls_loss = 0.2783590109930152
493
+ eval_loss = 0.4590166509151459
494
+ global_step = 7099
495
+ loss = 0.2783590109930152
496
+ mcc = 0.5003981004491761
497
+ rep_loss = 0.0
498
+ att_loss = 0.0
499
+ cls_loss = 0.2783066115730646
500
+ eval_loss = 0.46331078265652514
501
+ global_step = 7199
502
+ loss = 0.2783066115730646
503
+ mcc = 0.515768451621402
504
+ rep_loss = 0.0
505
+ att_loss = 0.0
506
+ cls_loss = 0.27824770591475745
507
+ eval_loss = 0.46015787756804266
508
+ global_step = 7299
509
+ loss = 0.27824770591475745
510
+ mcc = 0.5237298450652518
511
+ rep_loss = 0.0
512
+ att_loss = 0.0
513
+ cls_loss = 0.2780952813910015
514
+ eval_loss = 0.4625533123811086
515
+ global_step = 7399
516
+ loss = 0.2780952813910015
517
+ mcc = 0.5034296190683365
518
+ rep_loss = 0.0
519
+ att_loss = 0.0
520
+ cls_loss = 0.278015139422058
521
+ eval_loss = 0.4528456592198574
522
+ global_step = 7499
523
+ loss = 0.278015139422058
524
+ mcc = 0.5217876741934422
525
+ rep_loss = 0.0
526
+ att_loss = 0.0
527
+ cls_loss = 0.277956866410624
528
+ eval_loss = 0.4593150651816166
529
+ global_step = 7599
530
+ loss = 0.277956866410624
531
+ mcc = 0.5251026682217866
532
+ rep_loss = 0.0
533
+ att_loss = 0.0
534
+ cls_loss = 0.2779009008537168
535
+ eval_loss = 0.4646720245028987
536
+ global_step = 7699
537
+ loss = 0.2779009008537168
538
+ mcc = 0.5183921815500953
539
+ rep_loss = 0.0
540
+ att_loss = 0.0
541
+ cls_loss = 0.2779220149440821
542
+ eval_loss = 0.454393154743946
543
+ global_step = 7799
544
+ loss = 0.2779220149440821
545
+ mcc = 0.5041352192953922
546
+ rep_loss = 0.0
547
+ att_loss = 0.0
548
+ cls_loss = 0.2777234323528464
549
+ eval_loss = 0.45908459840398846
550
+ global_step = 7899
551
+ loss = 0.2777234323528464
552
+ mcc = 0.5020574037201646
553
+ rep_loss = 0.0
554
+ att_loss = 0.0
555
+ cls_loss = 0.2777911504767729
556
+ eval_loss = 0.4548939312949325
557
+ global_step = 7999
558
+ loss = 0.2777911504767729
559
+ mcc = 0.5196909986566013
560
+ rep_loss = 0.0
561
+ att_loss = 0.0
562
+ cls_loss = 0.27777142050933645
563
+ eval_loss = 0.4575051547903003
564
+ global_step = 8099
565
+ loss = 0.27777142050933645
566
+ mcc = 0.49580015034789016
567
+ rep_loss = 0.0
568
+ att_loss = 0.0
569
+ cls_loss = 0.27780618237103905
570
+ eval_loss = 0.4631824285695047
571
+ global_step = 8199
572
+ loss = 0.27780618237103905
573
+ mcc = 0.5155959050899789
574
+ rep_loss = 0.0
575
+ att_loss = 0.0
576
+ cls_loss = 0.27793682633326366
577
+ eval_loss = 0.465167505271507
578
+ global_step = 8299
579
+ loss = 0.27793682633326366
580
+ mcc = 0.51826530606729
581
+ rep_loss = 0.0
582
+ att_loss = 0.0
583
+ cls_loss = 0.27787920028929436
584
+ eval_loss = 0.4498411010612141
585
+ global_step = 8399
586
+ loss = 0.27787920028929436
587
+ mcc = 0.5065152939803185
588
+ rep_loss = 0.0
589
+ att_loss = 0.0
590
+ cls_loss = 0.2779220895403448
591
+ eval_loss = 0.45216559821909125
592
+ global_step = 8499
593
+ loss = 0.2779220895403448
594
+ mcc = 0.5080191328496129
595
+ rep_loss = 0.0
596
+ att_loss = 0.0
597
+ cls_loss = 0.2778555219416728
598
+ eval_loss = 0.4617597225940589
599
+ global_step = 8599
600
+ loss = 0.2778555219416728
601
+ mcc = 0.5083999234602438
602
+ rep_loss = 0.0
603
+ att_loss = 0.0
604
+ cls_loss = 0.2777616101115262
605
+ eval_loss = 0.4578354196114974
606
+ global_step = 8699
607
+ loss = 0.2777616101115262
608
+ mcc = 0.5031704769687771
609
+ rep_loss = 0.0
610
+ att_loss = 0.0
611
+ cls_loss = 0.27773835413333725
612
+ eval_loss = 0.4657824310389432
613
+ global_step = 8799
614
+ loss = 0.27773835413333725
615
+ mcc = 0.4881240673260976
616
+ rep_loss = 0.0
617
+ att_loss = 0.0
618
+ cls_loss = 0.2777370062798986
619
+ eval_loss = 0.45953314503033954
620
+ global_step = 8899
621
+ loss = 0.2777370062798986
622
+ mcc = 0.5153769103822675
623
+ rep_loss = 0.0
624
+ att_loss = 0.0
625
+ cls_loss = 0.277684324152904
626
+ eval_loss = 0.45517356648589624
627
+ global_step = 8999
628
+ loss = 0.277684324152904
629
+ mcc = 0.5163748285133078
630
+ rep_loss = 0.0
631
+ att_loss = 0.0
632
+ cls_loss = 0.27766840475888105
633
+ eval_loss = 0.457070403026812
634
+ global_step = 9099
635
+ loss = 0.27766840475888105
636
+ mcc = 0.51233675887833
637
+ rep_loss = 0.0
638
+ att_loss = 0.0
639
+ cls_loss = 0.2776113221802378
640
+ eval_loss = 0.45618007399819116
641
+ global_step = 9199
642
+ loss = 0.2776113221802378
643
+ mcc = 0.5248226674672084
644
+ rep_loss = 0.0
645
+ att_loss = 0.0
646
+ cls_loss = 0.2775809703416814
647
+ eval_loss = 0.45970096552010736
648
+ global_step = 9299
649
+ loss = 0.2775809703416814
650
+ mcc = 0.49818194163113544
651
+ rep_loss = 0.0
652
+ att_loss = 0.0
653
+ cls_loss = 0.2775813296447892
654
+ eval_loss = 0.4484571742288994
655
+ global_step = 9399
656
+ loss = 0.2775813296447892
657
+ mcc = 0.5353363425506695
658
+ rep_loss = 0.0
659
+ att_loss = 0.0
660
+ cls_loss = 0.2775996053032064
661
+ eval_loss = 0.45738490603186865
662
+ global_step = 9499
663
+ loss = 0.2775996053032064
664
+ mcc = 0.5274553187190298
665
+ rep_loss = 0.0
666
+ att_loss = 0.0
667
+ cls_loss = 0.2775802656899041
668
+ eval_loss = 0.45940391764496313
669
+ global_step = 9599
670
+ loss = 0.2775802656899041
671
+ mcc = 0.5309667017559951
672
+ rep_loss = 0.0
673
+ att_loss = 0.0
674
+ cls_loss = 0.2775419917792927
675
+ eval_loss = 0.45416359558249964
676
+ global_step = 9699
677
+ loss = 0.2775419917792927
678
+ mcc = 0.5168700801849877
679
+ rep_loss = 0.0
680
+ att_loss = 0.0
681
+ cls_loss = 0.2775549595470955
682
+ eval_loss = 0.45552727580070496
683
+ global_step = 9799
684
+ loss = 0.2775549595470955
685
+ mcc = 0.5302530461642105
686
+ rep_loss = 0.0
687
+ att_loss = 0.0
688
+ cls_loss = 0.2775005057643531
689
+ eval_loss = 0.4519644948569211
690
+ global_step = 9899
691
+ loss = 0.2775005057643531
692
+ mcc = 0.5375605063482544
693
+ rep_loss = 0.0
694
+ att_loss = 0.0
695
+ cls_loss = 0.2775091579102952
696
+ eval_loss = 0.45495487162561127
697
+ global_step = 9999
698
+ loss = 0.2775091579102952
699
+ mcc = 0.5290831606897504
700
+ rep_loss = 0.0
701
+ att_loss = 0.0
702
+ cls_loss = 0.2775382169535103
703
+ eval_loss = 0.45335144888270984
704
+ global_step = 10099
705
+ loss = 0.2775382169535103
706
+ mcc = 0.5212483689279175
707
+ rep_loss = 0.0
708
+ att_loss = 0.0
709
+ cls_loss = 0.2775139581126788
710
+ eval_loss = 0.4594464329156009
711
+ global_step = 10199
712
+ loss = 0.2775139581126788
713
+ mcc = 0.5374399947273891
714
+ rep_loss = 0.0
715
+ att_loss = 0.0
716
+ cls_loss = 0.2774607858602481
717
+ eval_loss = 0.45745504489450745
718
+ global_step = 10299
719
+ loss = 0.2774607858602481
720
+ mcc = 0.5371844138786498
721
+ rep_loss = 0.0
722
+ att_loss = 0.0
723
+ cls_loss = 0.27743388400594265
724
+ eval_loss = 0.45088858676679205
725
+ global_step = 10399
726
+ loss = 0.27743388400594265
727
+ mcc = 0.5347185537666785
728
+ rep_loss = 0.0
729
+ att_loss = 0.0
730
+ cls_loss = 0.27751540343017606
731
+ eval_loss = 0.46303236665147723
732
+ global_step = 10499
733
+ loss = 0.27751540343017606
734
+ mcc = 0.5330871284819242
735
+ rep_loss = 0.0
736
+ att_loss = 0.0
737
+ cls_loss = 0.27752122901506593
738
+ eval_loss = 0.45777365204059717
739
+ global_step = 10599
740
+ loss = 0.27752122901506593
741
+ mcc = 0.5201497752653439
742
+ rep_loss = 0.0
743
+ att_loss = 0.0
744
+ cls_loss = 0.2775007768753793
745
+ eval_loss = 0.4558024289030017
746
+ global_step = 10699
747
+ loss = 0.2775007768753793
748
+ mcc = 0.5228028383317379
749
+ rep_loss = 0.0
750
+ att_loss = 0.0
751
+ cls_loss = 0.2774832700614017
752
+ eval_loss = 0.4519307076027899
753
+ global_step = 10799
754
+ loss = 0.2774832700614017
755
+ mcc = 0.5190273679468184
756
+ rep_loss = 0.0
757
+ att_loss = 0.0
758
+ cls_loss = 0.2774546956747327
759
+ eval_loss = 0.45893278085824213
760
+ global_step = 10899
761
+ loss = 0.2774546956747327
762
+ mcc = 0.5297290847722776
763
+ rep_loss = 0.0
764
+ att_loss = 0.0
765
+ cls_loss = 0.27744613046488037
766
+ eval_loss = 0.45718637018492725
767
+ global_step = 10999
768
+ loss = 0.27744613046488037
769
+ mcc = 0.5184277879580146
770
+ rep_loss = 0.0
771
+ att_loss = 0.0
772
+ cls_loss = 0.2774493484948075
773
+ eval_loss = 0.45472668788649817
774
+ global_step = 11099
775
+ loss = 0.2774493484948075
776
+ mcc = 0.5355562155372715
777
+ rep_loss = 0.0
778
+ att_loss = 0.0
779
+ cls_loss = 0.2774652933344232
780
+ eval_loss = 0.4553719036506884
781
+ global_step = 11199
782
+ loss = 0.2774652933344232
783
+ mcc = 0.5297290847722776
784
+ rep_loss = 0.0
785
+ att_loss = 0.0
786
+ cls_loss = 0.2774399504838448
787
+ eval_loss = 0.45496712760491803
788
+ global_step = 11299
789
+ loss = 0.2774399504838448
790
+ mcc = 0.5357272816819911
791
+ rep_loss = 0.0
792
+ att_loss = 0.0
793
+ cls_loss = 0.27742566522536527
794
+ eval_loss = 0.4532328591202245
795
+ global_step = 11399
796
+ loss = 0.27742566522536527
797
+ mcc = 0.5302530461642105
798
+ rep_loss = 0.0
799
+ att_loss = 0.0
800
+ cls_loss = 0.2774223230147148
801
+ eval_loss = 0.4519491602074016
802
+ global_step = 11499
803
+ loss = 0.2774223230147148
804
+ mcc = 0.5166623535745778
805
+ rep_loss = 0.0
806
+ att_loss = 0.0
807
+ cls_loss = 0.27743097503098557
808
+ eval_loss = 0.4579541466452859
809
+ global_step = 11599
810
+ loss = 0.27743097503098557
811
+ mcc = 0.5281023217797143
812
+ rep_loss = 0.0
813
+ att_loss = 0.0
814
+ cls_loss = 0.27743173339243593
815
+ eval_loss = 0.4504963927196734
816
+ global_step = 11699
817
+ loss = 0.27743173339243593
818
+ mcc = 0.5290831606897504
819
+ rep_loss = 0.0
820
+ att_loss = 0.0
821
+ cls_loss = 0.27745687274361097
822
+ eval_loss = 0.44933091058875574
823
+ global_step = 11799
824
+ loss = 0.27745687274361097
825
+ mcc = 0.5347185537666785
826
+ rep_loss = 0.0
827
+ att_loss = 0.0
828
+ cls_loss = 0.27743749302526766
829
+ eval_loss = 0.448698260567405
830
+ global_step = 11899
831
+ loss = 0.27743749302526766
832
+ mcc = 0.5322060958308948
833
+ rep_loss = 0.0
834
+ att_loss = 0.0
835
+ cls_loss = 0.27743755156887095
836
+ eval_loss = 0.4573155262253501
837
+ global_step = 11999
838
+ loss = 0.27743755156887095
839
+ mcc = 0.5224496771410306
840
+ rep_loss = 0.0
841
+ att_loss = 0.0
842
+ cls_loss = 0.2774356068924156
843
+ eval_loss = 0.4552531224308592
844
+ global_step = 12099
845
+ loss = 0.2774356068924156
846
+ mcc = 0.5324104093270398
847
+ rep_loss = 0.0
848
+ att_loss = 0.0
849
+ cls_loss = 0.27742416586070123
850
+ eval_loss = 0.4579685023336699
851
+ global_step = 12199
852
+ loss = 0.27742416586070123
853
+ mcc = 0.5291785294213451
854
+ rep_loss = 0.0
855
+ att_loss = 0.0
856
+ cls_loss = 0.2774283394823569
857
+ eval_loss = 0.4494276660861391
858
+ global_step = 12299
859
+ loss = 0.2774283394823569
860
+ mcc = 0.5547015581596438
861
+ rep_loss = 0.0
862
+ att_loss = 0.0
863
+ cls_loss = 0.2774310273026533
864
+ eval_loss = 0.45670852155396435
865
+ global_step = 12399
866
+ loss = 0.2774310273026533
867
+ mcc = 0.5395175517784774
868
+ rep_loss = 0.0
869
+ att_loss = 0.0
870
+ cls_loss = 0.2773878394997096
871
+ eval_loss = 0.4560541799574187
872
+ global_step = 12499
873
+ loss = 0.2773878394997096
874
+ mcc = 0.5315672216228357
875
+ rep_loss = 0.0
876
+ att_loss = 0.0
877
+ cls_loss = 0.2774021773165381
878
+ eval_loss = 0.45269398255781695
879
+ global_step = 12599
880
+ loss = 0.2774021773165381
881
+ mcc = 0.5231821039975777
882
+ rep_loss = 0.0
883
+ att_loss = 0.0
884
+ cls_loss = 0.2773917444309081
885
+ eval_loss = 0.4570877570094484
886
+ global_step = 12699
887
+ loss = 0.2773917444309081
888
+ mcc = 0.5369793883294685
889
+ rep_loss = 0.0
890
+ att_loss = 0.0
891
+ cls_loss = 0.2773833233024865
892
+ eval_loss = 0.45557611458229297
893
+ global_step = 12799
894
+ loss = 0.2773833233024865
895
+ mcc = 0.5312319613383731
896
+ rep_loss = 0.0
897
+ att_loss = 0.0
898
+ cls_loss = 0.2773907062796129
899
+ eval_loss = 0.45298474394913874
900
+ global_step = 12899
901
+ loss = 0.2773907062796129
902
+ mcc = 0.5279435340913744
903
+ rep_loss = 0.0
904
+ att_loss = 0.0
905
+ cls_loss = 0.27739593593739925
906
+ eval_loss = 0.4516429973371101
907
+ global_step = 12999
908
+ loss = 0.27739593593739925
909
+ mcc = 0.5455569520342612
910
+ rep_loss = 0.0
911
+ att_loss = 0.0
912
+ cls_loss = 0.2773754865453472
913
+ eval_loss = 0.451772644664302
914
+ global_step = 13099
915
+ loss = 0.2773754865453472
916
+ mcc = 0.5447721171016089
917
+ rep_loss = 0.0
918
+ att_loss = 0.0
919
+ cls_loss = 0.278318057457606
920
+ eval_loss = 0.4590268884644364
921
+ global_step = 13199
922
+ loss = 0.278318057457606
923
+ mcc = 0.5356489226051415
924
+ rep_loss = 0.0
925
+ att_loss = 0.0
926
+ cls_loss = 0.27664143721991724
927
+ eval_loss = 0.45668373776204657
928
+ global_step = 13299
929
+ loss = 0.27664143721991724
930
+ mcc = 0.5395175517784774
931
+ rep_loss = 0.0
932
+ att_loss = 0.0
933
+ cls_loss = 0.27545882497677965
934
+ eval_loss = 0.4490573957110896
935
+ global_step = 13399
936
+ loss = 0.27545882497677965
937
+ mcc = 0.5496207419670193
938
+ rep_loss = 0.0
939
+ att_loss = 0.0
940
+ cls_loss = 0.2757971603121958
941
+ eval_loss = 0.45480099681651953
942
+ global_step = 13499
943
+ loss = 0.2757971603121958
944
+ mcc = 0.5348097624143603
945
+ rep_loss = 0.0
946
+ att_loss = 0.0
947
+ cls_loss = 0.27587504841587657
948
+ eval_loss = 0.45544032255808514
949
+ global_step = 13599
950
+ loss = 0.27587504841587657
951
+ mcc = 0.5254536736633585
952
+ rep_loss = 0.0
953
+ att_loss = 0.0
954
+ cls_loss = 0.2759395760204094
955
+ eval_loss = 0.456780217813723
956
+ global_step = 13699
957
+ loss = 0.2759395760204094
958
+ mcc = 0.5281023217797143
959
+ rep_loss = 0.0
960
+ att_loss = 0.0
961
+ cls_loss = 0.2761271443028364
962
+ eval_loss = 0.4568403245824756
963
+ global_step = 13799
964
+ loss = 0.2761271443028364
965
+ mcc = 0.5270843127054785
966
+ rep_loss = 0.0
967
+ att_loss = 0.0
968
+ cls_loss = 0.2763089490752294
969
+ eval_loss = 0.45502680359464703
970
+ global_step = 13899
971
+ loss = 0.2763089490752294
972
+ mcc = 0.5302530461642105
973
+ rep_loss = 0.0
974
+ att_loss = 0.0
975
+ cls_loss = 0.2763681988449415
976
+ eval_loss = 0.4561975769924395
977
+ global_step = 13999
978
+ loss = 0.2763681988449415
979
+ mcc = 0.5316647141164849
980
+ rep_loss = 0.0
981
+ att_loss = 0.0
982
+ cls_loss = 0.2764051501998807
983
+ eval_loss = 0.45802293582396075
984
+ global_step = 14099
985
+ loss = 0.2764051501998807
986
+ mcc = 0.5403061957257674
987
+ rep_loss = 0.0
988
+ att_loss = 0.0
989
+ cls_loss = 0.2763773106164101
990
+ eval_loss = 0.45300981312087085
991
+ global_step = 14199
992
+ loss = 0.2763773106164101
993
+ mcc = 0.5274553187190298
994
+ rep_loss = 0.0
995
+ att_loss = 0.0
996
+ cls_loss = 0.27634809661330784
997
+ eval_loss = 0.45622625856688526
998
+ global_step = 14299
999
+ loss = 0.27634809661330784
1000
+ mcc = 0.5183921815500953
1001
+ rep_loss = 0.0
1002
+ att_loss = 0.0
1003
+ cls_loss = 0.27630603134730713
1004
+ eval_loss = 0.45476906317653076
1005
+ global_step = 14399
1006
+ loss = 0.27630603134730713
1007
+ mcc = 0.5318161795948887
1008
+ rep_loss = 0.0
1009
+ att_loss = 0.0
1010
+ cls_loss = 0.2763643769406471
1011
+ eval_loss = 0.45554043939619354
1012
+ global_step = 14499
1013
+ loss = 0.2763643769406471
1014
+ mcc = 0.5276117265770821
1015
+ rep_loss = 0.0
1016
+ att_loss = 0.0
1017
+ cls_loss = 0.2765032273920146
1018
+ eval_loss = 0.45379058700619324
1019
+ global_step = 14599
1020
+ loss = 0.2765032273920146
1021
+ mcc = 0.5106329014613062
1022
+ rep_loss = 0.0
1023
+ att_loss = 0.0
1024
+ cls_loss = 0.2764957464535241
1025
+ eval_loss = 0.45894434145002655
1026
+ global_step = 14699
1027
+ loss = 0.2764957464535241
1028
+ mcc = 0.5171981604121658
1029
+ rep_loss = 0.0
1030
+ att_loss = 0.0
1031
+ cls_loss = 0.27650387620355416
1032
+ eval_loss = 0.4566023765188275
1033
+ global_step = 14799
1034
+ loss = 0.27650387620355416
1035
+ mcc = 0.5322060958308948
1036
+ rep_loss = 0.0
1037
+ att_loss = 0.0
1038
+ cls_loss = 0.2765135073292109
1039
+ eval_loss = 0.4491843418641524
1040
+ global_step = 14899
1041
+ loss = 0.2765135073292109
1042
+ mcc = 0.5376769315385652
1043
+ rep_loss = 0.0
1044
+ att_loss = 0.0
1045
+ cls_loss = 0.27645776300979885
1046
+ eval_loss = 0.459045028144663
1047
+ global_step = 14999
1048
+ loss = 0.27645776300979885
1049
+ mcc = 0.5163630963192842
1050
+ rep_loss = 0.0
1051
+ att_loss = 0.0
1052
+ cls_loss = 0.2765224870350924
1053
+ eval_loss = 0.45438164382269886
1054
+ global_step = 15099
1055
+ loss = 0.2765224870350924
1056
+ mcc = 0.5276117265770821
1057
+ rep_loss = 0.0
1058
+ att_loss = 0.0
1059
+ cls_loss = 0.27655044160950176
1060
+ eval_loss = 0.45653185880545416
1061
+ global_step = 15199
1062
+ loss = 0.27655044160950176
1063
+ mcc = 0.5316647141164849
1064
+ rep_loss = 0.0
1065
+ att_loss = 0.0
1066
+ cls_loss = 0.276501307121777
1067
+ eval_loss = 0.45656741749156604
1068
+ global_step = 15299
1069
+ loss = 0.276501307121777
1070
+ mcc = 0.5276117265770821
1071
+ rep_loss = 0.0
1072
+ att_loss = 0.0
1073
+ cls_loss = 0.2765050630943977
1074
+ eval_loss = 0.45284795941728534
1075
+ global_step = 15399
1076
+ loss = 0.2765050630943977
1077
+ mcc = 0.5315672216228357
1078
+ rep_loss = 0.0
1079
+ att_loss = 0.0
1080
+ cls_loss = 0.2764615254801762
1081
+ eval_loss = 0.46013957171729114
1082
+ global_step = 15499
1083
+ loss = 0.2764615254801762
1084
+ mcc = 0.5266763751215275
1085
+ rep_loss = 0.0
1086
+ att_loss = 0.0
1087
+ cls_loss = 0.27637805436200846
1088
+ eval_loss = 0.452160148006497
1089
+ global_step = 15599
1090
+ loss = 0.27637805436200846
1091
+ mcc = 0.5191953567121099
1092
+ rep_loss = 0.0
1093
+ att_loss = 0.0
1094
+ cls_loss = 0.2763865352175824
1095
+ eval_loss = 0.4566154796065706
1096
+ global_step = 15699
1097
+ loss = 0.2763865352175824
1098
+ mcc = 0.5291785294213451
1099
+ rep_loss = 0.0
1100
+ att_loss = 0.0
1101
+ cls_loss = 0.27636008938412504
1102
+ eval_loss = 0.4549913090286833
1103
+ global_step = 15799
1104
+ loss = 0.27636008938412504
1105
+ mcc = 0.5190097111686822
1106
+ rep_loss = 0.0
1107
+ att_loss = 0.0
1108
+ cls_loss = 0.27635927772821206
1109
+ eval_loss = 0.45468395858099964
1110
+ global_step = 15899
1111
+ loss = 0.27635927772821206
1112
+ mcc = 0.5176740389815154
1113
+ rep_loss = 0.0
1114
+ att_loss = 0.0
1115
+ cls_loss = 0.2763913096525186
1116
+ eval_loss = 0.45687262668754114
1117
+ global_step = 15999
1118
+ loss = 0.2763913096525186
1119
+ mcc = 0.5379646517492308
1120
+ rep_loss = 0.0
1121
+ att_loss = 0.0
1122
+ cls_loss = 0.27635131174959077
1123
+ eval_loss = 0.4549617071946462
1124
+ global_step = 16099
1125
+ loss = 0.27635131174959077
1126
+ mcc = 0.5200867163616212
1127
+ rep_loss = 0.0
1128
+ att_loss = 0.0
1129
+ cls_loss = 0.27639669551826385
1130
+ eval_loss = 0.45427083336945734
1131
+ global_step = 16199
1132
+ loss = 0.27639669551826385
1133
+ mcc = 0.5185990890831609
1134
+ rep_loss = 0.0
1135
+ att_loss = 0.0
1136
+ cls_loss = 0.27637253505177495
1137
+ eval_loss = 0.4564370702613484
1138
+ global_step = 16299
1139
+ loss = 0.27637253505177495
1140
+ mcc = 0.5276346700087589
1141
+ rep_loss = 0.0
1142
+ att_loss = 0.0
1143
+ cls_loss = 0.27633983237177234
1144
+ eval_loss = 0.4526894535079147
1145
+ global_step = 16399
1146
+ loss = 0.27633983237177234
1147
+ mcc = 0.5318161795948887
1148
+ rep_loss = 0.0
1149
+ att_loss = 0.0
1150
+ cls_loss = 0.2763634096796183
1151
+ eval_loss = 0.4523286151163506
1152
+ global_step = 16499
1153
+ loss = 0.2763634096796183
1154
+ mcc = 0.5344510385480925
1155
+ rep_loss = 0.0
1156
+ att_loss = 0.0
1157
+ cls_loss = 0.2763351077740057
1158
+ eval_loss = 0.45641895496484003
1159
+ global_step = 16599
1160
+ loss = 0.2763351077740057
1161
+ mcc = 0.524327905037375
1162
+ rep_loss = 0.0
1163
+ att_loss = 0.0
1164
+ cls_loss = 0.27630653749354106
1165
+ eval_loss = 0.45319110335725726
1166
+ global_step = 16699
1167
+ loss = 0.27630653749354106
1168
+ mcc = 0.5338113857914387
1169
+ rep_loss = 0.0
1170
+ att_loss = 0.0
1171
+ cls_loss = 0.27626817112535146
1172
+ eval_loss = 0.45247378132560034
1173
+ global_step = 16799
1174
+ loss = 0.27626817112535146
1175
+ mcc = 0.5309667017559951
1176
+ rep_loss = 0.0
1177
+ att_loss = 0.0
1178
+ cls_loss = 0.276290586126336
1179
+ eval_loss = 0.45359588301543036
1180
+ global_step = 16899
1181
+ loss = 0.276290586126336
1182
+ mcc = 0.5408255169384978
1183
+ rep_loss = 0.0
1184
+ att_loss = 0.0
1185
+ cls_loss = 0.2762416014914814
1186
+ eval_loss = 0.4515194757418199
1187
+ global_step = 16999
1188
+ loss = 0.2762416014914814
1189
+ mcc = 0.5364994308218176
1190
+ rep_loss = 0.0
1191
+ att_loss = 0.0
1192
+ cls_loss = 0.2762412506697214
1193
+ eval_loss = 0.4490665648922776
1194
+ global_step = 17099
1195
+ loss = 0.2762412506697214
1196
+ mcc = 0.528019541905275
1197
+ rep_loss = 0.0
1198
+ att_loss = 0.0
1199
+ cls_loss = 0.2762108766161376
1200
+ eval_loss = 0.45332705523028516
1201
+ global_step = 17199
1202
+ loss = 0.2762108766161376
1203
+ mcc = 0.5348763506104023
1204
+ rep_loss = 0.0
1205
+ att_loss = 0.0
1206
+ cls_loss = 0.2761994298718857
1207
+ eval_loss = 0.45431061856674426
1208
+ global_step = 17299
1209
+ loss = 0.2761994298718857
1210
+ mcc = 0.5395175517784774
1211
+ rep_loss = 0.0
1212
+ att_loss = 0.0
1213
+ cls_loss = 0.27617793641214444
1214
+ eval_loss = 0.4537888720180049
1215
+ global_step = 17399
1216
+ loss = 0.27617793641214444
1217
+ mcc = 0.5290221303314049
1218
+ rep_loss = 0.0
1219
+ att_loss = 0.0
1220
+ cls_loss = 0.2761897478580309
1221
+ eval_loss = 0.45442140915177087
1222
+ global_step = 17499
1223
+ loss = 0.2761897478580309
1224
+ mcc = 0.5276346700087589
1225
+ rep_loss = 0.0
1226
+ att_loss = 0.0
1227
+ cls_loss = 0.2761933956625619
1228
+ eval_loss = 0.4552511428341721
1229
+ global_step = 17599
1230
+ loss = 0.2761933956625619
1231
+ mcc = 0.5223414189412047
1232
+ rep_loss = 0.0
1233
+ att_loss = 0.0
1234
+ cls_loss = 0.27616957312850104
1235
+ eval_loss = 0.453849631728548
1236
+ global_step = 17699
1237
+ loss = 0.27616957312850104
1238
+ mcc = 0.5394751143865678
1239
+ rep_loss = 0.0
1240
+ att_loss = 0.0
1241
+ cls_loss = 0.2761757420592154
1242
+ eval_loss = 0.45676823276461975
1243
+ global_step = 17799
1244
+ loss = 0.2761757420592154
1245
+ mcc = 0.5263771879747187
1246
+ rep_loss = 0.0
1247
+ att_loss = 0.0
1248
+ cls_loss = 0.2761607745487894
1249
+ eval_loss = 0.4525405850374337
1250
+ global_step = 17899
1251
+ loss = 0.2761607745487894
1252
+ mcc = 0.5249677896757049
1253
+ rep_loss = 0.0
1254
+ att_loss = 0.0
1255
+ cls_loss = 0.2761404152210499
1256
+ eval_loss = 0.4527777406302365
1257
+ global_step = 17999
1258
+ loss = 0.2761404152210499
1259
+ mcc = 0.5302530461642105
1260
+ rep_loss = 0.0
1261
+ att_loss = 0.0
1262
+ cls_loss = 0.2761837591353199
1263
+ eval_loss = 0.4547244626464266
1264
+ global_step = 18099
1265
+ loss = 0.2761837591353199
1266
+ mcc = 0.5315672216228357
1267
+ rep_loss = 0.0
1268
+ att_loss = 0.0
1269
+ cls_loss = 0.27617460252472825
1270
+ eval_loss = 0.45115146040916443
1271
+ global_step = 18199
1272
+ loss = 0.27617460252472825
1273
+ mcc = 0.5263343763638897
1274
+ rep_loss = 0.0
1275
+ att_loss = 0.0
1276
+ cls_loss = 0.2761623841555624
1277
+ eval_loss = 0.45427156668720825
1278
+ global_step = 18299
1279
+ loss = 0.2761623841555624
1280
+ mcc = 0.5350117423563097
1281
+ rep_loss = 0.0
1282
+ att_loss = 0.0
1283
+ cls_loss = 0.2761950084643163
1284
+ eval_loss = 0.454286765871626
1285
+ global_step = 18399
1286
+ loss = 0.2761950084643163
1287
+ mcc = 0.5355562155372715
1288
+ rep_loss = 0.0
1289
+ att_loss = 0.0
1290
+ cls_loss = 0.2761831375182427
1291
+ eval_loss = 0.45068027395190613
1292
+ global_step = 18499
1293
+ loss = 0.2761831375182427
1294
+ mcc = 0.5408255169384978
1295
+ rep_loss = 0.0
1296
+ att_loss = 0.0
1297
+ cls_loss = 0.27621336098099886
1298
+ eval_loss = 0.4529677299839078
1299
+ global_step = 18599
1300
+ loss = 0.27621336098099886
1301
+ mcc = 0.5394751143865678
1302
+ rep_loss = 0.0
1303
+ att_loss = 0.0
1304
+ cls_loss = 0.2762250059917718
1305
+ eval_loss = 0.45488957564036053
1306
+ global_step = 18699
1307
+ loss = 0.2762250059917718
1308
+ mcc = 0.538880877181237
1309
+ rep_loss = 0.0
1310
+ att_loss = 0.0
1311
+ cls_loss = 0.27622369788806267
1312
+ eval_loss = 0.4533221423625946
1313
+ global_step = 18799
1314
+ loss = 0.27622369788806267
1315
+ mcc = 0.540145729318548
1316
+ rep_loss = 0.0
1317
+ att_loss = 0.0
1318
+ cls_loss = 0.27624025213194303
1319
+ eval_loss = 0.4541215788234364
1320
+ global_step = 18899
1321
+ loss = 0.27624025213194303
1322
+ mcc = 0.542106330857015
1323
+ rep_loss = 0.0
1324
+ att_loss = 0.0
1325
+ cls_loss = 0.27623185721131605
1326
+ eval_loss = 0.45452457576087024
1327
+ global_step = 18999
1328
+ loss = 0.27623185721131605
1329
+ mcc = 0.540145729318548
1330
+ rep_loss = 0.0
1331
+ att_loss = 0.0
1332
+ cls_loss = 0.27624673165732744
1333
+ eval_loss = 0.454106766166109
1334
+ global_step = 19099
1335
+ loss = 0.27624673165732744
1336
+ mcc = 0.5375122094090742
1337
+ rep_loss = 0.0
1338
+ att_loss = 0.0
1339
+ cls_loss = 0.27626025659864606
1340
+ eval_loss = 0.453075953505256
1341
+ global_step = 19199
1342
+ loss = 0.27626025659864606
1343
+ mcc = 0.5342056019086159
1344
+ rep_loss = 0.0
1345
+ att_loss = 0.0
1346
+ cls_loss = 0.27623782110674755
1347
+ eval_loss = 0.453053484360377
1348
+ global_step = 19299
1349
+ loss = 0.27623782110674755
1350
+ mcc = 0.5335440534839315
1351
+ rep_loss = 0.0
1352
+ att_loss = 0.0
1353
+ cls_loss = 0.27621929033364356
1354
+ eval_loss = 0.45425386320460925
1355
+ global_step = 19399
1356
+ loss = 0.27621929033364356
1357
+ mcc = 0.540145729318548
1358
+ rep_loss = 0.0
1359
+ att_loss = 0.0
1360
+ cls_loss = 0.2762047120405842
1361
+ eval_loss = 0.4529296936410846
1362
+ global_step = 19499
1363
+ loss = 0.2762047120405842
1364
+ mcc = 0.5368415520595031
1365
+ rep_loss = 0.0
1366
+ att_loss = 0.0
1367
+ cls_loss = 0.27618440176101794
1368
+ eval_loss = 0.45266035424940515
1369
+ global_step = 19599
1370
+ loss = 0.27618440176101794
1371
+ mcc = 0.5368415520595031
1372
+ rep_loss = 0.0
1373
+ att_loss = 0.0
1374
+ cls_loss = 0.27617881076093054
1375
+ eval_loss = 0.4528392625577522
1376
+ global_step = 19699
1377
+ loss = 0.27617881076093054
1378
+ mcc = 0.5368415520595031
1379
+ rep_loss = 0.0
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffc37fbbb654c9ae257be69362d40fb94e7e28ecbcd7847abc2dd6fe1c322cf7
3
+ size 270223951
vocab.txt ADDED
The diff for this file is too large to render. See raw diff