takedarn commited on
Commit
c90bc04
·
verified ·
1 Parent(s): b94f288

Upload folder using huggingface_hub

Browse files
Files changed (4) hide show
  1. config.json +29 -0
  2. eval_results.txt +1379 -0
  3. pytorch_model.bin +3 -0
  4. vocab.txt +0 -0
config.json ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "BertForSequenceClassification"
4
+ ],
5
+ "attention_probs_dropout_prob": 0.1,
6
+ "cell": {},
7
+ "classifier_dropout": null,
8
+ "dtype": "float32",
9
+ "emb_size": 312,
10
+ "hidden_act": "gelu",
11
+ "hidden_dropout_prob": 0.1,
12
+ "hidden_size": 312,
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 1200,
15
+ "layer_norm_eps": 1e-12,
16
+ "max_position_embeddings": 512,
17
+ "model_type": "bert",
18
+ "num_attention_heads": 12,
19
+ "num_hidden_layers": 4,
20
+ "pad_token_id": 0,
21
+ "position_embedding_type": "absolute",
22
+ "pre_trained": "",
23
+ "structure": [],
24
+ "training": "",
25
+ "transformers_version": "4.57.0",
26
+ "type_vocab_size": 2,
27
+ "use_cache": true,
28
+ "vocab_size": 30522
29
+ }
eval_results.txt ADDED
@@ -0,0 +1,1379 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ att_loss = 0.0
2
+ cls_loss = 0.34237186716060447
3
+ eval_loss = 0.6603382482673182
4
+ global_step = 99
5
+ loss = 0.34237186716060447
6
+ mcc = 0.3702633409778515
7
+ rep_loss = 0.0
8
+ att_loss = 0.0
9
+ cls_loss = 0.33177106344520146
10
+ eval_loss = 0.5872409325657468
11
+ global_step = 199
12
+ loss = 0.33177106344520146
13
+ mcc = 0.3709803389600345
14
+ rep_loss = 0.0
15
+ att_loss = 0.0
16
+ cls_loss = 0.3205442242199761
17
+ eval_loss = 0.5501694516702131
18
+ global_step = 299
19
+ loss = 0.3205442242199761
20
+ mcc = 0.3632136143179997
21
+ rep_loss = 0.0
22
+ att_loss = 0.0
23
+ cls_loss = 0.3123153758078888
24
+ eval_loss = 0.53216142726667
25
+ global_step = 399
26
+ loss = 0.3123153758078888
27
+ mcc = 0.37663386957262124
28
+ rep_loss = 0.0
29
+ att_loss = 0.0
30
+ cls_loss = 0.30697973977348847
31
+ eval_loss = 0.5267899740826
32
+ global_step = 499
33
+ loss = 0.30697973977348847
34
+ mcc = 0.3892560665897791
35
+ rep_loss = 0.0
36
+ att_loss = 0.0
37
+ cls_loss = 0.30355875838380025
38
+ eval_loss = 0.5238304472330845
39
+ global_step = 599
40
+ loss = 0.30355875838380025
41
+ mcc = 0.3877546380385484
42
+ rep_loss = 0.0
43
+ att_loss = 0.0
44
+ cls_loss = 0.30093799652971426
45
+ eval_loss = 0.5212509063157168
46
+ global_step = 699
47
+ loss = 0.30093799652971426
48
+ mcc = 0.38221460495175935
49
+ rep_loss = 0.0
50
+ att_loss = 0.0
51
+ cls_loss = 0.298923846292257
52
+ eval_loss = 0.5149777947050153
53
+ global_step = 799
54
+ loss = 0.298923846292257
55
+ mcc = 0.38899362002004945
56
+ rep_loss = 0.0
57
+ att_loss = 0.0
58
+ cls_loss = 0.29705169435602935
59
+ eval_loss = 0.5193736670595227
60
+ global_step = 899
61
+ loss = 0.29705169435602935
62
+ mcc = 0.39097174554766484
63
+ rep_loss = 0.0
64
+ att_loss = 0.0
65
+ cls_loss = 0.29570507263397433
66
+ eval_loss = 0.5197603810917247
67
+ global_step = 999
68
+ loss = 0.29570507263397433
69
+ mcc = 0.37330557017038596
70
+ rep_loss = 0.0
71
+ att_loss = 0.0
72
+ cls_loss = 0.29460890394541434
73
+ eval_loss = 0.5279499075629495
74
+ global_step = 1099
75
+ loss = 0.29460890394541434
76
+ mcc = 0.37165225479127123
77
+ rep_loss = 0.0
78
+ att_loss = 0.0
79
+ cls_loss = 0.29367289988571055
80
+ eval_loss = 0.5174163525754755
81
+ global_step = 1199
82
+ loss = 0.29367289988571055
83
+ mcc = 0.37827883919891614
84
+ rep_loss = 0.0
85
+ att_loss = 0.0
86
+ cls_loss = 0.2929169338101878
87
+ eval_loss = 0.5223202154491887
88
+ global_step = 1299
89
+ loss = 0.2929169338101878
90
+ mcc = 0.37061285503044555
91
+ rep_loss = 0.0
92
+ att_loss = 0.0
93
+ cls_loss = 0.2922824918371682
94
+ eval_loss = 0.5192791611859293
95
+ global_step = 1399
96
+ loss = 0.2922824918371682
97
+ mcc = 0.3840054310253403
98
+ rep_loss = 0.0
99
+ att_loss = 0.0
100
+ cls_loss = 0.2917452016180559
101
+ eval_loss = 0.5148796357891776
102
+ global_step = 1499
103
+ loss = 0.2917452016180559
104
+ mcc = 0.38833086918437604
105
+ rep_loss = 0.0
106
+ att_loss = 0.0
107
+ cls_loss = 0.29132951364582815
108
+ eval_loss = 0.5153409513560209
109
+ global_step = 1599
110
+ loss = 0.29132951364582815
111
+ mcc = 0.41927013804892227
112
+ rep_loss = 0.0
113
+ att_loss = 0.0
114
+ cls_loss = 0.2909143878264312
115
+ eval_loss = 0.5176202645807555
116
+ global_step = 1699
117
+ loss = 0.2909143878264312
118
+ mcc = 0.39895365254134896
119
+ rep_loss = 0.0
120
+ att_loss = 0.0
121
+ cls_loss = 0.29057640186808653
122
+ eval_loss = 0.519390397902691
123
+ global_step = 1799
124
+ loss = 0.29057640186808653
125
+ mcc = 0.3840013666665939
126
+ rep_loss = 0.0
127
+ att_loss = 0.0
128
+ cls_loss = 0.290319570432907
129
+ eval_loss = 0.5133328392650142
130
+ global_step = 1899
131
+ loss = 0.290319570432907
132
+ mcc = 0.4069899871395845
133
+ rep_loss = 0.0
134
+ att_loss = 0.0
135
+ cls_loss = 0.2900308165000402
136
+ eval_loss = 0.5166239133386901
137
+ global_step = 1999
138
+ loss = 0.2900308165000402
139
+ mcc = 0.3819485378858301
140
+ rep_loss = 0.0
141
+ att_loss = 0.0
142
+ cls_loss = 0.28977794074171664
143
+ eval_loss = 0.5148214986830046
144
+ global_step = 2099
145
+ loss = 0.28977794074171664
146
+ mcc = 0.40458001224586415
147
+ rep_loss = 0.0
148
+ att_loss = 0.0
149
+ cls_loss = 0.28947624005800815
150
+ eval_loss = 0.514714679031661
151
+ global_step = 2199
152
+ loss = 0.28947624005800815
153
+ mcc = 0.4026106243439989
154
+ rep_loss = 0.0
155
+ att_loss = 0.0
156
+ cls_loss = 0.28915125764857796
157
+ eval_loss = 0.5223394650401492
158
+ global_step = 2299
159
+ loss = 0.28915125764857796
160
+ mcc = 0.39895365254134896
161
+ rep_loss = 0.0
162
+ att_loss = 0.0
163
+ cls_loss = 0.28900953685059655
164
+ eval_loss = 0.5247616054433765
165
+ global_step = 2399
166
+ loss = 0.28900953685059655
167
+ mcc = 0.38731511142125435
168
+ rep_loss = 0.0
169
+ att_loss = 0.0
170
+ cls_loss = 0.28884948732233756
171
+ eval_loss = 0.525927048740965
172
+ global_step = 2499
173
+ loss = 0.28884948732233756
174
+ mcc = 0.3804125081494791
175
+ rep_loss = 0.0
176
+ att_loss = 0.0
177
+ cls_loss = 0.28874072126353323
178
+ eval_loss = 0.5305289842865684
179
+ global_step = 2599
180
+ loss = 0.28874072126353323
181
+ mcc = 0.36894282240349613
182
+ rep_loss = 0.0
183
+ att_loss = 0.0
184
+ cls_loss = 0.2885687179192652
185
+ eval_loss = 0.5217124169523065
186
+ global_step = 2699
187
+ loss = 0.2885687179192652
188
+ mcc = 0.35918776049405
189
+ rep_loss = 0.0
190
+ att_loss = 0.0
191
+ cls_loss = 0.2884783570299663
192
+ eval_loss = 0.5284617434848439
193
+ global_step = 2799
194
+ loss = 0.2884783570299663
195
+ mcc = 0.3803392011836776
196
+ rep_loss = 0.0
197
+ att_loss = 0.0
198
+ cls_loss = 0.2883057665027146
199
+ eval_loss = 0.5248655911647913
200
+ global_step = 2899
201
+ loss = 0.2883057665027146
202
+ mcc = 0.36407735181256773
203
+ rep_loss = 0.0
204
+ att_loss = 0.0
205
+ cls_loss = 0.2881783898839079
206
+ eval_loss = 0.5342400931950771
207
+ global_step = 2999
208
+ loss = 0.2881783898839079
209
+ mcc = 0.39097174554766484
210
+ rep_loss = 0.0
211
+ att_loss = 0.0
212
+ cls_loss = 0.2880394740685912
213
+ eval_loss = 0.5215818358190132
214
+ global_step = 3099
215
+ loss = 0.2880394740685912
216
+ mcc = 0.3804125081494791
217
+ rep_loss = 0.0
218
+ att_loss = 0.0
219
+ cls_loss = 0.28794247894389213
220
+ eval_loss = 0.5263493223623796
221
+ global_step = 3199
222
+ loss = 0.28794247894389213
223
+ mcc = 0.39780520460046437
224
+ rep_loss = 0.0
225
+ att_loss = 0.0
226
+ cls_loss = 0.2878018494906589
227
+ eval_loss = 0.5152009563012556
228
+ global_step = 3299
229
+ loss = 0.2878018494906589
230
+ mcc = 0.3732051470850359
231
+ rep_loss = 0.0
232
+ att_loss = 0.0
233
+ cls_loss = 0.2876835728426406
234
+ eval_loss = 0.5174267815821099
235
+ global_step = 3399
236
+ loss = 0.2876835728426406
237
+ mcc = 0.3820632828805051
238
+ rep_loss = 0.0
239
+ att_loss = 0.0
240
+ cls_loss = 0.28756312976550563
241
+ eval_loss = 0.5152028862274054
242
+ global_step = 3499
243
+ loss = 0.28756312976550563
244
+ mcc = 0.39327627939877535
245
+ rep_loss = 0.0
246
+ att_loss = 0.0
247
+ cls_loss = 0.2874426774206543
248
+ eval_loss = 0.5117849030277946
249
+ global_step = 3599
250
+ loss = 0.2874426774206543
251
+ mcc = 0.3762322221434117
252
+ rep_loss = 0.0
253
+ att_loss = 0.0
254
+ cls_loss = 0.28736593537425376
255
+ eval_loss = 0.5194391743703322
256
+ global_step = 3699
257
+ loss = 0.28736593537425376
258
+ mcc = 0.37637355975877906
259
+ rep_loss = 0.0
260
+ att_loss = 0.0
261
+ cls_loss = 0.2872757521914193
262
+ eval_loss = 0.5270495496012948
263
+ global_step = 3799
264
+ loss = 0.2872757521914193
265
+ mcc = 0.39438996614158506
266
+ rep_loss = 0.0
267
+ att_loss = 0.0
268
+ cls_loss = 0.28718765729679513
269
+ eval_loss = 0.520123277649735
270
+ global_step = 3899
271
+ loss = 0.28718765729679513
272
+ mcc = 0.37177416903895627
273
+ rep_loss = 0.0
274
+ att_loss = 0.0
275
+ cls_loss = 0.2871156335510472
276
+ eval_loss = 0.5226057451782804
277
+ global_step = 3999
278
+ loss = 0.2871156335510472
279
+ mcc = 0.37302602457804274
280
+ rep_loss = 0.0
281
+ att_loss = 0.0
282
+ cls_loss = 0.28708139837340746
283
+ eval_loss = 0.5150534474488461
284
+ global_step = 4099
285
+ loss = 0.28708139837340746
286
+ mcc = 0.4011346232727083
287
+ rep_loss = 0.0
288
+ att_loss = 0.0
289
+ cls_loss = 0.28702193186677166
290
+ eval_loss = 0.5152694862900358
291
+ global_step = 4199
292
+ loss = 0.28702193186677166
293
+ mcc = 0.39611025073017425
294
+ rep_loss = 0.0
295
+ att_loss = 0.0
296
+ cls_loss = 0.28695012972185185
297
+ eval_loss = 0.521484088717085
298
+ global_step = 4299
299
+ loss = 0.28695012972185185
300
+ mcc = 0.38228296898092495
301
+ rep_loss = 0.0
302
+ att_loss = 0.0
303
+ cls_loss = 0.28689421526367864
304
+ eval_loss = 0.5239615097190394
305
+ global_step = 4399
306
+ loss = 0.28689421526367864
307
+ mcc = 0.3923138769373063
308
+ rep_loss = 0.0
309
+ att_loss = 0.0
310
+ cls_loss = 0.2868007770026358
311
+ eval_loss = 0.5138817682410731
312
+ global_step = 4499
313
+ loss = 0.2868007770026358
314
+ mcc = 0.3908602459650061
315
+ rep_loss = 0.0
316
+ att_loss = 0.0
317
+ cls_loss = 0.2867444366424025
318
+ eval_loss = 0.5129947833942644
319
+ global_step = 4599
320
+ loss = 0.2867444366424025
321
+ mcc = 0.39884193907512194
322
+ rep_loss = 0.0
323
+ att_loss = 0.0
324
+ cls_loss = 0.2866564529814551
325
+ eval_loss = 0.5101995305581526
326
+ global_step = 4699
327
+ loss = 0.2866564529814551
328
+ mcc = 0.403167099827574
329
+ rep_loss = 0.0
330
+ att_loss = 0.0
331
+ cls_loss = 0.2866204083307407
332
+ eval_loss = 0.5110881166024641
333
+ global_step = 4799
334
+ loss = 0.2866204083307407
335
+ mcc = 0.3932731321067742
336
+ rep_loss = 0.0
337
+ att_loss = 0.0
338
+ cls_loss = 0.28653837713046226
339
+ eval_loss = 0.5160060732653646
340
+ global_step = 4899
341
+ loss = 0.28653837713046226
342
+ mcc = 0.3791514250884126
343
+ rep_loss = 0.0
344
+ att_loss = 0.0
345
+ cls_loss = 0.2864541731630237
346
+ eval_loss = 0.5124918773318782
347
+ global_step = 4999
348
+ loss = 0.2864541731630237
349
+ mcc = 0.3890347057339363
350
+ rep_loss = 0.0
351
+ att_loss = 0.0
352
+ cls_loss = 0.28638665469856117
353
+ eval_loss = 0.5217192778081605
354
+ global_step = 5099
355
+ loss = 0.28638665469856117
356
+ mcc = 0.3937806133722603
357
+ rep_loss = 0.0
358
+ att_loss = 0.0
359
+ cls_loss = 0.2863042280092265
360
+ eval_loss = 0.5213332573572794
361
+ global_step = 5199
362
+ loss = 0.2863042280092265
363
+ mcc = 0.38568778619879135
364
+ rep_loss = 0.0
365
+ att_loss = 0.0
366
+ cls_loss = 0.28625702371764217
367
+ eval_loss = 0.5238886927113389
368
+ global_step = 5299
369
+ loss = 0.28625702371764217
370
+ mcc = 0.3885215735722988
371
+ rep_loss = 0.0
372
+ att_loss = 0.0
373
+ cls_loss = 0.28616623083106413
374
+ eval_loss = 0.5150826492092826
375
+ global_step = 5399
376
+ loss = 0.28616623083106413
377
+ mcc = 0.39777291234124745
378
+ rep_loss = 0.0
379
+ att_loss = 0.0
380
+ cls_loss = 0.2861386102331749
381
+ eval_loss = 0.5174173974629604
382
+ global_step = 5499
383
+ loss = 0.2861386102331749
384
+ mcc = 0.38284510021837986
385
+ rep_loss = 0.0
386
+ att_loss = 0.0
387
+ cls_loss = 0.2860565667658922
388
+ eval_loss = 0.520055275071751
389
+ global_step = 5599
390
+ loss = 0.2860565667658922
391
+ mcc = 0.3772922967514493
392
+ rep_loss = 0.0
393
+ att_loss = 0.0
394
+ cls_loss = 0.2860261079673705
395
+ eval_loss = 0.5164578006123052
396
+ global_step = 5699
397
+ loss = 0.2860261079673705
398
+ mcc = 0.39998008459631823
399
+ rep_loss = 0.0
400
+ att_loss = 0.0
401
+ cls_loss = 0.28596524872138884
402
+ eval_loss = 0.5099366253072565
403
+ global_step = 5799
404
+ loss = 0.28596524872138884
405
+ mcc = 0.4085876237775107
406
+ rep_loss = 0.0
407
+ att_loss = 0.0
408
+ cls_loss = 0.28592844469594964
409
+ eval_loss = 0.5119992882916422
410
+ global_step = 5899
411
+ loss = 0.28592844469594964
412
+ mcc = 0.40104837216246975
413
+ rep_loss = 0.0
414
+ att_loss = 0.0
415
+ cls_loss = 0.28590416652666645
416
+ eval_loss = 0.5151183000116637
417
+ global_step = 5999
418
+ loss = 0.28590416652666645
419
+ mcc = 0.37999701664002705
420
+ rep_loss = 0.0
421
+ att_loss = 0.0
422
+ cls_loss = 0.2858548017799278
423
+ eval_loss = 0.5153002630580555
424
+ global_step = 6099
425
+ loss = 0.2858548017799278
426
+ mcc = 0.3734647489671002
427
+ rep_loss = 0.0
428
+ att_loss = 0.0
429
+ cls_loss = 0.28581119698321633
430
+ eval_loss = 0.5087440140319593
431
+ global_step = 6199
432
+ loss = 0.28581119698321633
433
+ mcc = 0.41607779331757044
434
+ rep_loss = 0.0
435
+ att_loss = 0.0
436
+ cls_loss = 0.2857871880051938
437
+ eval_loss = 0.5130369663238525
438
+ global_step = 6299
439
+ loss = 0.2857871880051938
440
+ mcc = 0.40882970414693454
441
+ rep_loss = 0.0
442
+ att_loss = 0.0
443
+ cls_loss = 0.2857193908811193
444
+ eval_loss = 0.5108520045424952
445
+ global_step = 6399
446
+ loss = 0.2857193908811193
447
+ mcc = 0.3940079243628446
448
+ rep_loss = 0.0
449
+ att_loss = 0.0
450
+ cls_loss = 0.28568193774339623
451
+ eval_loss = 0.5132698967601313
452
+ global_step = 6499
453
+ loss = 0.28568193774339623
454
+ mcc = 0.38884978659993197
455
+ rep_loss = 0.0
456
+ att_loss = 0.0
457
+ cls_loss = 0.2834862545132637
458
+ eval_loss = 0.5128394329186642
459
+ global_step = 6599
460
+ loss = 0.2834862545132637
461
+ mcc = 0.3823808296094942
462
+ rep_loss = 0.0
463
+ att_loss = 0.0
464
+ cls_loss = 0.2813756861365758
465
+ eval_loss = 0.5069861809412638
466
+ global_step = 6699
467
+ loss = 0.2813756861365758
468
+ mcc = 0.4117922073135961
469
+ rep_loss = 0.0
470
+ att_loss = 0.0
471
+ cls_loss = 0.2816205664592631
472
+ eval_loss = 0.511738433079286
473
+ global_step = 6799
474
+ loss = 0.2816205664592631
475
+ mcc = 0.4172466675387621
476
+ rep_loss = 0.0
477
+ att_loss = 0.0
478
+ cls_loss = 0.28304927894159365
479
+ eval_loss = 0.5068024947787776
480
+ global_step = 6899
481
+ loss = 0.28304927894159365
482
+ mcc = 0.3996440630136365
483
+ rep_loss = 0.0
484
+ att_loss = 0.0
485
+ cls_loss = 0.2825837999139682
486
+ eval_loss = 0.5051217377185822
487
+ global_step = 6999
488
+ loss = 0.2825837999139682
489
+ mcc = 0.4033762891627765
490
+ rep_loss = 0.0
491
+ att_loss = 0.0
492
+ cls_loss = 0.28276582570776104
493
+ eval_loss = 0.5126414741530563
494
+ global_step = 7099
495
+ loss = 0.28276582570776104
496
+ mcc = 0.3803392011836776
497
+ rep_loss = 0.0
498
+ att_loss = 0.0
499
+ cls_loss = 0.28260714126541125
500
+ eval_loss = 0.5112863851316047
501
+ global_step = 7199
502
+ loss = 0.28260714126541125
503
+ mcc = 0.403167099827574
504
+ rep_loss = 0.0
505
+ att_loss = 0.0
506
+ cls_loss = 0.282591997730461
507
+ eval_loss = 0.5127082331614061
508
+ global_step = 7299
509
+ loss = 0.282591997730461
510
+ mcc = 0.4059864935947653
511
+ rep_loss = 0.0
512
+ att_loss = 0.0
513
+ cls_loss = 0.2825035277883805
514
+ eval_loss = 0.518345855402224
515
+ global_step = 7399
516
+ loss = 0.2825035277883805
517
+ mcc = 0.3830064003070546
518
+ rep_loss = 0.0
519
+ att_loss = 0.0
520
+ cls_loss = 0.2823299742839505
521
+ eval_loss = 0.5192047276280143
522
+ global_step = 7499
523
+ loss = 0.2823299742839505
524
+ mcc = 0.3766911998849963
525
+ rep_loss = 0.0
526
+ att_loss = 0.0
527
+ cls_loss = 0.28240299949133063
528
+ eval_loss = 0.5189248811114918
529
+ global_step = 7599
530
+ loss = 0.28240299949133063
531
+ mcc = 0.39211267993083676
532
+ rep_loss = 0.0
533
+ att_loss = 0.0
534
+ cls_loss = 0.2824035367078107
535
+ eval_loss = 0.5153183214592211
536
+ global_step = 7699
537
+ loss = 0.2824035367078107
538
+ mcc = 0.37999701664002705
539
+ rep_loss = 0.0
540
+ att_loss = 0.0
541
+ cls_loss = 0.2824633766794918
542
+ eval_loss = 0.5169419917193326
543
+ global_step = 7799
544
+ loss = 0.2824633766794918
545
+ mcc = 0.37588272219203145
546
+ rep_loss = 0.0
547
+ att_loss = 0.0
548
+ cls_loss = 0.28245345761348134
549
+ eval_loss = 0.5171206160025164
550
+ global_step = 7899
551
+ loss = 0.28245345761348134
552
+ mcc = 0.3985539058708339
553
+ rep_loss = 0.0
554
+ att_loss = 0.0
555
+ cls_loss = 0.2825832725038216
556
+ eval_loss = 0.5177997441002817
557
+ global_step = 7999
558
+ loss = 0.2825832725038216
559
+ mcc = 0.36977496722249587
560
+ rep_loss = 0.0
561
+ att_loss = 0.0
562
+ cls_loss = 0.28260926252349894
563
+ eval_loss = 0.512401100360986
564
+ global_step = 8099
565
+ loss = 0.28260926252349894
566
+ mcc = 0.3828545419719089
567
+ rep_loss = 0.0
568
+ att_loss = 0.0
569
+ cls_loss = 0.28256619950185097
570
+ eval_loss = 0.5159861039031636
571
+ global_step = 8199
572
+ loss = 0.28256619950185097
573
+ mcc = 0.37193451850694254
574
+ rep_loss = 0.0
575
+ att_loss = 0.0
576
+ cls_loss = 0.28252108295408773
577
+ eval_loss = 0.5178058842817942
578
+ global_step = 8299
579
+ loss = 0.28252108295408773
580
+ mcc = 0.3856835045289885
581
+ rep_loss = 0.0
582
+ att_loss = 0.0
583
+ cls_loss = 0.28255646062928136
584
+ eval_loss = 0.5111542118318153
585
+ global_step = 8399
586
+ loss = 0.28255646062928136
587
+ mcc = 0.39467643430011085
588
+ rep_loss = 0.0
589
+ att_loss = 0.0
590
+ cls_loss = 0.2826366017283011
591
+ eval_loss = 0.5156967594768062
592
+ global_step = 8499
593
+ loss = 0.2826366017283011
594
+ mcc = 0.38195214033316116
595
+ rep_loss = 0.0
596
+ att_loss = 0.0
597
+ cls_loss = 0.28264916480003954
598
+ eval_loss = 0.5102085489215273
599
+ global_step = 8599
600
+ loss = 0.28264916480003954
601
+ mcc = 0.372862717809245
602
+ rep_loss = 0.0
603
+ att_loss = 0.0
604
+ cls_loss = 0.28260060387022595
605
+ eval_loss = 0.5102424206155719
606
+ global_step = 8699
607
+ loss = 0.28260060387022595
608
+ mcc = 0.40131884995908
609
+ rep_loss = 0.0
610
+ att_loss = 0.0
611
+ cls_loss = 0.2826164152520538
612
+ eval_loss = 0.5126803761178796
613
+ global_step = 8799
614
+ loss = 0.2826164152520538
615
+ mcc = 0.4235041043063152
616
+ rep_loss = 0.0
617
+ att_loss = 0.0
618
+ cls_loss = 0.28259986309179413
619
+ eval_loss = 0.5098589604551141
620
+ global_step = 8899
621
+ loss = 0.28259986309179413
622
+ mcc = 0.38990471425985396
623
+ rep_loss = 0.0
624
+ att_loss = 0.0
625
+ cls_loss = 0.2825142649961589
626
+ eval_loss = 0.5173692351037805
627
+ global_step = 8999
628
+ loss = 0.2825142649961589
629
+ mcc = 0.3993849215588643
630
+ rep_loss = 0.0
631
+ att_loss = 0.0
632
+ cls_loss = 0.2825618349491788
633
+ eval_loss = 0.5122251212596893
634
+ global_step = 9099
635
+ loss = 0.2825618349491788
636
+ mcc = 0.3840054310253403
637
+ rep_loss = 0.0
638
+ att_loss = 0.0
639
+ cls_loss = 0.28256867571909855
640
+ eval_loss = 0.5147266279567372
641
+ global_step = 9199
642
+ loss = 0.28256867571909855
643
+ mcc = 0.3985466264666081
644
+ rep_loss = 0.0
645
+ att_loss = 0.0
646
+ cls_loss = 0.28260061660638225
647
+ eval_loss = 0.5119015773137411
648
+ global_step = 9299
649
+ loss = 0.28260061660638225
650
+ mcc = 0.4105276958910593
651
+ rep_loss = 0.0
652
+ att_loss = 0.0
653
+ cls_loss = 0.28252783535678105
654
+ eval_loss = 0.5079709806225516
655
+ global_step = 9399
656
+ loss = 0.28252783535678105
657
+ mcc = 0.40693605005193084
658
+ rep_loss = 0.0
659
+ att_loss = 0.0
660
+ cls_loss = 0.28249339924576194
661
+ eval_loss = 0.5125236321579326
662
+ global_step = 9499
663
+ loss = 0.28249339924576194
664
+ mcc = 0.4039478620313797
665
+ rep_loss = 0.0
666
+ att_loss = 0.0
667
+ cls_loss = 0.2824547092086783
668
+ eval_loss = 0.513409368016503
669
+ global_step = 9599
670
+ loss = 0.2824547092086783
671
+ mcc = 0.4021804836630887
672
+ rep_loss = 0.0
673
+ att_loss = 0.0
674
+ cls_loss = 0.2824284661388428
675
+ eval_loss = 0.5122987113215707
676
+ global_step = 9699
677
+ loss = 0.2824284661388428
678
+ mcc = 0.39213093547272937
679
+ rep_loss = 0.0
680
+ att_loss = 0.0
681
+ cls_loss = 0.28245821747738176
682
+ eval_loss = 0.5084807701183088
683
+ global_step = 9799
684
+ loss = 0.28245821747738176
685
+ mcc = 0.40739278931922274
686
+ rep_loss = 0.0
687
+ att_loss = 0.0
688
+ cls_loss = 0.2824419995738288
689
+ eval_loss = 0.5111486080921057
690
+ global_step = 9899
691
+ loss = 0.2824419995738288
692
+ mcc = 0.4172194430405653
693
+ rep_loss = 0.0
694
+ att_loss = 0.0
695
+ cls_loss = 0.2824013299460837
696
+ eval_loss = 0.5125659370061123
697
+ global_step = 9999
698
+ loss = 0.2824013299460837
699
+ mcc = 0.40544142666175087
700
+ rep_loss = 0.0
701
+ att_loss = 0.0
702
+ cls_loss = 0.2823612241491199
703
+ eval_loss = 0.5126088993115858
704
+ global_step = 10099
705
+ loss = 0.2823612241491199
706
+ mcc = 0.4138332826141097
707
+ rep_loss = 0.0
708
+ att_loss = 0.0
709
+ cls_loss = 0.28233784527314226
710
+ eval_loss = 0.5170806835998188
711
+ global_step = 10199
712
+ loss = 0.28233784527314226
713
+ mcc = 0.4052979142123112
714
+ rep_loss = 0.0
715
+ att_loss = 0.0
716
+ cls_loss = 0.2823012116371169
717
+ eval_loss = 0.5070072204777689
718
+ global_step = 10299
719
+ loss = 0.2823012116371169
720
+ mcc = 0.40891913355202136
721
+ rep_loss = 0.0
722
+ att_loss = 0.0
723
+ cls_loss = 0.282276837615498
724
+ eval_loss = 0.5102173388004303
725
+ global_step = 10399
726
+ loss = 0.282276837615498
727
+ mcc = 0.42573897932394733
728
+ rep_loss = 0.0
729
+ att_loss = 0.0
730
+ cls_loss = 0.28231605232433704
731
+ eval_loss = 0.5103865067164103
732
+ global_step = 10499
733
+ loss = 0.28231605232433704
734
+ mcc = 0.3965913923587624
735
+ rep_loss = 0.0
736
+ att_loss = 0.0
737
+ cls_loss = 0.28234525746875233
738
+ eval_loss = 0.5086130644335891
739
+ global_step = 10599
740
+ loss = 0.28234525746875233
741
+ mcc = 0.42386735506802997
742
+ rep_loss = 0.0
743
+ att_loss = 0.0
744
+ cls_loss = 0.28236741794102604
745
+ eval_loss = 0.5086397772485559
746
+ global_step = 10699
747
+ loss = 0.28236741794102604
748
+ mcc = 0.41021970767701216
749
+ rep_loss = 0.0
750
+ att_loss = 0.0
751
+ cls_loss = 0.2823447209174127
752
+ eval_loss = 0.5109247140812151
753
+ global_step = 10799
754
+ loss = 0.2823447209174127
755
+ mcc = 0.4033271983694075
756
+ rep_loss = 0.0
757
+ att_loss = 0.0
758
+ cls_loss = 0.28235380055874476
759
+ eval_loss = 0.5140562093619144
760
+ global_step = 10899
761
+ loss = 0.28235380055874476
762
+ mcc = 0.4061988397614615
763
+ rep_loss = 0.0
764
+ att_loss = 0.0
765
+ cls_loss = 0.2823390113384371
766
+ eval_loss = 0.51523285742962
767
+ global_step = 10999
768
+ loss = 0.2823390113384371
769
+ mcc = 0.3997736483943066
770
+ rep_loss = 0.0
771
+ att_loss = 0.0
772
+ cls_loss = 0.2823259284451842
773
+ eval_loss = 0.5107357989658009
774
+ global_step = 11099
775
+ loss = 0.2823259284451842
776
+ mcc = 0.39418417780027004
777
+ rep_loss = 0.0
778
+ att_loss = 0.0
779
+ cls_loss = 0.28235181783537155
780
+ eval_loss = 0.5102178933042468
781
+ global_step = 11199
782
+ loss = 0.28235181783537155
783
+ mcc = 0.40458001224586415
784
+ rep_loss = 0.0
785
+ att_loss = 0.0
786
+ cls_loss = 0.2823098915926859
787
+ eval_loss = 0.5139325694604353
788
+ global_step = 11299
789
+ loss = 0.2823098915926859
790
+ mcc = 0.39651505942154824
791
+ rep_loss = 0.0
792
+ att_loss = 0.0
793
+ cls_loss = 0.2822909285620686
794
+ eval_loss = 0.5153398152553674
795
+ global_step = 11399
796
+ loss = 0.2822909285620686
797
+ mcc = 0.40530962152270844
798
+ rep_loss = 0.0
799
+ att_loss = 0.0
800
+ cls_loss = 0.2822838319407785
801
+ eval_loss = 0.5070374842846033
802
+ global_step = 11499
803
+ loss = 0.2822838319407785
804
+ mcc = 0.3898302148823619
805
+ rep_loss = 0.0
806
+ att_loss = 0.0
807
+ cls_loss = 0.2822466105115499
808
+ eval_loss = 0.5146514863678904
809
+ global_step = 11599
810
+ loss = 0.2822466105115499
811
+ mcc = 0.40011410558622174
812
+ rep_loss = 0.0
813
+ att_loss = 0.0
814
+ cls_loss = 0.28226915594529023
815
+ eval_loss = 0.5120623545213179
816
+ global_step = 11699
817
+ loss = 0.28226915594529023
818
+ mcc = 0.41454694915421336
819
+ rep_loss = 0.0
820
+ att_loss = 0.0
821
+ cls_loss = 0.28228479942777907
822
+ eval_loss = 0.5130805644122037
823
+ global_step = 11799
824
+ loss = 0.28228479942777907
825
+ mcc = 0.42072451027133134
826
+ rep_loss = 0.0
827
+ att_loss = 0.0
828
+ cls_loss = 0.28232717272428004
829
+ eval_loss = 0.5160291429721948
830
+ global_step = 11899
831
+ loss = 0.28232717272428004
832
+ mcc = 0.40011410558622174
833
+ rep_loss = 0.0
834
+ att_loss = 0.0
835
+ cls_loss = 0.2823260606085257
836
+ eval_loss = 0.5159690497499524
837
+ global_step = 11999
838
+ loss = 0.2823260606085257
839
+ mcc = 0.37141964356869667
840
+ rep_loss = 0.0
841
+ att_loss = 0.0
842
+ cls_loss = 0.2822958163722137
843
+ eval_loss = 0.5140873636260177
844
+ global_step = 12099
845
+ loss = 0.2822958163722137
846
+ mcc = 0.38482081753749314
847
+ rep_loss = 0.0
848
+ att_loss = 0.0
849
+ cls_loss = 0.2822563194435124
850
+ eval_loss = 0.5150263435912855
851
+ global_step = 12199
852
+ loss = 0.2822563194435124
853
+ mcc = 0.3848259659055644
854
+ rep_loss = 0.0
855
+ att_loss = 0.0
856
+ cls_loss = 0.282232557991611
857
+ eval_loss = 0.5123935414083076
858
+ global_step = 12299
859
+ loss = 0.282232557991611
860
+ mcc = 0.3804125081494791
861
+ rep_loss = 0.0
862
+ att_loss = 0.0
863
+ cls_loss = 0.28227046379584597
864
+ eval_loss = 0.5180137825734688
865
+ global_step = 12399
866
+ loss = 0.28227046379584597
867
+ mcc = 0.38315821810772
868
+ rep_loss = 0.0
869
+ att_loss = 0.0
870
+ cls_loss = 0.28227142532807864
871
+ eval_loss = 0.513143314556642
872
+ global_step = 12499
873
+ loss = 0.28227142532807864
874
+ mcc = 0.4005864260531677
875
+ rep_loss = 0.0
876
+ att_loss = 0.0
877
+ cls_loss = 0.28223702150690483
878
+ eval_loss = 0.5165203602025004
879
+ global_step = 12599
880
+ loss = 0.28223702150690483
881
+ mcc = 0.3825175429116719
882
+ rep_loss = 0.0
883
+ att_loss = 0.0
884
+ cls_loss = 0.28226484132742663
885
+ eval_loss = 0.5177025307308544
886
+ global_step = 12699
887
+ loss = 0.28226484132742663
888
+ mcc = 0.38731511142125435
889
+ rep_loss = 0.0
890
+ att_loss = 0.0
891
+ cls_loss = 0.28226020199148827
892
+ eval_loss = 0.514326117255471
893
+ global_step = 12799
894
+ loss = 0.28226020199148827
895
+ mcc = 0.39651505942154824
896
+ rep_loss = 0.0
897
+ att_loss = 0.0
898
+ cls_loss = 0.282260316372069
899
+ eval_loss = 0.5084026528127266
900
+ global_step = 12899
901
+ loss = 0.282260316372069
902
+ mcc = 0.3811450767088426
903
+ rep_loss = 0.0
904
+ att_loss = 0.0
905
+ cls_loss = 0.2822655938672766
906
+ eval_loss = 0.5095312730832533
907
+ global_step = 12999
908
+ loss = 0.2822655938672766
909
+ mcc = 0.40196041858324394
910
+ rep_loss = 0.0
911
+ att_loss = 0.0
912
+ cls_loss = 0.2822442495780751
913
+ eval_loss = 0.507652967265158
914
+ global_step = 13099
915
+ loss = 0.2822442495780751
916
+ mcc = 0.39783782006586266
917
+ rep_loss = 0.0
918
+ att_loss = 0.0
919
+ cls_loss = 0.28048115968704224
920
+ eval_loss = 0.5102084703517683
921
+ global_step = 13199
922
+ loss = 0.28048115968704224
923
+ mcc = 0.4009077184297449
924
+ rep_loss = 0.0
925
+ att_loss = 0.0
926
+ cls_loss = 0.27984192830706955
927
+ eval_loss = 0.5112800101439158
928
+ global_step = 13299
929
+ loss = 0.27984192830706955
930
+ mcc = 0.40068606376889737
931
+ rep_loss = 0.0
932
+ att_loss = 0.0
933
+ cls_loss = 0.28055651535828147
934
+ eval_loss = 0.5063392763788049
935
+ global_step = 13399
936
+ loss = 0.28055651535828147
937
+ mcc = 0.3879849787696258
938
+ rep_loss = 0.0
939
+ att_loss = 0.0
940
+ cls_loss = 0.28020469887742716
941
+ eval_loss = 0.5110559472531984
942
+ global_step = 13499
943
+ loss = 0.28020469887742716
944
+ mcc = 0.4052979142123112
945
+ rep_loss = 0.0
946
+ att_loss = 0.0
947
+ cls_loss = 0.28019697829388757
948
+ eval_loss = 0.5113063084356713
949
+ global_step = 13599
950
+ loss = 0.28019697829388757
951
+ mcc = 0.4104477269329847
952
+ rep_loss = 0.0
953
+ att_loss = 0.0
954
+ cls_loss = 0.28015780241058474
955
+ eval_loss = 0.5131644308567047
956
+ global_step = 13699
957
+ loss = 0.28015780241058474
958
+ mcc = 0.39008612150299654
959
+ rep_loss = 0.0
960
+ att_loss = 0.0
961
+ cls_loss = 0.2801340272518606
962
+ eval_loss = 0.5113311644756433
963
+ global_step = 13799
964
+ loss = 0.2801340272518606
965
+ mcc = 0.40458001224586415
966
+ rep_loss = 0.0
967
+ att_loss = 0.0
968
+ cls_loss = 0.2801751655188871
969
+ eval_loss = 0.5139215471166553
970
+ global_step = 13899
971
+ loss = 0.2801751655188871
972
+ mcc = 0.39757371367888555
973
+ rep_loss = 0.0
974
+ att_loss = 0.0
975
+ cls_loss = 0.2803018170285726
976
+ eval_loss = 0.5147871501518019
977
+ global_step = 13999
978
+ loss = 0.2803018170285726
979
+ mcc = 0.3954928502055513
980
+ rep_loss = 0.0
981
+ att_loss = 0.0
982
+ cls_loss = 0.28044746648950547
983
+ eval_loss = 0.5145218941298398
984
+ global_step = 14099
985
+ loss = 0.28044746648950547
986
+ mcc = 0.3996634131246967
987
+ rep_loss = 0.0
988
+ att_loss = 0.0
989
+ cls_loss = 0.2806339640358631
990
+ eval_loss = 0.5083598521622744
991
+ global_step = 14199
992
+ loss = 0.2806339640358631
993
+ mcc = 0.3818848270189336
994
+ rep_loss = 0.0
995
+ att_loss = 0.0
996
+ cls_loss = 0.2807077560825752
997
+ eval_loss = 0.5083690303744692
998
+ global_step = 14299
999
+ loss = 0.2807077560825752
1000
+ mcc = 0.40043598733848285
1001
+ rep_loss = 0.0
1002
+ att_loss = 0.0
1003
+ cls_loss = 0.2807342776022636
1004
+ eval_loss = 0.5088989003138109
1005
+ global_step = 14399
1006
+ loss = 0.2807342776022636
1007
+ mcc = 0.40188104133596453
1008
+ rep_loss = 0.0
1009
+ att_loss = 0.0
1010
+ cls_loss = 0.2806438054516627
1011
+ eval_loss = 0.5132724976900852
1012
+ global_step = 14499
1013
+ loss = 0.2806438054516627
1014
+ mcc = 0.40602330795025077
1015
+ rep_loss = 0.0
1016
+ att_loss = 0.0
1017
+ cls_loss = 0.2806220871176256
1018
+ eval_loss = 0.5147652409293435
1019
+ global_step = 14599
1020
+ loss = 0.2806220871176256
1021
+ mcc = 0.39117212929787876
1022
+ rep_loss = 0.0
1023
+ att_loss = 0.0
1024
+ cls_loss = 0.28070966569574723
1025
+ eval_loss = 0.5120624204476675
1026
+ global_step = 14699
1027
+ loss = 0.28070966569574723
1028
+ mcc = 0.4123578103657358
1029
+ rep_loss = 0.0
1030
+ att_loss = 0.0
1031
+ cls_loss = 0.28070613990999144
1032
+ eval_loss = 0.5133554357470889
1033
+ global_step = 14799
1034
+ loss = 0.28070613990999144
1035
+ mcc = 0.3881583196544164
1036
+ rep_loss = 0.0
1037
+ att_loss = 0.0
1038
+ cls_loss = 0.2807093545262614
1039
+ eval_loss = 0.5114469564322269
1040
+ global_step = 14899
1041
+ loss = 0.2807093545262614
1042
+ mcc = 0.39822168961317467
1043
+ rep_loss = 0.0
1044
+ att_loss = 0.0
1045
+ cls_loss = 0.2807347339497145
1046
+ eval_loss = 0.5118169856793953
1047
+ global_step = 14999
1048
+ loss = 0.2807347339497145
1049
+ mcc = 0.3869908951412875
1050
+ rep_loss = 0.0
1051
+ att_loss = 0.0
1052
+ cls_loss = 0.28082120856450704
1053
+ eval_loss = 0.5114837397228588
1054
+ global_step = 15099
1055
+ loss = 0.28082120856450704
1056
+ mcc = 0.39831630919917926
1057
+ rep_loss = 0.0
1058
+ att_loss = 0.0
1059
+ cls_loss = 0.2807593362330797
1060
+ eval_loss = 0.5067198610667026
1061
+ global_step = 15199
1062
+ loss = 0.2807593362330797
1063
+ mcc = 0.40415734458808295
1064
+ rep_loss = 0.0
1065
+ att_loss = 0.0
1066
+ cls_loss = 0.2807870972221527
1067
+ eval_loss = 0.5098130802313486
1068
+ global_step = 15299
1069
+ loss = 0.2807870972221527
1070
+ mcc = 0.37827883919891614
1071
+ rep_loss = 0.0
1072
+ att_loss = 0.0
1073
+ cls_loss = 0.2807835819239312
1074
+ eval_loss = 0.5145537157853445
1075
+ global_step = 15399
1076
+ loss = 0.2807835819239312
1077
+ mcc = 0.38619245355598364
1078
+ rep_loss = 0.0
1079
+ att_loss = 0.0
1080
+ cls_loss = 0.2807902951179102
1081
+ eval_loss = 0.5105155444506443
1082
+ global_step = 15499
1083
+ loss = 0.2807902951179102
1084
+ mcc = 0.38568778619879135
1085
+ rep_loss = 0.0
1086
+ att_loss = 0.0
1087
+ cls_loss = 0.2808664371520466
1088
+ eval_loss = 0.5120808716976282
1089
+ global_step = 15599
1090
+ loss = 0.2808664371520466
1091
+ mcc = 0.3905903182021713
1092
+ rep_loss = 0.0
1093
+ att_loss = 0.0
1094
+ cls_loss = 0.28086480764978766
1095
+ eval_loss = 0.5126627259182207
1096
+ global_step = 15699
1097
+ loss = 0.28086480764978766
1098
+ mcc = 0.3877546380385484
1099
+ rep_loss = 0.0
1100
+ att_loss = 0.0
1101
+ cls_loss = 0.2807757077305287
1102
+ eval_loss = 0.5121393971370928
1103
+ global_step = 15799
1104
+ loss = 0.2807757077305287
1105
+ mcc = 0.39117212929787876
1106
+ rep_loss = 0.0
1107
+ att_loss = 0.0
1108
+ cls_loss = 0.2807666350825768
1109
+ eval_loss = 0.5142692002383146
1110
+ global_step = 15899
1111
+ loss = 0.2807666350825768
1112
+ mcc = 0.3746568093380507
1113
+ rep_loss = 0.0
1114
+ att_loss = 0.0
1115
+ cls_loss = 0.28078636219913994
1116
+ eval_loss = 0.5117888396436517
1117
+ global_step = 15999
1118
+ loss = 0.28078636219913994
1119
+ mcc = 0.3981019614430057
1120
+ rep_loss = 0.0
1121
+ att_loss = 0.0
1122
+ cls_loss = 0.28078779930120157
1123
+ eval_loss = 0.5096124988613706
1124
+ global_step = 16099
1125
+ loss = 0.28078779930120157
1126
+ mcc = 0.3919146115938579
1127
+ rep_loss = 0.0
1128
+ att_loss = 0.0
1129
+ cls_loss = 0.28075273311209464
1130
+ eval_loss = 0.5110085606575012
1131
+ global_step = 16199
1132
+ loss = 0.28075273311209464
1133
+ mcc = 0.40178544404291583
1134
+ rep_loss = 0.0
1135
+ att_loss = 0.0
1136
+ cls_loss = 0.2807791894532431
1137
+ eval_loss = 0.5103965654517665
1138
+ global_step = 16299
1139
+ loss = 0.2807791894532431
1140
+ mcc = 0.4024832514990541
1141
+ rep_loss = 0.0
1142
+ att_loss = 0.0
1143
+ cls_loss = 0.28079897838149276
1144
+ eval_loss = 0.511842996785135
1145
+ global_step = 16399
1146
+ loss = 0.28079897838149276
1147
+ mcc = 0.40339504639994617
1148
+ rep_loss = 0.0
1149
+ att_loss = 0.0
1150
+ cls_loss = 0.28081396074859205
1151
+ eval_loss = 0.5137978602539409
1152
+ global_step = 16499
1153
+ loss = 0.28081396074859205
1154
+ mcc = 0.3779893368407423
1155
+ rep_loss = 0.0
1156
+ att_loss = 0.0
1157
+ cls_loss = 0.28086851178795474
1158
+ eval_loss = 0.5133931411035133
1159
+ global_step = 16599
1160
+ loss = 0.28086851178795474
1161
+ mcc = 0.3815798845625387
1162
+ rep_loss = 0.0
1163
+ att_loss = 0.0
1164
+ cls_loss = 0.28092144247081824
1165
+ eval_loss = 0.5128023479924058
1166
+ global_step = 16699
1167
+ loss = 0.28092144247081824
1168
+ mcc = 0.39087642483600127
1169
+ rep_loss = 0.0
1170
+ att_loss = 0.0
1171
+ cls_loss = 0.28096025591330637
1172
+ eval_loss = 0.5111828834721537
1173
+ global_step = 16799
1174
+ loss = 0.28096025591330637
1175
+ mcc = 0.40529509862645224
1176
+ rep_loss = 0.0
1177
+ att_loss = 0.0
1178
+ cls_loss = 0.28094200728861396
1179
+ eval_loss = 0.5122123658657074
1180
+ global_step = 16899
1181
+ loss = 0.28094200728861396
1182
+ mcc = 0.3997145619263111
1183
+ rep_loss = 0.0
1184
+ att_loss = 0.0
1185
+ cls_loss = 0.28097063498207203
1186
+ eval_loss = 0.5112948065454309
1187
+ global_step = 16999
1188
+ loss = 0.28097063498207203
1189
+ mcc = 0.40011410558622174
1190
+ rep_loss = 0.0
1191
+ att_loss = 0.0
1192
+ cls_loss = 0.2810396369071103
1193
+ eval_loss = 0.5117527923800729
1194
+ global_step = 17099
1195
+ loss = 0.2810396369071103
1196
+ mcc = 0.40602330795025077
1197
+ rep_loss = 0.0
1198
+ att_loss = 0.0
1199
+ cls_loss = 0.28107882297954884
1200
+ eval_loss = 0.5100564261277517
1201
+ global_step = 17199
1202
+ loss = 0.28107882297954884
1203
+ mcc = 0.3940079243628446
1204
+ rep_loss = 0.0
1205
+ att_loss = 0.0
1206
+ cls_loss = 0.2810721668297138
1207
+ eval_loss = 0.5121440327528751
1208
+ global_step = 17299
1209
+ loss = 0.2810721668297138
1210
+ mcc = 0.4061988397614615
1211
+ rep_loss = 0.0
1212
+ att_loss = 0.0
1213
+ cls_loss = 0.2810846810089944
1214
+ eval_loss = 0.5108874918836536
1215
+ global_step = 17399
1216
+ loss = 0.2810846810089944
1217
+ mcc = 0.39117212929787876
1218
+ rep_loss = 0.0
1219
+ att_loss = 0.0
1220
+ cls_loss = 0.281094952950928
1221
+ eval_loss = 0.5103858853831436
1222
+ global_step = 17499
1223
+ loss = 0.281094952950928
1224
+ mcc = 0.4024832514990541
1225
+ rep_loss = 0.0
1226
+ att_loss = 0.0
1227
+ cls_loss = 0.2810448341918224
1228
+ eval_loss = 0.510013351837794
1229
+ global_step = 17599
1230
+ loss = 0.2810448341918224
1231
+ mcc = 0.39624593859516594
1232
+ rep_loss = 0.0
1233
+ att_loss = 0.0
1234
+ cls_loss = 0.28106725430390767
1235
+ eval_loss = 0.5108868804844943
1236
+ global_step = 17699
1237
+ loss = 0.28106725430390767
1238
+ mcc = 0.3996634131246967
1239
+ rep_loss = 0.0
1240
+ att_loss = 0.0
1241
+ cls_loss = 0.28105053143649744
1242
+ eval_loss = 0.5124899862390576
1243
+ global_step = 17799
1244
+ loss = 0.28105053143649744
1245
+ mcc = 0.39008612150299654
1246
+ rep_loss = 0.0
1247
+ att_loss = 0.0
1248
+ cls_loss = 0.28106551141932806
1249
+ eval_loss = 0.5115214387575785
1250
+ global_step = 17899
1251
+ loss = 0.28106551141932806
1252
+ mcc = 0.39213093547272937
1253
+ rep_loss = 0.0
1254
+ att_loss = 0.0
1255
+ cls_loss = 0.28108492543516894
1256
+ eval_loss = 0.510235332178347
1257
+ global_step = 17999
1258
+ loss = 0.28108492543516894
1259
+ mcc = 0.3890770339941176
1260
+ rep_loss = 0.0
1261
+ att_loss = 0.0
1262
+ cls_loss = 0.2810836833317184
1263
+ eval_loss = 0.5114746211153088
1264
+ global_step = 18099
1265
+ loss = 0.2810836833317184
1266
+ mcc = 0.39418417780027004
1267
+ rep_loss = 0.0
1268
+ att_loss = 0.0
1269
+ cls_loss = 0.2810900085169675
1270
+ eval_loss = 0.5144133034980658
1271
+ global_step = 18199
1272
+ loss = 0.2810900085169675
1273
+ mcc = 0.38281831833686425
1274
+ rep_loss = 0.0
1275
+ att_loss = 0.0
1276
+ cls_loss = 0.2811337992779358
1277
+ eval_loss = 0.5112034859079303
1278
+ global_step = 18299
1279
+ loss = 0.2811337992779358
1280
+ mcc = 0.3996440630136365
1281
+ rep_loss = 0.0
1282
+ att_loss = 0.0
1283
+ cls_loss = 0.28113125959784224
1284
+ eval_loss = 0.5127215882142385
1285
+ global_step = 18399
1286
+ loss = 0.28113125959784224
1287
+ mcc = 0.38568778619879135
1288
+ rep_loss = 0.0
1289
+ att_loss = 0.0
1290
+ cls_loss = 0.28110789366587113
1291
+ eval_loss = 0.5109962333332408
1292
+ global_step = 18499
1293
+ loss = 0.28110789366587113
1294
+ mcc = 0.39112585288276486
1295
+ rep_loss = 0.0
1296
+ att_loss = 0.0
1297
+ cls_loss = 0.28111427403913447
1298
+ eval_loss = 0.5127900233774474
1299
+ global_step = 18599
1300
+ loss = 0.28111427403913447
1301
+ mcc = 0.38034948826672105
1302
+ rep_loss = 0.0
1303
+ att_loss = 0.0
1304
+ cls_loss = 0.28112251104482355
1305
+ eval_loss = 0.5124395769653898
1306
+ global_step = 18699
1307
+ loss = 0.28112251104482355
1308
+ mcc = 0.39418417780027004
1309
+ rep_loss = 0.0
1310
+ att_loss = 0.0
1311
+ cls_loss = 0.2811035370392093
1312
+ eval_loss = 0.5116180073131215
1313
+ global_step = 18799
1314
+ loss = 0.2811035370392093
1315
+ mcc = 0.39418417780027004
1316
+ rep_loss = 0.0
1317
+ att_loss = 0.0
1318
+ cls_loss = 0.2810910314499006
1319
+ eval_loss = 0.5112698972225189
1320
+ global_step = 18899
1321
+ loss = 0.2810910314499006
1322
+ mcc = 0.39624593859516594
1323
+ rep_loss = 0.0
1324
+ att_loss = 0.0
1325
+ cls_loss = 0.2810639343202822
1326
+ eval_loss = 0.5118823466878949
1327
+ global_step = 18999
1328
+ loss = 0.2810639343202822
1329
+ mcc = 0.3852178048848588
1330
+ rep_loss = 0.0
1331
+ att_loss = 0.0
1332
+ cls_loss = 0.281047973922413
1333
+ eval_loss = 0.5118935216556896
1334
+ global_step = 19099
1335
+ loss = 0.281047973922413
1336
+ mcc = 0.3916731692515916
1337
+ rep_loss = 0.0
1338
+ att_loss = 0.0
1339
+ cls_loss = 0.281021011028954
1340
+ eval_loss = 0.5107931025100477
1341
+ global_step = 19199
1342
+ loss = 0.281021011028954
1343
+ mcc = 0.3954928502055513
1344
+ rep_loss = 0.0
1345
+ att_loss = 0.0
1346
+ cls_loss = 0.2810025809414747
1347
+ eval_loss = 0.5114801354480513
1348
+ global_step = 19299
1349
+ loss = 0.2810025809414747
1350
+ mcc = 0.397005988404347
1351
+ rep_loss = 0.0
1352
+ att_loss = 0.0
1353
+ cls_loss = 0.2809744835557483
1354
+ eval_loss = 0.5109611894145156
1355
+ global_step = 19399
1356
+ loss = 0.2809744835557483
1357
+ mcc = 0.4011346232727083
1358
+ rep_loss = 0.0
1359
+ att_loss = 0.0
1360
+ cls_loss = 0.2809650007476518
1361
+ eval_loss = 0.5112038516637051
1362
+ global_step = 19499
1363
+ loss = 0.2809650007476518
1364
+ mcc = 0.4032118903317931
1365
+ rep_loss = 0.0
1366
+ att_loss = 0.0
1367
+ cls_loss = 0.2809396656315828
1368
+ eval_loss = 0.5116785367329916
1369
+ global_step = 19599
1370
+ loss = 0.2809396656315828
1371
+ mcc = 0.397005988404347
1372
+ rep_loss = 0.0
1373
+ att_loss = 0.0
1374
+ cls_loss = 0.2809460457934636
1375
+ eval_loss = 0.5114174241369421
1376
+ global_step = 19699
1377
+ loss = 0.2809460457934636
1378
+ mcc = 0.4032118903317931
1379
+ rep_loss = 0.0
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c2228631b6c483c03e774ce5dbe05337af44248e865d3377d9f02dc2a65eb8e
3
+ size 58394600
vocab.txt ADDED
The diff for this file is too large to render. See raw diff