argo11 commited on
Commit
482a6f3
·
verified ·
1 Parent(s): a287c87

ft-transformer best/last checkpoints

Browse files
runs/20260118_ft_141apps/last/ft_transformer_model_meta.json CHANGED
@@ -19,18 +19,18 @@
19
  "eDonkey"
20
  ],
21
  "dropped_rows": 10,
22
- "n_blocks": 6,
23
- "d_block": 512,
24
  "attention_n_heads": 8,
25
  "attention_dropout": 0.1,
26
  "ffn_dropout": 0.1,
27
  "residual_dropout": 0.0,
28
- "ffn_d_hidden_multiplier": 1.333,
29
- "n_epochs": 60,
30
- "patience": 6,
31
- "batch_size": 2048,
32
  "lr": 0.001,
33
- "weight_decay": 1e-05,
34
  "device": "cuda",
35
  "class_weight": {
36
  "mode": "none",
@@ -224,120 +224,636 @@
224
  "train_history": [
225
  {
226
  "epoch": 1.0,
227
- "train_loss": 1.3358488327167073,
228
- "valid_loss": 0.9459041662935941,
229
- "train_accuracy": 0.7063159276281858,
230
- "valid_accuracy": 0.7060240384793129,
231
  "lr": 0.001,
232
- "train_seconds": 221.82446880592033,
233
- "eval_seconds": 102.56885703187436,
234
- "epoch_seconds": 324.3933258377947,
235
- "train_rows_per_sec": 7316.1315734735845
236
  },
237
  {
238
  "epoch": 2.0,
239
- "train_loss": 0.9261272874335473,
240
- "valid_loss": 0.8358800593412148,
241
- "train_accuracy": 0.7377270399785075,
242
- "valid_accuracy": 0.7372219326168373,
243
  "lr": 0.001,
244
- "train_seconds": 221.62941304873675,
245
- "eval_seconds": 103.36996543500572,
246
- "epoch_seconds": 324.9993784837425,
247
- "train_rows_per_sec": 7322.570491323378
248
  },
249
  {
250
  "epoch": 3.0,
251
- "train_loss": 0.8910257922295213,
252
- "valid_loss": 0.8538549528931672,
253
- "train_accuracy": 0.731172095333222,
254
- "valid_accuracy": 0.7304063471641471,
255
  "lr": 0.001,
256
- "train_seconds": 222.4989249939099,
257
- "eval_seconds": 102.44063991401345,
258
- "epoch_seconds": 324.93956490792334,
259
- "train_rows_per_sec": 7293.954341776802
260
  },
261
  {
262
  "epoch": 4.0,
263
- "train_loss": 0.9769936021309332,
264
- "valid_loss": 1.4864348622987855,
265
- "train_accuracy": 0.5550777406083073,
266
- "valid_accuracy": 0.5556726300728696,
267
  "lr": 0.001,
268
- "train_seconds": 220.36866204300895,
269
- "eval_seconds": 102.35863702790812,
270
- "epoch_seconds": 322.72729907091707,
271
- "train_rows_per_sec": 7364.463644487083
272
  },
273
  {
274
  "epoch": 5.0,
275
- "train_loss": 1.2474059249834635,
276
- "valid_loss": 1.0632081533378026,
277
- "train_accuracy": 0.6651253899662147,
278
- "valid_accuracy": 0.6652747122739692,
279
  "lr": 0.001,
280
- "train_seconds": 220.8876668442972,
281
- "eval_seconds": 102.75199961429462,
282
- "epoch_seconds": 323.6396664585918,
283
- "train_rows_per_sec": 7347.15986268248
284
  },
285
  {
286
  "epoch": 6.0,
287
- "train_loss": 1.2964940690453086,
288
- "valid_loss": 1.0685923693315038,
289
- "train_accuracy": 0.671127003130821,
290
- "valid_accuracy": 0.6716836178244104,
291
  "lr": 0.001,
292
- "train_seconds": 218.024026687257,
293
- "eval_seconds": 102.13358042296022,
294
- "epoch_seconds": 320.1576071102172,
295
- "train_rows_per_sec": 7443.661254490786
296
  },
297
  {
298
  "epoch": 7.0,
299
- "train_loss": 1.0754953560432299,
300
- "valid_loss": 0.9625826617456832,
301
- "train_accuracy": 0.6992631078866989,
302
- "valid_accuracy": 0.7005893161492589,
303
  "lr": 0.001,
304
- "train_seconds": 217.86366034299135,
305
- "eval_seconds": 102.43207142595202,
306
- "epoch_seconds": 320.29573176894337,
307
- "train_rows_per_sec": 7449.140427756558
308
  },
309
  {
310
  "epoch": 8.0,
311
- "train_loss": 1.0774475758493622,
312
- "valid_loss": 0.9348634067571389,
313
- "train_accuracy": 0.7058876811036067,
314
- "valid_accuracy": 0.7061072230047729,
315
- "lr": 0.001,
316
- "train_seconds": 217.7801923188381,
317
- "eval_seconds": 102.54709787573665,
318
- "epoch_seconds": 320.32729019457474,
319
- "train_rows_per_sec": 7451.9954396220755
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
320
  }
321
  ],
322
  "train_result": {
323
  "metrics": {
324
- "train_logloss": 0.9315963242016221,
325
- "train_accuracy": 0.7058876811036067,
326
- "train_f1_macro": 0.29700525732803845,
327
- "valid_logloss": 0.9348585613508533,
328
- "valid_accuracy": 0.7061072230047729,
329
- "valid_f1_macro": 0.2974434879891297,
330
- "test_logloss": 0.9355261024341314,
331
- "test_accuracy": 0.7054417468010928,
332
- "test_f1_macro": 0.3020941288739866,
333
- "overfit_gap_valid_logloss": 0.0032622371492312396,
334
- "overfit_gap_test_logloss": 0.0039297782325092845,
335
- "overfit_gap_valid_f1_macro": -0.0004382306610912212,
336
- "overfit_gap_test_f1_macro": -0.00508887154594817,
337
- "best_epoch": 2.0,
338
- "best_valid_logloss": 0.9348585613508533,
339
- "best_valid_accuracy": 0.7061072230047729,
340
- "best_valid_f1_macro": 0.2974434879891297
341
  },
342
  "n_rows": 2704829,
343
  "n_features": 56,
 
19
  "eDonkey"
20
  ],
21
  "dropped_rows": 10,
22
+ "n_blocks": 4,
23
+ "d_block": 256,
24
  "attention_n_heads": 8,
25
  "attention_dropout": 0.1,
26
  "ffn_dropout": 0.1,
27
  "residual_dropout": 0.0,
28
+ "ffn_d_hidden_multiplier": 2.0,
29
+ "n_epochs": 100,
30
+ "patience": 12,
31
+ "batch_size": 1024,
32
  "lr": 0.001,
33
+ "weight_decay": 0.0001,
34
  "device": "cuda",
35
  "class_weight": {
36
  "mode": "none",
 
224
  "train_history": [
225
  {
226
  "epoch": 1.0,
227
+ "train_loss": 1.0820218957184993,
228
+ "valid_loss": 0.8103469731902355,
229
+ "train_accuracy": 0.7475009196517093,
230
+ "valid_accuracy": 0.7470876173363945,
231
  "lr": 0.001,
232
+ "train_seconds": 64.16830076603219,
233
+ "eval_seconds": 33.973765483126044,
234
+ "epoch_seconds": 98.14206624915823,
235
+ "train_rows_per_sec": 25291.25721931363
236
  },
237
  {
238
  "epoch": 2.0,
239
+ "train_loss": 0.8105412084973573,
240
+ "valid_loss": 0.7371084651784771,
241
+ "train_accuracy": 0.7664633060508461,
242
+ "valid_accuracy": 0.7650369893856546,
243
  "lr": 0.001,
244
+ "train_seconds": 63.68453805660829,
245
+ "eval_seconds": 33.999106251168996,
246
+ "epoch_seconds": 97.68364430777729,
247
+ "train_rows_per_sec": 25483.375549610326
248
  },
249
  {
250
  "epoch": 3.0,
251
+ "train_loss": 0.7313179358322913,
252
+ "valid_loss": 0.6841807827381646,
253
+ "train_accuracy": 0.7863801584450523,
254
+ "valid_accuracy": 0.7839975155555062,
255
  "lr": 0.001,
256
+ "train_seconds": 63.437448346056044,
257
+ "eval_seconds": 33.59120648866519,
258
+ "epoch_seconds": 97.02865483472124,
259
+ "train_rows_per_sec": 25582.633638524912
260
  },
261
  {
262
  "epoch": 4.0,
263
+ "train_loss": 0.7070826306328036,
264
+ "valid_loss": 0.6529311272958276,
265
+ "train_accuracy": 0.7943609483534692,
266
+ "valid_accuracy": 0.7919407134644322,
267
  "lr": 0.001,
268
+ "train_seconds": 63.00751159898937,
269
+ "eval_seconds": 33.50558300456032,
270
+ "epoch_seconds": 96.51309460354969,
271
+ "train_rows_per_sec": 25757.19876590129
272
  },
273
  {
274
  "epoch": 5.0,
275
+ "train_loss": 0.6632884027454004,
276
+ "valid_loss": 0.6292482220157558,
277
+ "train_accuracy": 0.8017409607633756,
278
+ "valid_accuracy": 0.7977229622564079,
279
  "lr": 0.001,
280
+ "train_seconds": 63.04453998291865,
281
+ "eval_seconds": 33.355517863761634,
282
+ "epoch_seconds": 96.40005784668028,
283
+ "train_rows_per_sec": 25742.070612930307
284
  },
285
  {
286
  "epoch": 6.0,
287
+ "train_loss": 0.64503756189948,
288
+ "valid_loss": 0.6537572209686322,
289
+ "train_accuracy": 0.7971713546823982,
290
+ "valid_accuracy": 0.7926561003833882,
291
  "lr": 0.001,
292
+ "train_seconds": 63.07321646483615,
293
+ "eval_seconds": 33.55945497285575,
294
+ "epoch_seconds": 96.6326714376919,
295
+ "train_rows_per_sec": 25730.366880921298
296
  },
297
  {
298
  "epoch": 7.0,
299
+ "train_loss": 0.6202571140102784,
300
+ "valid_loss": 0.6236088287176843,
301
+ "train_accuracy": 0.8047473129841265,
302
+ "valid_accuracy": 0.7994550489309864,
303
  "lr": 0.001,
304
+ "train_seconds": 63.71714582014829,
305
+ "eval_seconds": 33.65691030398011,
306
+ "epoch_seconds": 97.3740561241284,
307
+ "train_rows_per_sec": 25470.3342265343
308
  },
309
  {
310
  "epoch": 8.0,
311
+ "train_loss": 0.6027121601420622,
312
+ "valid_loss": 0.5947417731208476,
313
+ "train_accuracy": 0.8130380424635698,
314
+ "valid_accuracy": 0.8077346820317728,
315
+ "lr": 0.001,
316
+ "train_seconds": 62.91284818807617,
317
+ "eval_seconds": 33.667090175207704,
318
+ "epoch_seconds": 96.57993836328387,
319
+ "train_rows_per_sec": 25795.954987578938
320
+ },
321
+ {
322
+ "epoch": 9.0,
323
+ "train_loss": 0.5878799089685975,
324
+ "valid_loss": 0.5691886309865292,
325
+ "train_accuracy": 0.8229289967262248,
326
+ "valid_accuracy": 0.8167980982168935,
327
+ "lr": 0.001,
328
+ "train_seconds": 63.03727223165333,
329
+ "eval_seconds": 33.70051255216822,
330
+ "epoch_seconds": 96.73778478382155,
331
+ "train_rows_per_sec": 25745.038491451152
332
+ },
333
+ {
334
+ "epoch": 10.0,
335
+ "train_loss": 0.5819709924117248,
336
+ "valid_loss": 0.565472413157245,
337
+ "train_accuracy": 0.8250554409799267,
338
+ "valid_accuracy": 0.8174136637052976,
339
+ "lr": 0.001,
340
+ "train_seconds": 63.19497093511745,
341
+ "eval_seconds": 34.04710213886574,
342
+ "epoch_seconds": 97.24207307398319,
343
+ "train_rows_per_sec": 25680.793518620892
344
+ },
345
+ {
346
+ "epoch": 11.0,
347
+ "train_loss": 0.5658281126985039,
348
+ "valid_loss": 0.5592924923775101,
349
+ "train_accuracy": 0.8270826799236181,
350
+ "valid_accuracy": 0.8188998938935164,
351
+ "lr": 0.001,
352
+ "train_seconds": 63.33684863895178,
353
+ "eval_seconds": 33.97817206289619,
354
+ "epoch_seconds": 97.31502070184797,
355
+ "train_rows_per_sec": 25623.267258704884
356
+ },
357
+ {
358
+ "epoch": 12.0,
359
+ "train_loss": 0.5546503029411147,
360
+ "valid_loss": 0.5446304631030402,
361
+ "train_accuracy": 0.8322715489645985,
362
+ "valid_accuracy": 0.8235360447791543,
363
+ "lr": 0.001,
364
+ "train_seconds": 63.314998568966985,
365
+ "eval_seconds": 34.06828756863251,
366
+ "epoch_seconds": 97.3832861375995,
367
+ "train_rows_per_sec": 25632.109874127702
368
+ },
369
+ {
370
+ "epoch": 13.0,
371
+ "train_loss": 0.5455316337313185,
372
+ "valid_loss": 0.542088924317369,
373
+ "train_accuracy": 0.8345249267205498,
374
+ "valid_accuracy": 0.825070337137639,
375
+ "lr": 0.001,
376
+ "train_seconds": 63.744275709148496,
377
+ "eval_seconds": 33.986425776965916,
378
+ "epoch_seconds": 97.73070148611441,
379
+ "train_rows_per_sec": 25459.493922323818
380
+ },
381
+ {
382
+ "epoch": 14.0,
383
+ "train_loss": 0.5374383660709068,
384
+ "valid_loss": 0.546989832122745,
385
+ "train_accuracy": 0.833115102190712,
386
+ "valid_accuracy": 0.8232458232125494,
387
+ "lr": 0.001,
388
+ "train_seconds": 63.319708260241896,
389
+ "eval_seconds": 34.049483039882034,
390
+ "epoch_seconds": 97.36919130012393,
391
+ "train_rows_per_sec": 25630.203369382994
392
+ },
393
+ {
394
+ "epoch": 15.0,
395
+ "train_loss": 0.5287376385946003,
396
+ "valid_loss": 0.5553689658191119,
397
+ "train_accuracy": 0.8307637514888498,
398
+ "valid_accuracy": 0.8197114051530041,
399
+ "lr": 0.001,
400
+ "train_seconds": 63.43099932698533,
401
+ "eval_seconds": 33.6594194509089,
402
+ "epoch_seconds": 97.09041877789423,
403
+ "train_rows_per_sec": 25585.234620599364
404
+ },
405
+ {
406
+ "epoch": 16.0,
407
+ "train_loss": 0.5214578927503399,
408
+ "valid_loss": 0.5328890868869306,
409
+ "train_accuracy": 0.8394556154826831,
410
+ "valid_accuracy": 0.8273348047751615,
411
+ "lr": 0.001,
412
+ "train_seconds": 63.4428806649521,
413
+ "eval_seconds": 33.94598149927333,
414
+ "epoch_seconds": 97.38886216422543,
415
+ "train_rows_per_sec": 25580.443116551938
416
+ },
417
+ {
418
+ "epoch": 17.0,
419
+ "train_loss": 0.5136345790951786,
420
+ "valid_loss": 0.5242198813277066,
421
+ "train_accuracy": 0.8428483138486299,
422
+ "valid_accuracy": 0.8300041037699227,
423
+ "lr": 0.001,
424
+ "train_seconds": 63.277302644215524,
425
+ "eval_seconds": 33.96833814168349,
426
+ "epoch_seconds": 97.24564078589901,
427
+ "train_rows_per_sec": 25647.3795845082
428
+ },
429
+ {
430
+ "epoch": 18.0,
431
+ "train_loss": 0.5085902087883994,
432
+ "valid_loss": 0.5208335089548324,
433
+ "train_accuracy": 0.8451756334505517,
434
+ "valid_accuracy": 0.8317565244396136,
435
+ "lr": 0.001,
436
+ "train_seconds": 63.33510157139972,
437
+ "eval_seconds": 34.10430253529921,
438
+ "epoch_seconds": 97.43940410669893,
439
+ "train_rows_per_sec": 25623.974063899706
440
+ },
441
+ {
442
+ "epoch": 19.0,
443
+ "train_loss": 0.5016847469641207,
444
+ "valid_loss": 0.5300784743688508,
445
+ "train_accuracy": 0.8426579135952559,
446
+ "valid_accuracy": 0.8282258034700887,
447
+ "lr": 0.001,
448
+ "train_seconds": 63.72320907516405,
449
+ "eval_seconds": 33.997835143934935,
450
+ "epoch_seconds": 97.72104421909899,
451
+ "train_rows_per_sec": 25467.910727561266
452
+ },
453
+ {
454
+ "epoch": 20.0,
455
+ "train_loss": 0.49550204444382845,
456
+ "valid_loss": 0.5166273402694493,
457
+ "train_accuracy": 0.8465041219498218,
458
+ "valid_accuracy": 0.8319654100257687,
459
+ "lr": 0.001,
460
+ "train_seconds": 63.395974493119866,
461
+ "eval_seconds": 33.953488319180906,
462
+ "epoch_seconds": 97.34946281230077,
463
+ "train_rows_per_sec": 25599.369880750506
464
+ },
465
+ {
466
+ "epoch": 21.0,
467
+ "train_loss": 0.48959602875288355,
468
+ "valid_loss": 0.5132080860759901,
469
+ "train_accuracy": 0.8497785133622159,
470
+ "valid_accuracy": 0.8336475859850712,
471
+ "lr": 0.001,
472
+ "train_seconds": 63.34947727294639,
473
+ "eval_seconds": 34.09483556402847,
474
+ "epoch_seconds": 97.44431283697486,
475
+ "train_rows_per_sec": 25618.159294473986
476
+ },
477
+ {
478
+ "epoch": 22.0,
479
+ "train_loss": 0.4840707175175098,
480
+ "valid_loss": 0.5225206141435808,
481
+ "train_accuracy": 0.8487371656981312,
482
+ "valid_accuracy": 0.8317047651793273,
483
+ "lr": 0.001,
484
+ "train_seconds": 63.332320482004434,
485
+ "eval_seconds": 33.94683784805238,
486
+ "epoch_seconds": 97.27915833005682,
487
+ "train_rows_per_sec": 25625.099280250408
488
+ },
489
+ {
490
+ "epoch": 23.0,
491
+ "train_loss": 0.47849724452578307,
492
+ "valid_loss": 0.508108733450758,
493
+ "train_accuracy": 0.8548768036418823,
494
+ "valid_accuracy": 0.8372060351297493,
495
+ "lr": 0.001,
496
+ "train_seconds": 62.94049229286611,
497
+ "eval_seconds": 33.64570001279935,
498
+ "epoch_seconds": 96.58619230566546,
499
+ "train_rows_per_sec": 25784.625141610857
500
+ },
501
+ {
502
+ "epoch": 24.0,
503
+ "train_loss": 0.4743075716006643,
504
+ "valid_loss": 0.5187592181907034,
505
+ "train_accuracy": 0.8523627808788851,
506
+ "valid_accuracy": 0.8339969609920032,
507
+ "lr": 0.001,
508
+ "train_seconds": 62.940594538580626,
509
+ "eval_seconds": 33.573294749017805,
510
+ "epoch_seconds": 96.51388928759843,
511
+ "train_rows_per_sec": 25784.583255012225
512
+ },
513
+ {
514
+ "epoch": 25.0,
515
+ "train_loss": 0.4686912119200553,
516
+ "valid_loss": 0.5063637984046864,
517
+ "train_accuracy": 0.8556100602810899,
518
+ "valid_accuracy": 0.8371653671395245,
519
+ "lr": 0.001,
520
+ "train_seconds": 63.331458281259984,
521
+ "eval_seconds": 33.37883689114824,
522
+ "epoch_seconds": 96.71029517240822,
523
+ "train_rows_per_sec": 25625.448142889538
524
+ },
525
+ {
526
+ "epoch": 26.0,
527
+ "train_loss": 0.46572147837196615,
528
+ "valid_loss": 0.502626194733077,
529
+ "train_accuracy": 0.8581450332337789,
530
+ "valid_accuracy": 0.8381987038002389,
531
+ "lr": 0.001,
532
+ "train_seconds": 63.06501075765118,
533
+ "eval_seconds": 33.2926743873395,
534
+ "epoch_seconds": 96.35768514499068,
535
+ "train_rows_per_sec": 25733.71478895858
536
+ },
537
+ {
538
+ "epoch": 27.0,
539
+ "train_loss": 0.46094266448863297,
540
+ "valid_loss": 0.502584141177356,
541
+ "train_accuracy": 0.8593792458794366,
542
+ "valid_accuracy": 0.8384963195468846,
543
+ "lr": 0.001,
544
+ "train_seconds": 62.76579191396013,
545
+ "eval_seconds": 33.69062760518864,
546
+ "epoch_seconds": 96.45641951914877,
547
+ "train_rows_per_sec": 25856.393275889528
548
+ },
549
+ {
550
+ "epoch": 28.0,
551
+ "train_loss": 0.4558331838917657,
552
+ "valid_loss": 0.5052939294529322,
553
+ "train_accuracy": 0.8593059202155159,
554
+ "valid_accuracy": 0.8372041865847392,
555
+ "lr": 0.001,
556
+ "train_seconds": 62.96537010092288,
557
+ "eval_seconds": 33.25173534685746,
558
+ "epoch_seconds": 96.21710544778034,
559
+ "train_rows_per_sec": 25774.43755827639
560
+ },
561
+ {
562
+ "epoch": 29.0,
563
+ "train_loss": 0.4565059190668894,
564
+ "valid_loss": 0.5004870219469522,
565
+ "train_accuracy": 0.86285574500415,
566
+ "valid_accuracy": 0.8397366932487439,
567
+ "lr": 0.001,
568
+ "train_seconds": 62.873661659192294,
569
+ "eval_seconds": 33.49827020801604,
570
+ "epoch_seconds": 96.37193186720833,
571
+ "train_rows_per_sec": 25812.03252956603
572
+ },
573
+ {
574
+ "epoch": 30.0,
575
+ "train_loss": 0.4475665768990381,
576
+ "valid_loss": 0.501518010755117,
577
+ "train_accuracy": 0.8612709247721821,
578
+ "valid_accuracy": 0.838507410816946,
579
+ "lr": 0.001,
580
+ "train_seconds": 63.05255681602284,
581
+ "eval_seconds": 34.09806349920109,
582
+ "epoch_seconds": 97.15062031522393,
583
+ "train_rows_per_sec": 25738.797630924797
584
+ },
585
+ {
586
+ "epoch": 31.0,
587
+ "train_loss": 0.44393566570447446,
588
+ "valid_loss": 0.5087924569788862,
589
+ "train_accuracy": 0.8623486271772023,
590
+ "valid_accuracy": 0.8377217791876015,
591
+ "lr": 0.001,
592
+ "train_seconds": 63.35609852382913,
593
+ "eval_seconds": 34.17835011333227,
594
+ "epoch_seconds": 97.5344486371614,
595
+ "train_rows_per_sec": 25615.48197904903
596
+ },
597
+ {
598
+ "epoch": 32.0,
599
+ "train_loss": 0.44107461225723243,
600
+ "valid_loss": 0.5111384269533176,
601
+ "train_accuracy": 0.8630677116292654,
602
+ "valid_accuracy": 0.8384464088316086,
603
+ "lr": 0.001,
604
+ "train_seconds": 63.45186144113541,
605
+ "eval_seconds": 33.95439840015024,
606
+ "epoch_seconds": 97.40625984128565,
607
+ "train_rows_per_sec": 25576.822541377598
608
+ },
609
+ {
610
+ "epoch": 33.0,
611
+ "train_loss": 0.43758223716768935,
612
+ "valid_loss": 0.49973840580545437,
613
+ "train_accuracy": 0.8660907007653598,
614
+ "valid_accuracy": 0.840485353977884,
615
+ "lr": 0.001,
616
+ "train_seconds": 63.224658409599215,
617
+ "eval_seconds": 33.89740962907672,
618
+ "epoch_seconds": 97.12206803867593,
619
+ "train_rows_per_sec": 25668.73496549568
620
+ },
621
+ {
622
+ "epoch": 34.0,
623
+ "train_loss": 0.4336172381786142,
624
+ "valid_loss": 0.5000819149224655,
625
+ "train_accuracy": 0.8677285126536065,
626
+ "valid_accuracy": 0.8412377117970445,
627
+ "lr": 0.001,
628
+ "train_seconds": 63.381494055036455,
629
+ "eval_seconds": 33.83945573028177,
630
+ "epoch_seconds": 97.22094978531823,
631
+ "train_rows_per_sec": 25605.21843474973
632
+ },
633
+ {
634
+ "epoch": 35.0,
635
+ "train_loss": 0.42942445964467263,
636
+ "valid_loss": 0.5066212020772166,
637
+ "train_accuracy": 0.8674345938158737,
638
+ "valid_accuracy": 0.8402210120414222,
639
+ "lr": 0.001,
640
+ "train_seconds": 63.38268358493224,
641
+ "eval_seconds": 33.69065831974149,
642
+ "epoch_seconds": 97.07334190467373,
643
+ "train_rows_per_sec": 25604.73789067849
644
+ },
645
+ {
646
+ "epoch": 36.0,
647
+ "train_loss": 0.42654681942816414,
648
+ "valid_loss": 0.4978872144380003,
649
+ "train_accuracy": 0.8704711389570626,
650
+ "valid_accuracy": 0.8418015180251623,
651
+ "lr": 0.001,
652
+ "train_seconds": 63.19224369432777,
653
+ "eval_seconds": 33.944326273631305,
654
+ "epoch_seconds": 97.13656996795908,
655
+ "train_rows_per_sec": 25681.901846217777
656
+ },
657
+ {
658
+ "epoch": 37.0,
659
+ "train_loss": 0.424747936770743,
660
+ "valid_loss": 0.5056363287855411,
661
+ "train_accuracy": 0.8679164481787816,
662
+ "valid_accuracy": 0.8394649571322412,
663
+ "lr": 0.001,
664
+ "train_seconds": 63.22434198483825,
665
+ "eval_seconds": 34.19630459835753,
666
+ "epoch_seconds": 97.42064658319578,
667
+ "train_rows_per_sec": 25668.863432207567
668
+ },
669
+ {
670
+ "epoch": 38.0,
671
+ "train_loss": 0.4224049084382102,
672
+ "valid_loss": 0.5032070239685433,
673
+ "train_accuracy": 0.8701470271988918,
674
+ "valid_accuracy": 0.840278316936739,
675
+ "lr": 0.001,
676
+ "train_seconds": 63.390172947663814,
677
+ "eval_seconds": 33.98761875927448,
678
+ "epoch_seconds": 97.3777917069383,
679
+ "train_rows_per_sec": 25601.712766108023
680
+ },
681
+ {
682
+ "epoch": 39.0,
683
+ "train_loss": 0.41783615943009167,
684
+ "valid_loss": 0.4948694319490674,
685
+ "train_accuracy": 0.8743228929500764,
686
+ "valid_accuracy": 0.8441436245531142,
687
+ "lr": 0.001,
688
+ "train_seconds": 63.22260568803176,
689
+ "eval_seconds": 33.92868220806122,
690
+ "epoch_seconds": 97.15128789609298,
691
+ "train_rows_per_sec": 25669.568382045025
692
+ },
693
+ {
694
+ "epoch": 40.0,
695
+ "train_loss": 0.41417582740166964,
696
+ "valid_loss": 0.49532948228722484,
697
+ "train_accuracy": 0.8748010502206855,
698
+ "valid_accuracy": 0.843975406957184,
699
+ "lr": 0.001,
700
+ "train_seconds": 63.263892388902605,
701
+ "eval_seconds": 33.99912789603695,
702
+ "epoch_seconds": 97.26302028493956,
703
+ "train_rows_per_sec": 25652.81614390011
704
+ },
705
+ {
706
+ "epoch": 41.0,
707
+ "train_loss": 0.4119304350874025,
708
+ "valid_loss": 0.5005550107342985,
709
+ "train_accuracy": 0.8746808947209835,
710
+ "valid_accuracy": 0.8430474373620523,
711
+ "lr": 0.001,
712
+ "train_seconds": 63.1627330170013,
713
+ "eval_seconds": 33.891046753153205,
714
+ "epoch_seconds": 97.0537797701545,
715
+ "train_rows_per_sec": 25693.900857063458
716
+ },
717
+ {
718
+ "epoch": 42.0,
719
+ "train_loss": 0.4088314933167647,
720
+ "valid_loss": 0.4987784830293493,
721
+ "train_accuracy": 0.8753513007911161,
722
+ "valid_accuracy": 0.8425926952895376,
723
+ "lr": 0.001,
724
+ "train_seconds": 63.21076052309945,
725
+ "eval_seconds": 34.080719009041786,
726
+ "epoch_seconds": 97.29147953214124,
727
+ "train_rows_per_sec": 25674.378643283937
728
+ },
729
+ {
730
+ "epoch": 43.0,
731
+ "train_loss": 0.40698394876925353,
732
+ "valid_loss": 0.5021275761334792,
733
+ "train_accuracy": 0.8761332358122542,
734
+ "valid_accuracy": 0.8433321132936266,
735
+ "lr": 0.001,
736
+ "train_seconds": 62.83131029084325,
737
+ "eval_seconds": 33.47180753201246,
738
+ "epoch_seconds": 96.30311782285571,
739
+ "train_rows_per_sec": 25829.431098725847
740
+ },
741
+ {
742
+ "epoch": 44.0,
743
+ "train_loss": 0.40532815200673294,
744
+ "valid_loss": 0.4974711690598039,
745
+ "train_accuracy": 0.878889418120805,
746
+ "valid_accuracy": 0.8449921067128063,
747
+ "lr": 0.001,
748
+ "train_seconds": 63.32379973074421,
749
+ "eval_seconds": 33.24089104682207,
750
+ "epoch_seconds": 96.56469077756628,
751
+ "train_rows_per_sec": 25628.547353453752
752
+ },
753
+ {
754
+ "epoch": 45.0,
755
+ "train_loss": 0.40171810097122795,
756
+ "valid_loss": 0.5032399542390286,
757
+ "train_accuracy": 0.8774512492166786,
758
+ "valid_accuracy": 0.8435206648846693,
759
+ "lr": 0.001,
760
+ "train_seconds": 62.93412214005366,
761
+ "eval_seconds": 33.482022404205054,
762
+ "epoch_seconds": 96.41614454425871,
763
+ "train_rows_per_sec": 25787.23504537655
764
+ },
765
+ {
766
+ "epoch": 46.0,
767
+ "train_loss": 0.39931669598122127,
768
+ "valid_loss": 0.5028289541292281,
769
+ "train_accuracy": 0.8779300226693376,
770
+ "valid_accuracy": 0.8437850068211311,
771
+ "lr": 0.001,
772
+ "train_seconds": 62.876390965189785,
773
+ "eval_seconds": 33.69999274611473,
774
+ "epoch_seconds": 96.57638371130452,
775
+ "train_rows_per_sec": 25810.91209415126
776
+ },
777
+ {
778
+ "epoch": 47.0,
779
+ "train_loss": 0.39676706285130714,
780
+ "valid_loss": 0.500185925309284,
781
+ "train_accuracy": 0.8799313819669393,
782
+ "valid_accuracy": 0.8439735584121738,
783
+ "lr": 0.001,
784
+ "train_seconds": 62.65322900284082,
785
+ "eval_seconds": 33.51263489108533,
786
+ "epoch_seconds": 96.16586389392614,
787
+ "train_rows_per_sec": 25902.846921527616
788
+ },
789
+ {
790
+ "epoch": 48.0,
791
+ "train_loss": 0.3954523505848665,
792
+ "valid_loss": 0.49874948486263226,
793
+ "train_accuracy": 0.8813553786839214,
794
+ "valid_accuracy": 0.8454080293401064,
795
+ "lr": 0.001,
796
+ "train_seconds": 62.96290503628552,
797
+ "eval_seconds": 33.50567141920328,
798
+ "epoch_seconds": 96.4685764554888,
799
+ "train_rows_per_sec": 25775.446654895044
800
+ },
801
+ {
802
+ "epoch": 49.0,
803
+ "train_loss": 0.3928473410170161,
804
+ "valid_loss": 0.5009219435189758,
805
+ "train_accuracy": 0.8814336338042402,
806
+ "valid_accuracy": 0.8449181649123975,
807
+ "lr": 0.001,
808
+ "train_seconds": 62.933298285119236,
809
+ "eval_seconds": 33.53859194600955,
810
+ "epoch_seconds": 96.47189023112878,
811
+ "train_rows_per_sec": 25787.57262407362
812
+ },
813
+ {
814
+ "epoch": 50.0,
815
+ "train_loss": 0.3908199260663535,
816
+ "valid_loss": 0.5015645899258849,
817
+ "train_accuracy": 0.8812463144611149,
818
+ "valid_accuracy": 0.844964378537653,
819
+ "lr": 0.001,
820
+ "train_seconds": 63.514217879623175,
821
+ "eval_seconds": 33.935506734997034,
822
+ "epoch_seconds": 97.44972461462021,
823
+ "train_rows_per_sec": 25551.711950162622
824
+ },
825
+ {
826
+ "epoch": 51.0,
827
+ "train_loss": 0.3881921176466656,
828
+ "valid_loss": 0.5009191166363051,
829
+ "train_accuracy": 0.8833382525200305,
830
+ "valid_accuracy": 0.845570701301006,
831
+ "lr": 0.001,
832
+ "train_seconds": 63.34409616421908,
833
+ "eval_seconds": 34.00553934276104,
834
+ "epoch_seconds": 97.34963550698012,
835
+ "train_rows_per_sec": 25620.33556833224
836
  }
837
  ],
838
  "train_result": {
839
  "metrics": {
840
+ "train_logloss": 0.3317659795132071,
841
+ "train_accuracy": 0.8833382525200305,
842
+ "train_f1_macro": 0.7447494709952788,
843
+ "valid_logloss": 0.5006793475467268,
844
+ "valid_accuracy": 0.845570701301006,
845
+ "valid_f1_macro": 0.5819535036954402,
846
+ "test_logloss": 0.50240012996618,
847
+ "test_accuracy": 0.8443469645042387,
848
+ "test_f1_macro": 0.6060827027497421,
849
+ "overfit_gap_valid_logloss": 0.16891336803351975,
850
+ "overfit_gap_test_logloss": 0.17063415045297292,
851
+ "overfit_gap_valid_f1_macro": 0.16279596729983858,
852
+ "overfit_gap_test_f1_macro": 0.1386667682455367,
853
+ "best_epoch": 39.0,
854
+ "best_valid_logloss": 0.5006793475467268,
855
+ "best_valid_accuracy": 0.845570701301006,
856
+ "best_valid_f1_macro": 0.5819535036954402
857
  },
858
  "n_rows": 2704829,
859
  "n_features": 56,