ribesstefano committed on
Commit
6241086
·
verified ·
1 Parent(s): 2dd00bf

Training in progress, step 20000, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3efb1b806a1369fca34a3e3273471a9c86ec0acbe20b2e1c6271278f4ada404a
3
  size 409608164
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:835536a9f4bc9598d2aa3d301a8969869c1e49d0f59b9b2fd55cab35a3ffcfcf
3
  size 409608164
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:110a93e7b792f45fc0500576ccbd59c0bb82a66066fe3977c2bcd7d8084b21d3
3
  size 814647162
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a29aea1f4bc620e4c56dc629ab7626d669e605a3ac2ec6a60c73ef081803e046
3
  size 814647162
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed8a996caa4721c8629cbedbae34cd38c3fcc2d3348e4fa1f806a13c16379e70
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d17dc07ba223f477f407e44715d157a31fe9df81f7f77bc0d31d54494107c73d
3
  size 14244
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.5455028328611898,
3
  "best_model_checkpoint": "/mimer/NOBACKUP/groups/naiss2023-6-290/stefano/models//PROTAC-Splitter-EncoderDecoder-lr_reduce-opt25-rand-smiles/checkpoint-10000",
4
- "epoch": 1.4795817715525745,
5
  "eval_steps": 2500,
6
- "global_step": 15000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -343,6 +343,76 @@
343
  "learning_rate": 5e-05,
344
  "loss": 0.0035,
345
  "step": 15000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
346
  }
347
  ],
348
  "logging_steps": 500,
@@ -362,7 +432,7 @@
362
  "attributes": {}
363
  }
364
  },
365
- "total_flos": 1.309637623513728e+17,
366
  "train_batch_size": 128,
367
  "trial_name": null,
368
  "trial_params": null
 
1
  {
2
  "best_metric": 0.5455028328611898,
3
  "best_model_checkpoint": "/mimer/NOBACKUP/groups/naiss2023-6-290/stefano/models//PROTAC-Splitter-EncoderDecoder-lr_reduce-opt25-rand-smiles/checkpoint-10000",
4
+ "epoch": 1.9727756954034326,
5
  "eval_steps": 2500,
6
+ "global_step": 20000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
343
  "learning_rate": 5e-05,
344
  "loss": 0.0035,
345
  "step": 15000
346
+ },
347
+ {
348
+ "epoch": 1.5289011639376602,
349
+ "grad_norm": 0.044646210968494415,
350
+ "learning_rate": 5e-05,
351
+ "loss": 0.0022,
352
+ "step": 15500
353
+ },
354
+ {
355
+ "epoch": 1.578220556322746,
356
+ "grad_norm": 0.04811064526438713,
357
+ "learning_rate": 5e-05,
358
+ "loss": 0.0021,
359
+ "step": 16000
360
+ },
361
+ {
362
+ "epoch": 1.627539948707832,
363
+ "grad_norm": 0.054762303829193115,
364
+ "learning_rate": 5e-05,
365
+ "loss": 0.0024,
366
+ "step": 16500
367
+ },
368
+ {
369
+ "epoch": 1.6768593410929178,
370
+ "grad_norm": 0.04429342970252037,
371
+ "learning_rate": 5e-05,
372
+ "loss": 0.0022,
373
+ "step": 17000
374
+ },
375
+ {
376
+ "epoch": 1.7261787334780037,
377
+ "grad_norm": 0.06518573313951492,
378
+ "learning_rate": 5e-05,
379
+ "loss": 0.0022,
380
+ "step": 17500
381
+ },
382
+ {
383
+ "epoch": 1.7754981258630895,
384
+ "grad_norm": 0.043648600578308105,
385
+ "learning_rate": 5e-05,
386
+ "loss": 0.0021,
387
+ "step": 18000
388
+ },
389
+ {
390
+ "epoch": 1.8248175182481752,
391
+ "grad_norm": 0.044574983417987823,
392
+ "learning_rate": 5e-05,
393
+ "loss": 0.0021,
394
+ "step": 18500
395
+ },
396
+ {
397
+ "epoch": 1.874136910633261,
398
+ "grad_norm": 0.05319111794233322,
399
+ "learning_rate": 5e-05,
400
+ "loss": 0.0021,
401
+ "step": 19000
402
+ },
403
+ {
404
+ "epoch": 1.9234563030183467,
405
+ "grad_norm": 0.05567469820380211,
406
+ "learning_rate": 5e-05,
407
+ "loss": 0.0021,
408
+ "step": 19500
409
+ },
410
+ {
411
+ "epoch": 1.9727756954034326,
412
+ "grad_norm": 0.045425355434417725,
413
+ "learning_rate": 5e-05,
414
+ "loss": 0.0019,
415
+ "step": 20000
416
  }
417
  ],
418
  "logging_steps": 500,
 
432
  "attributes": {}
433
  }
434
  },
435
+ "total_flos": 1.746034901972567e+17,
436
  "train_batch_size": 128,
437
  "trial_name": null,
438
  "trial_params": null