ribesstefano committed on
Commit
54eac4a
·
verified ·
1 Parent(s): 959b13a

Training in progress, step 500000, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fb6c56954e78dc0009a37a49227c9d09ca6b44ee0bf58f8054ecb3de57d1f0ca
3
  size 409608164
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6cfa7c7e92be438dcf3db7b213e9dec445fc69325f8af229476e4fade60f1c4f
3
  size 409608164
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:48c7a81d5ad9f4939a3a394ee2ec0cee99260435a555fb2a922706840415be41
3
  size 814647162
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47400866d2b3874aa8db515822b34e6309789728f282f9bb86b1432c96816298
3
  size 814647162
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:851e62cc221f5b89fc632a61a046dd22f6c0b1983df71dc5cf6a85d362878b7f
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bb40df1d2cacfe96f8a1f89857bbc3220c52b2d5fca642cb88aa8e9fbbc97a5
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2c87680c6a6ccbae9d154900996c944b2bf164f9842479579468f42223a09d2f
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6052cb7a9c038f97f0bff232e594126132c8dd3530545ea97f7bd3c6962c6a4
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.9890306854029252,
3
  "best_model_checkpoint": "/mimer/NOBACKUP/groups/naiss2023-6-290/stefano/models//PROTAC-Splitter-Trial-15/checkpoint-480000",
4
- "epoch": 45.88014981273408,
5
  "eval_steps": 10000,
6
- "global_step": 490000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -4235,6 +4235,118 @@
4235
  "eval_tanimoto_similarity": 0.0,
4236
  "eval_valid": 1.0,
4237
  "step": 490000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4238
  }
4239
  ],
4240
  "logging_steps": 1000,
@@ -4249,12 +4361,12 @@
4249
  "should_evaluate": false,
4250
  "should_log": false,
4251
  "should_save": true,
4252
- "should_training_stop": false
4253
  },
4254
  "attributes": {}
4255
  }
4256
  },
4257
- "total_flos": 4.214983293542787e+18,
4258
  "train_batch_size": 128,
4259
  "trial_name": null,
4260
  "trial_params": null
 
1
  {
2
  "best_metric": 0.9890306854029252,
3
  "best_model_checkpoint": "/mimer/NOBACKUP/groups/naiss2023-6-290/stefano/models//PROTAC-Splitter-Trial-15/checkpoint-480000",
4
+ "epoch": 46.81647940074907,
5
  "eval_steps": 10000,
6
+ "global_step": 500000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
4235
  "eval_tanimoto_similarity": 0.0,
4236
  "eval_valid": 1.0,
4237
  "step": 490000
4238
+ },
4239
+ {
4240
+ "epoch": 45.97378277153558,
4241
+ "grad_norm": 0.012753269635140896,
4242
+ "learning_rate": 8.518086768107509e-06,
4243
+ "loss": 0.0003,
4244
+ "step": 491000
4245
+ },
4246
+ {
4247
+ "epoch": 46.06741573033708,
4248
+ "grad_norm": 0.0015431916108354926,
4249
+ "learning_rate": 1.510764106820829e-05,
4250
+ "loss": 0.0003,
4251
+ "step": 492000
4252
+ },
4253
+ {
4254
+ "epoch": 46.161048689138575,
4255
+ "grad_norm": 0.02155626006424427,
4256
+ "learning_rate": 2.25881865139301e-05,
4257
+ "loss": 0.0004,
4258
+ "step": 493000
4259
+ },
4260
+ {
4261
+ "epoch": 46.254681647940075,
4262
+ "grad_norm": 0.01683797501027584,
4263
+ "learning_rate": 3.0298952869963953e-05,
4264
+ "loss": 0.0003,
4265
+ "step": 494000
4266
+ },
4267
+ {
4268
+ "epoch": 46.348314606741575,
4269
+ "grad_norm": 0.009855197742581367,
4270
+ "learning_rate": 3.750390492464676e-05,
4271
+ "loss": 0.0003,
4272
+ "step": 495000
4273
+ },
4274
+ {
4275
+ "epoch": 46.441947565543074,
4276
+ "grad_norm": 0.003276103874668479,
4277
+ "learning_rate": 4.351529023344395e-05,
4278
+ "loss": 0.0003,
4279
+ "step": 496000
4280
+ },
4281
+ {
4282
+ "epoch": 46.53558052434457,
4283
+ "grad_norm": 0.001958276843652129,
4284
+ "learning_rate": 4.775928888612517e-05,
4285
+ "loss": 0.0003,
4286
+ "step": 497000
4287
+ },
4288
+ {
4289
+ "epoch": 46.62921348314607,
4290
+ "grad_norm": 0.0038878321647644043,
4291
+ "learning_rate": 4.983891000015541e-05,
4292
+ "loss": 0.0003,
4293
+ "step": 498000
4294
+ },
4295
+ {
4296
+ "epoch": 46.72284644194757,
4297
+ "grad_norm": 0.0057247113436460495,
4298
+ "learning_rate": 4.816788519950127e-07,
4299
+ "loss": 0.0003,
4300
+ "step": 499000
4301
+ },
4302
+ {
4303
+ "epoch": 46.81647940074907,
4304
+ "grad_norm": 0.004408022854477167,
4305
+ "learning_rate": 3.17712320846264e-06,
4306
+ "loss": 0.0003,
4307
+ "step": 500000
4308
+ },
4309
+ {
4310
+ "epoch": 46.81647940074907,
4311
+ "eval_all_ligands_equal": 0.9880269572698595,
4312
+ "eval_e3_equal": 0.9950530542013192,
4313
+ "eval_e3_graph_edit_distance": Infinity,
4314
+ "eval_e3_graph_edit_distance_norm": Infinity,
4315
+ "eval_e3_has_attachment_point(s)": 1.0,
4316
+ "eval_e3_heavy_atoms_difference": 0.004086607398910238,
4317
+ "eval_e3_heavy_atoms_difference_norm": 0.00021304401339568784,
4318
+ "eval_e3_tanimoto_similarity": 0.0,
4319
+ "eval_e3_valid": 1.0,
4320
+ "eval_has_all_attachment_points": 1.0,
4321
+ "eval_has_three_substructures": 1.0,
4322
+ "eval_heavy_atoms_difference": -0.00014338973329509606,
4323
+ "eval_heavy_atoms_difference_norm": -2.106863305601476e-06,
4324
+ "eval_linker_equal": 0.9881703470031545,
4325
+ "eval_linker_graph_edit_distance": 0.11578720963579008,
4326
+ "eval_linker_graph_edit_distance_norm": Infinity,
4327
+ "eval_linker_has_attachment_point(s)": 1.0,
4328
+ "eval_linker_heavy_atoms_difference": -0.016633209062231143,
4329
+ "eval_linker_heavy_atoms_difference_norm": -0.0027458937792369477,
4330
+ "eval_linker_tanimoto_similarity": 0.0,
4331
+ "eval_linker_valid": 1.0,
4332
+ "eval_loss": 0.00021886541799176484,
4333
+ "eval_num_fragments": 3.0,
4334
+ "eval_poi_equal": 0.9930455979351879,
4335
+ "eval_poi_graph_edit_distance": Infinity,
4336
+ "eval_poi_graph_edit_distance_norm": Infinity,
4337
+ "eval_poi_has_attachment_point(s)": 1.0,
4338
+ "eval_poi_heavy_atoms_difference": 0.01240321193002581,
4339
+ "eval_poi_heavy_atoms_difference_norm": 0.00025383141098379934,
4340
+ "eval_poi_tanimoto_similarity": 0.0,
4341
+ "eval_poi_valid": 1.0,
4342
+ "eval_reassembly": 0.9997132205334098,
4343
+ "eval_reassembly_nostereo": 0.9997132205334098,
4344
+ "eval_runtime": 2712.3666,
4345
+ "eval_samples_per_second": 5.142,
4346
+ "eval_steps_per_second": 0.08,
4347
+ "eval_tanimoto_similarity": 0.0,
4348
+ "eval_valid": 1.0,
4349
+ "step": 500000
4350
  }
4351
  ],
4352
  "logging_steps": 1000,
 
4361
  "should_evaluate": false,
4362
  "should_log": false,
4363
  "should_save": true,
4364
+ "should_training_stop": true
4365
  },
4366
  "attributes": {}
4367
  }
4368
  },
4369
+ "total_flos": 4.3010984555114865e+18,
4370
  "train_batch_size": 128,
4371
  "trial_name": null,
4372
  "trial_params": null