ribesstefano commited on
Commit
af175fa
·
verified ·
1 Parent(s): a4ef32a

Training in progress, step 10000, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e6cbbdadb20e64f15020e12e55a078248311e1c567876699b4eaa4cb8702b5b5
3
  size 409608164
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36370843d1d338dddd594e733dae27f05afc004e2523c3386fdaf524aabe6609
3
  size 409608164
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:758abb36ef13388f8f3eca1eb622dac5b2c61c10eea0fcb8626ab377f7e69eb2
3
  size 814647162
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:378fd576cfae3e233cce3eacb8db2b87c8b786da267ce70ad55847ef31647f54
3
  size 814647162
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e73cd41e4817e0862853abe9773b0e01081cac4bb2de2949d6cd33bd2894c93d
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79869b2e85a7837bbc4b2150e9097dcfdcaeff6d2060f8e854fab9dfebd663d8
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a7c3ad366a455d36d790316ad7de46df5551299c0b50500acfaef90eebc7bbcf
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d92c5a2febec6a3debc54e07f631908af44ee341af8b138c2ac3072c6cfbde8
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.0,
3
- "best_model_checkpoint": "/mimer/NOBACKUP/groups/naiss2023-6-290/stefano/models//PROTAC-Splitter-EncoderDecoder-lr_cosine-opt25-rand-smiles/trial-number=21-learning_rate=1.6e-06-warmup_ratio=0.080-num_cycles=1.500/checkpoint-5000",
4
- "epoch": 0.49319392385085814,
5
  "eval_steps": 2500,
6
- "global_step": 5000,
7
  "is_hyper_param_search": true,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -119,6 +119,160 @@
119
  "eval_tanimoto_similarity": 0.0,
120
  "eval_valid": 0.1528060097216085,
121
  "step": 5000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
122
  }
123
  ],
124
  "logging_steps": 500,
@@ -133,12 +287,12 @@
133
  "should_evaluate": false,
134
  "should_log": false,
135
  "should_save": true,
136
- "should_training_stop": false
137
  },
138
  "attributes": {}
139
  }
140
  },
141
- "total_flos": 4.364959997072179e+16,
142
  "train_batch_size": 128,
143
  "trial_name": "trial-number=21-learning_rate=1.6e-06-warmup_ratio=0.080-num_cycles=1.500",
144
  "trial_params": {
 
1
  {
2
+ "best_metric": 8.837825894829872e-05,
3
+ "best_model_checkpoint": "/mimer/NOBACKUP/groups/naiss2023-6-290/stefano/models//PROTAC-Splitter-EncoderDecoder-lr_cosine-opt25-rand-smiles/trial-number=21-learning_rate=1.6e-06-warmup_ratio=0.080-num_cycles=1.500/checkpoint-10000",
4
+ "epoch": 0.9863878477017163,
5
  "eval_steps": 2500,
6
+ "global_step": 10000,
7
  "is_hyper_param_search": true,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
119
  "eval_tanimoto_similarity": 0.0,
120
  "eval_valid": 0.1528060097216085,
121
  "step": 5000
122
+ },
123
+ {
124
+ "epoch": 0.542513316235944,
125
+ "grad_norm": 1.3835140466690063,
126
+ "learning_rate": 9.304780137412219e-07,
127
+ "loss": 0.8874,
128
+ "step": 5500
129
+ },
130
+ {
131
+ "epoch": 0.5918327086210298,
132
+ "grad_norm": 1.3169989585876465,
133
+ "learning_rate": 1.302486007417367e-06,
134
+ "loss": 0.8215,
135
+ "step": 6000
136
+ },
137
+ {
138
+ "epoch": 0.6411521010061156,
139
+ "grad_norm": 1.280273675918579,
140
+ "learning_rate": 1.5501941814704978e-06,
141
+ "loss": 0.7438,
142
+ "step": 6500
143
+ },
144
+ {
145
+ "epoch": 0.6904714933912014,
146
+ "grad_norm": 1.4349747896194458,
147
+ "learning_rate": 1.6113648928799203e-06,
148
+ "loss": 0.669,
149
+ "step": 7000
150
+ },
151
+ {
152
+ "epoch": 0.7397908857762873,
153
+ "grad_norm": 1.2315547466278076,
154
+ "learning_rate": 1.4706287622758396e-06,
155
+ "loss": 0.6043,
156
+ "step": 7500
157
+ },
158
+ {
159
+ "epoch": 0.7397908857762873,
160
+ "eval_all_ligands_equal": 0.0,
161
+ "eval_e3_equal": 0.05612019443216969,
162
+ "eval_e3_graph_edit_distance": 9.999999999999999e+63,
163
+ "eval_e3_graph_edit_distance_norm": 1.0,
164
+ "eval_e3_has_attachment_point(s)": 0.9729562527618206,
165
+ "eval_e3_heavy_atoms_difference": 0.5429960229783474,
166
+ "eval_e3_heavy_atoms_difference_norm": -0.029541020730058737,
167
+ "eval_e3_tanimoto_similarity": 0.0,
168
+ "eval_e3_valid": 0.9729562527618206,
169
+ "eval_has_all_attachment_points": 0.7827662395050817,
170
+ "eval_has_three_substructures": 0.9756076005302695,
171
+ "eval_heavy_atoms_difference": 61.464250994255416,
172
+ "eval_heavy_atoms_difference_norm": 0.796061917426111,
173
+ "eval_linker_equal": 0.0015024304021210783,
174
+ "eval_linker_graph_edit_distance": 9.999999999999999e+63,
175
+ "eval_linker_graph_edit_distance_norm": 1.0,
176
+ "eval_linker_has_attachment_point(s)": 0.9462660185594344,
177
+ "eval_linker_heavy_atoms_difference": 7.653822359699514,
178
+ "eval_linker_heavy_atoms_difference_norm": 0.35586072765620425,
179
+ "eval_linker_tanimoto_similarity": 0.0,
180
+ "eval_linker_valid": 0.9462660185594344,
181
+ "eval_loss": 0.6581697463989258,
182
+ "eval_num_fragments": 3.012372956252762,
183
+ "eval_poi_equal": 0.0015024304021210783,
184
+ "eval_poi_graph_edit_distance": 9.999999999999999e+63,
185
+ "eval_poi_graph_edit_distance_norm": 1.0,
186
+ "eval_poi_has_attachment_point(s)": 0.3093239063190455,
187
+ "eval_poi_heavy_atoms_difference": 25.47229341581971,
188
+ "eval_poi_heavy_atoms_difference_norm": 0.778111477675356,
189
+ "eval_poi_tanimoto_similarity": 0.0,
190
+ "eval_poi_valid": 0.3093239063190455,
191
+ "eval_reassembly": 0.0,
192
+ "eval_reassembly_nostereo": 0.0,
193
+ "eval_runtime": 1364.8374,
194
+ "eval_samples_per_second": 8.29,
195
+ "eval_steps_per_second": 0.13,
196
+ "eval_tanimoto_similarity": 0.0,
197
+ "eval_valid": 0.2988952717631463,
198
+ "step": 7500
199
+ },
200
+ {
201
+ "epoch": 0.789110278161373,
202
+ "grad_norm": 1.26154363155365,
203
+ "learning_rate": 1.1633462903366549e-06,
204
+ "loss": 0.5573,
205
+ "step": 8000
206
+ },
207
+ {
208
+ "epoch": 0.8384296705464589,
209
+ "grad_norm": 1.3200926780700684,
210
+ "learning_rate": 7.667233943405157e-07,
211
+ "loss": 0.5213,
212
+ "step": 8500
213
+ },
214
+ {
215
+ "epoch": 0.8877490629315447,
216
+ "grad_norm": 1.1365368366241455,
217
+ "learning_rate": 3.804131208984208e-07,
218
+ "loss": 0.5012,
219
+ "step": 9000
220
+ },
221
+ {
222
+ "epoch": 0.9370684553166305,
223
+ "grad_norm": 1.3047261238098145,
224
+ "learning_rate": 1.014774300592085e-07,
225
+ "loss": 0.4905,
226
+ "step": 9500
227
+ },
228
+ {
229
+ "epoch": 0.9863878477017163,
230
+ "grad_norm": 1.003517985343933,
231
+ "learning_rate": 0.0,
232
+ "loss": 0.4875,
233
+ "step": 10000
234
+ },
235
+ {
236
+ "epoch": 0.9863878477017163,
237
+ "eval_all_ligands_equal": 8.837825894829872e-05,
238
+ "eval_e3_equal": 0.07397260273972603,
239
+ "eval_e3_graph_edit_distance": 9.999999999999999e+63,
240
+ "eval_e3_graph_edit_distance_norm": 1.0,
241
+ "eval_e3_has_attachment_point(s)": 0.98285461776403,
242
+ "eval_e3_heavy_atoms_difference": -0.7978789217852408,
243
+ "eval_e3_heavy_atoms_difference_norm": -0.06986969786045168,
244
+ "eval_e3_tanimoto_similarity": 0.0,
245
+ "eval_e3_valid": 0.98285461776403,
246
+ "eval_has_all_attachment_points": 0.8105170128148476,
247
+ "eval_has_three_substructures": 0.9845338046840477,
248
+ "eval_heavy_atoms_difference": 54.63950508174989,
249
+ "eval_heavy_atoms_difference_norm": 0.7006005159368531,
250
+ "eval_linker_equal": 0.0016791869200176756,
251
+ "eval_linker_graph_edit_distance": 9.999999999999999e+63,
252
+ "eval_linker_graph_edit_distance_norm": 1.0,
253
+ "eval_linker_has_attachment_point(s)": 0.9719840919133893,
254
+ "eval_linker_heavy_atoms_difference": 7.197967300044189,
255
+ "eval_linker_heavy_atoms_difference_norm": 0.32378217560050643,
256
+ "eval_linker_tanimoto_similarity": 0.0,
257
+ "eval_linker_valid": 0.9719840919133893,
258
+ "eval_loss": 0.5798121094703674,
259
+ "eval_num_fragments": 3.00415377817057,
260
+ "eval_poi_equal": 0.009721608484312859,
261
+ "eval_poi_graph_edit_distance": 9.999999999999999e+63,
262
+ "eval_poi_graph_edit_distance_norm": 1.0,
263
+ "eval_poi_has_attachment_point(s)": 0.3849756959787892,
264
+ "eval_poi_heavy_atoms_difference": 22.694829871851525,
265
+ "eval_poi_heavy_atoms_difference_norm": 0.6749048721453627,
266
+ "eval_poi_tanimoto_similarity": 0.0,
267
+ "eval_poi_valid": 0.3849756959787892,
268
+ "eval_reassembly": 8.837825894829872e-05,
269
+ "eval_reassembly_nostereo": 8.837825894829872e-05,
270
+ "eval_runtime": 1432.419,
271
+ "eval_samples_per_second": 7.899,
272
+ "eval_steps_per_second": 0.124,
273
+ "eval_tanimoto_similarity": 0.0,
274
+ "eval_valid": 0.38011489173663277,
275
+ "step": 10000
276
  }
277
  ],
278
  "logging_steps": 500,
 
287
  "should_evaluate": false,
288
  "should_log": false,
289
  "should_save": true,
290
+ "should_training_stop": true
291
  },
292
  "attributes": {}
293
  }
294
  },
295
+ "total_flos": 8.729673191023411e+16,
296
  "train_batch_size": 128,
297
  "trial_name": "trial-number=21-learning_rate=1.6e-06-warmup_ratio=0.080-num_cycles=1.500",
298
  "trial_params": {