ribesstefano committed on
Commit
31e9109
·
verified ·
1 Parent(s): d3c24b6

Training in progress, step 5000, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7bf9c6ea4115da7ecb26efa2880f84d13e203883e1744e63861c53658f9277f2
3
  size 409608164
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1982171a3f3820e5b58f6001600cc37642dc0186945f9750c194a1fa5b77dc7b
3
  size 409608164
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2b6e2d89d31809aafc6d9f1a3d4b804a258907c5f3f1057e64ab7c0b2b18e13b
3
  size 814647162
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df855786c8c1dcf532c502a2b833691d5e70e66943335a077622d762846c4f43
3
  size 814647162
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e864df1cdce41b5f6008f2f3056157fe1a59741e45538c35750dad335d89adcf
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e7771a01cd6f59c5ffb87e70f444df0eea884e2c0b2aaf819bce5c2c8e7a461
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3b2e2f4a4d698b32d29e4f198023bd7f534f0e63616c12fe3bd5d6eef023d892
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93005377f6086337612335e1f5fcb47fe8e2d6ecd39daaae4c9fed9a1602b473
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,278 +1,124 @@
1
  {
2
- "best_metric": 0.16827220503756077,
3
- "best_model_checkpoint": "/mimer/NOBACKUP/groups/naiss2023-6-290/stefano/models//PROTAC-Splitter-EncoderDecoder-lr_cosine-opt25-rand-smiles/trial-number=0-learning_rate=1.3e-05-warmup_ratio=0.100-num_cycles=7.500/checkpoint-10000",
4
- "epoch": 0.9863878477017163,
5
  "eval_steps": 2500,
6
- "global_step": 10000,
7
  "is_hyper_param_search": true,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.049319392385085814,
13
- "grad_norm": 1.1925102472305298,
14
- "learning_rate": 9.50852571041643e-06,
15
- "loss": 3.5759,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.09863878477017163,
20
- "grad_norm": 1.0559757947921753,
21
- "learning_rate": 6.9505467525657206e-06,
22
- "loss": 0.7964,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 0.14795817715525744,
27
- "grad_norm": 0.9585791230201721,
28
- "learning_rate": 2.6025037504397807e-06,
29
- "loss": 0.5237,
30
  "step": 1500
31
  },
32
  {
33
  "epoch": 0.19727756954034326,
34
- "grad_norm": 0.8004510998725891,
35
- "learning_rate": 1.2979375408792664e-05,
36
- "loss": 0.44,
37
  "step": 2000
38
  },
39
  {
40
  "epoch": 0.24659696192542907,
41
- "grad_norm": 0.5827901363372803,
42
- "learning_rate": 2.9673475846258797e-07,
43
- "loss": 0.3022,
44
  "step": 2500
45
  },
46
  {
47
  "epoch": 0.2959163543105149,
48
- "grad_norm": 0.9724856615066528,
49
- "learning_rate": 1.0734810793876912e-05,
50
- "loss": 0.2719,
51
  "step": 3000
52
  },
53
  {
54
  "epoch": 0.3452357466956007,
55
- "grad_norm": 0.5034233331680298,
56
- "learning_rate": 6.2863182132847955e-06,
57
- "loss": 0.2177,
58
  "step": 3500
59
  },
60
  {
61
  "epoch": 0.3945551390806865,
62
- "grad_norm": 0.5209541320800781,
63
- "learning_rate": 3.1491776008674324e-06,
64
- "loss": 0.1838,
65
  "step": 4000
66
  },
67
  {
68
  "epoch": 0.4438745314657723,
69
- "grad_norm": 0.5501710772514343,
70
- "learning_rate": 1.2746394296240856e-05,
71
- "loss": 0.1695,
72
  "step": 4500
73
  },
74
  {
75
  "epoch": 0.49319392385085814,
76
- "grad_norm": 0.6129121780395508,
77
- "learning_rate": 1.3243314463025088e-07,
78
- "loss": 0.1406,
79
  "step": 5000
80
  },
81
  {
82
  "epoch": 0.49319392385085814,
83
- "eval_all_ligands_equal": 0.007247017233760495,
84
- "eval_e3_equal": 0.39010163499779055,
85
  "eval_e3_graph_edit_distance": 9.999999999999999e+63,
86
  "eval_e3_graph_edit_distance_norm": 1.0,
87
- "eval_e3_has_attachment_point(s)": 0.997348652231551,
88
- "eval_e3_heavy_atoms_difference": -1.0644277507733098,
89
- "eval_e3_heavy_atoms_difference_norm": -0.05826937320242394,
90
  "eval_e3_tanimoto_similarity": 0.0,
91
- "eval_e3_valid": 0.997348652231551,
92
- "eval_has_all_attachment_points": 0.9711886875828546,
93
- "eval_has_three_substructures": 0.9977021652673442,
94
- "eval_heavy_atoms_difference": 11.813079982324348,
95
- "eval_heavy_atoms_difference_norm": 0.1508348868839678,
96
- "eval_linker_equal": 0.02615996464869642,
97
  "eval_linker_graph_edit_distance": 9.999999999999999e+63,
98
  "eval_linker_graph_edit_distance_norm": 1.0,
99
- "eval_linker_has_attachment_point(s)": 0.9928413610251878,
100
- "eval_linker_heavy_atoms_difference": 2.933097657976138,
101
- "eval_linker_heavy_atoms_difference_norm": 0.08887640414726028,
102
  "eval_linker_tanimoto_similarity": 0.0,
103
- "eval_linker_valid": 0.9928413610251878,
104
- "eval_loss": 0.33352142572402954,
105
  "eval_num_fragments": 2.9984091913389306,
106
- "eval_poi_equal": 0.4074237737516571,
107
  "eval_poi_graph_edit_distance": 9.999999999999999e+63,
108
  "eval_poi_graph_edit_distance_norm": 1.0,
109
- "eval_poi_has_attachment_point(s)": 0.8798055678303137,
110
- "eval_poi_heavy_atoms_difference": 3.964825452938577,
111
- "eval_poi_heavy_atoms_difference_norm": 0.11040993122450134,
112
  "eval_poi_tanimoto_similarity": 0.0,
113
- "eval_poi_valid": 0.8798055678303137,
114
- "eval_reassembly": 0.00760053026955369,
115
- "eval_reassembly_nostereo": 0.010251878038002652,
116
- "eval_runtime": 1609.8438,
117
- "eval_samples_per_second": 7.029,
118
- "eval_steps_per_second": 0.11,
119
- "eval_tanimoto_similarity": 0.0,
120
- "eval_valid": 0.8760936809544851,
121
- "step": 5000
122
- },
123
- {
124
- "epoch": 0.542513316235944,
125
- "grad_norm": 0.5318701863288879,
126
- "learning_rate": 1.1237446278275383e-05,
127
- "loss": 0.1316,
128
- "step": 5500
129
- },
130
- {
131
- "epoch": 0.5918327086210298,
132
- "grad_norm": 0.3978229761123657,
133
- "learning_rate": 5.625686628642194e-06,
134
- "loss": 0.1163,
135
- "step": 6000
136
- },
137
- {
138
- "epoch": 0.6411521010061156,
139
- "grad_norm": 0.3678536117076874,
140
- "learning_rate": 3.7307809795190627e-06,
141
- "loss": 0.1024,
142
- "step": 6500
143
- },
144
- {
145
- "epoch": 0.6904714933912014,
146
- "grad_norm": 0.4965149462223053,
147
- "learning_rate": 1.2452489342403467e-05,
148
- "loss": 0.0972,
149
- "step": 7000
150
- },
151
- {
152
- "epoch": 0.7397908857762873,
153
- "grad_norm": 0.4630180895328522,
154
- "learning_rate": 3.319116134821198e-08,
155
- "loss": 0.0827,
156
- "step": 7500
157
- },
158
- {
159
- "epoch": 0.7397908857762873,
160
- "eval_all_ligands_equal": 0.061511268228015906,
161
- "eval_e3_equal": 0.5425541316836058,
162
- "eval_e3_graph_edit_distance": 9.999999999999999e+63,
163
- "eval_e3_graph_edit_distance_norm": 1.0,
164
- "eval_e3_has_attachment_point(s)": 0.9982324348210341,
165
- "eval_e3_heavy_atoms_difference": -0.41617322138753865,
166
- "eval_e3_heavy_atoms_difference_norm": -0.030251585246387123,
167
- "eval_e3_tanimoto_similarity": 0.0,
168
- "eval_e3_valid": 0.9982324348210341,
169
- "eval_has_all_attachment_points": 0.9847105612019443,
170
- "eval_has_three_substructures": 0.9987627043747238,
171
- "eval_heavy_atoms_difference": 6.157048166151127,
172
- "eval_heavy_atoms_difference_norm": 0.0799003116743603,
173
- "eval_linker_equal": 0.12072470172337604,
174
- "eval_linker_graph_edit_distance": 9.999999999999999e+63,
175
- "eval_linker_graph_edit_distance_norm": 1.0,
176
- "eval_linker_has_attachment_point(s)": 0.9971718957136544,
177
- "eval_linker_heavy_atoms_difference": 1.4752982766239504,
178
- "eval_linker_heavy_atoms_difference_norm": 0.026323008455953905,
179
- "eval_linker_tanimoto_similarity": 0.0,
180
- "eval_linker_valid": 0.9971718957136544,
181
- "eval_loss": 0.31108492612838745,
182
- "eval_num_fragments": 2.999646486964207,
183
- "eval_poi_equal": 0.5619973486522315,
184
- "eval_poi_graph_edit_distance": 9.999999999999999e+63,
185
- "eval_poi_graph_edit_distance_norm": 1.0,
186
- "eval_poi_has_attachment_point(s)": 0.9346884666372073,
187
- "eval_poi_heavy_atoms_difference": 1.8780380026513477,
188
- "eval_poi_heavy_atoms_difference_norm": 0.053725194951032486,
189
- "eval_poi_tanimoto_similarity": 0.0,
190
- "eval_poi_valid": 0.9346884666372073,
191
- "eval_reassembly": 0.0625718073353955,
192
- "eval_reassembly_nostereo": 0.07618205921343349,
193
- "eval_runtime": 1600.5588,
194
- "eval_samples_per_second": 7.069,
195
  "eval_steps_per_second": 0.111,
196
  "eval_tanimoto_similarity": 0.0,
197
- "eval_valid": 0.9327441449403446,
198
- "step": 7500
199
- },
200
- {
201
- "epoch": 0.789110278161373,
202
- "grad_norm": 0.36397504806518555,
203
- "learning_rate": 1.1694228723322586e-05,
204
- "loss": 0.0784,
205
- "step": 8000
206
- },
207
- {
208
- "epoch": 0.8384296705464589,
209
- "grad_norm": 0.3220004737377167,
210
- "learning_rate": 4.975250136973397e-06,
211
- "loss": 0.0712,
212
- "step": 8500
213
- },
214
- {
215
- "epoch": 0.8877490629315447,
216
- "grad_norm": 0.33015140891075134,
217
- "learning_rate": 4.341505051882401e-06,
218
- "loss": 0.0627,
219
- "step": 9000
220
- },
221
- {
222
- "epoch": 0.9370684553166305,
223
- "grad_norm": 0.3355898857116699,
224
- "learning_rate": 1.2100595958768545e-05,
225
- "loss": 0.0608,
226
- "step": 9500
227
- },
228
- {
229
- "epoch": 0.9863878477017163,
230
- "grad_norm": 0.2892158329486847,
231
- "learning_rate": 0.0,
232
- "loss": 0.0528,
233
- "step": 10000
234
- },
235
- {
236
- "epoch": 0.9863878477017163,
237
- "eval_all_ligands_equal": 0.16827220503756077,
238
- "eval_e3_equal": 0.639063190455148,
239
- "eval_e3_graph_edit_distance": 9.999999999999999e+63,
240
- "eval_e3_graph_edit_distance_norm": 1.0,
241
- "eval_e3_has_attachment_point(s)": 0.9983208130799823,
242
- "eval_e3_heavy_atoms_difference": -0.2734423331860362,
243
- "eval_e3_heavy_atoms_difference_norm": -0.024892349019047463,
244
- "eval_e3_tanimoto_similarity": 0.0,
245
- "eval_e3_valid": 0.9983208130799823,
246
- "eval_has_all_attachment_points": 0.9885992045956694,
247
- "eval_has_three_substructures": 0.9992045956694653,
248
- "eval_heavy_atoms_difference": 4.554838709677419,
249
- "eval_heavy_atoms_difference_norm": 0.058807906961281145,
250
- "eval_linker_equal": 0.28501988510826337,
251
- "eval_linker_graph_edit_distance": 9.999999999999999e+63,
252
- "eval_linker_graph_edit_distance_norm": 1.0,
253
- "eval_linker_has_attachment_point(s)": 0.9977905435262925,
254
- "eval_linker_heavy_atoms_difference": 0.91064958020327,
255
- "eval_linker_heavy_atoms_difference_norm": 0.007958336622586505,
256
- "eval_linker_tanimoto_similarity": 0.0,
257
- "eval_linker_valid": 0.9977905435262925,
258
- "eval_loss": 0.30263492465019226,
259
- "eval_num_fragments": 2.999734865223155,
260
- "eval_poi_equal": 0.632523199292974,
261
- "eval_poi_graph_edit_distance": 9.999999999999999e+63,
262
- "eval_poi_graph_edit_distance_norm": 1.0,
263
- "eval_poi_has_attachment_point(s)": 0.9508616880247459,
264
- "eval_poi_heavy_atoms_difference": 1.4015908086610693,
265
- "eval_poi_heavy_atoms_difference_norm": 0.0383393486603852,
266
- "eval_poi_tanimoto_similarity": 0.0,
267
- "eval_poi_valid": 0.9508616880247459,
268
- "eval_reassembly": 0.1715422006186478,
269
- "eval_reassembly_nostereo": 0.1992045956694653,
270
- "eval_runtime": 1518.0837,
271
- "eval_samples_per_second": 7.453,
272
- "eval_steps_per_second": 0.117,
273
- "eval_tanimoto_similarity": 0.0,
274
- "eval_valid": 0.9489173663278834,
275
- "step": 10000
276
  }
277
  ],
278
  "logging_steps": 500,
@@ -287,17 +133,17 @@
287
  "should_evaluate": false,
288
  "should_log": false,
289
  "should_save": true,
290
- "should_training_stop": true
291
  },
292
  "attributes": {}
293
  }
294
  },
295
- "total_flos": 8.729673191023411e+16,
296
  "train_batch_size": 128,
297
- "trial_name": "trial-number=0-learning_rate=1.3e-05-warmup_ratio=0.100-num_cycles=7.500",
298
  "trial_params": {
299
- "learning_rate": 1.329291894316217e-05,
300
- "num_cycles": 7.5,
301
- "warmup_ratio": 0.09999999999999999
302
  }
303
  }
 
1
  {
2
+ "best_metric": 0.038974812196199735,
3
+ "best_model_checkpoint": "/mimer/NOBACKUP/groups/naiss2023-6-290/stefano/models//PROTAC-Splitter-EncoderDecoder-lr_cosine-opt25-rand-smiles/trial-number=1-learning_rate=2.0e-05-warmup_ratio=0.090-num_cycles=8.500/checkpoint-5000",
4
+ "epoch": 0.49319392385085814,
5
  "eval_steps": 2500,
6
+ "global_step": 5000,
7
  "is_hyper_param_search": true,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.049319392385085814,
13
+ "grad_norm": 1.1311782598495483,
14
+ "learning_rate": 1.4046924613685011e-05,
15
+ "loss": 3.1644,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.09863878477017163,
20
+ "grad_norm": 0.9366589784622192,
21
+ "learning_rate": 8.278052011897948e-06,
22
+ "loss": 0.6401,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 0.14795817715525744,
27
+ "grad_norm": 0.9480023980140686,
28
+ "learning_rate": 8.711793227257574e-06,
29
+ "loss": 0.4026,
30
  "step": 1500
31
  },
32
  {
33
  "epoch": 0.19727756954034326,
34
+ "grad_norm": 0.6237757205963135,
35
+ "learning_rate": 1.3493023962384968e-05,
36
+ "loss": 0.3056,
37
  "step": 2000
38
  },
39
  {
40
  "epoch": 0.24659696192542907,
41
+ "grad_norm": 0.546779215335846,
42
+ "learning_rate": 3.844673201988863e-06,
43
+ "loss": 0.215,
44
  "step": 2500
45
  },
46
  {
47
  "epoch": 0.2959163543105149,
48
+ "grad_norm": 0.6261709332466125,
49
+ "learning_rate": 1.765819137898168e-05,
50
+ "loss": 0.1886,
51
  "step": 3000
52
  },
53
  {
54
  "epoch": 0.3452357466956007,
55
+ "grad_norm": 0.3576153814792633,
56
+ "learning_rate": 6.844894722497407e-07,
57
+ "loss": 0.1428,
58
  "step": 3500
59
  },
60
  {
61
  "epoch": 0.3945551390806865,
62
+ "grad_norm": 0.5195497870445251,
63
+ "learning_rate": 1.958347656200152e-05,
64
+ "loss": 0.1311,
65
  "step": 4000
66
  },
67
  {
68
  "epoch": 0.4438745314657723,
69
+ "grad_norm": 0.48624593019485474,
70
+ "learning_rate": 1.341743352364844e-07,
71
+ "loss": 0.1046,
72
  "step": 4500
73
  },
74
  {
75
  "epoch": 0.49319392385085814,
76
+ "grad_norm": 0.45008236169815063,
77
+ "learning_rate": 1.871878422530564e-05,
78
+ "loss": 0.0948,
79
  "step": 5000
80
  },
81
  {
82
  "epoch": 0.49319392385085814,
83
+ "eval_all_ligands_equal": 0.038974812196199735,
84
+ "eval_e3_equal": 0.5149801148917367,
85
  "eval_e3_graph_edit_distance": 9.999999999999999e+63,
86
  "eval_e3_graph_edit_distance_norm": 1.0,
87
+ "eval_e3_has_attachment_point(s)": 0.9974370304904994,
88
+ "eval_e3_heavy_atoms_difference": -0.5439681838267786,
89
+ "eval_e3_heavy_atoms_difference_norm": -0.03979103911128965,
90
  "eval_e3_tanimoto_similarity": 0.0,
91
+ "eval_e3_valid": 0.9974370304904994,
92
+ "eval_has_all_attachment_points": 0.9802916482545294,
93
+ "eval_has_three_substructures": 0.9978789217852408,
94
+ "eval_heavy_atoms_difference": 9.873530711444985,
95
+ "eval_heavy_atoms_difference_norm": 0.12658016008251008,
96
+ "eval_linker_equal": 0.08758285461776404,
97
  "eval_linker_graph_edit_distance": 9.999999999999999e+63,
98
  "eval_linker_graph_edit_distance_norm": 1.0,
99
+ "eval_linker_has_attachment_point(s)": 0.9955810870525851,
100
+ "eval_linker_heavy_atoms_difference": 3.0841361025187806,
101
+ "eval_linker_heavy_atoms_difference_norm": 0.12312258066016835,
102
  "eval_linker_tanimoto_similarity": 0.0,
103
+ "eval_linker_valid": 0.9955810870525851,
104
+ "eval_loss": 0.31889262795448303,
105
  "eval_num_fragments": 2.9984091913389306,
106
+ "eval_poi_equal": 0.5147149801148917,
107
  "eval_poi_graph_edit_distance": 9.999999999999999e+63,
108
  "eval_poi_graph_edit_distance_norm": 1.0,
109
+ "eval_poi_has_attachment_point(s)": 0.9095006628369421,
110
+ "eval_poi_heavy_atoms_difference": 3.1498011489173665,
111
+ "eval_poi_heavy_atoms_difference_norm": 0.09194667815914018,
112
  "eval_poi_tanimoto_similarity": 0.0,
113
+ "eval_poi_valid": 0.9095006628369421,
114
+ "eval_reassembly": 0.04030048608042421,
115
+ "eval_reassembly_nostereo": 0.04904993371630579,
116
+ "eval_runtime": 1598.7498,
117
+ "eval_samples_per_second": 7.077,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
118
  "eval_steps_per_second": 0.111,
119
  "eval_tanimoto_similarity": 0.0,
120
+ "eval_valid": 0.9072912063632347,
121
+ "step": 5000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
122
  }
123
  ],
124
  "logging_steps": 500,
 
133
  "should_evaluate": false,
134
  "should_log": false,
135
  "should_save": true,
136
+ "should_training_stop": false
137
  },
138
  "attributes": {}
139
  }
140
  },
141
+ "total_flos": 4.364959997072179e+16,
142
  "train_batch_size": 128,
143
+ "trial_name": "trial-number=1-learning_rate=2.0e-05-warmup_ratio=0.090-num_cycles=8.500",
144
  "trial_params": {
145
+ "learning_rate": 1.9637600609931647e-05,
146
+ "num_cycles": 8.5,
147
+ "warmup_ratio": 0.09
148
  }
149
  }
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e738cf844f012a143f915952b9b5d140ea4bbe7014578abe5deedc776149cbdd
3
  size 7480
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b7a3dced9d5154a95ec1a0505e00dc47ab6d5dbc40b63df76ec9c233913bd4b
3
  size 7480