Training in progress, step 75000, checkpoint
Browse files
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 409608164
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e0e439abda96a6c46bd7b0745803bc82dce328f1c1e77e3fddc886596e3dbfb7
|
| 3 |
size 409608164
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 814647162
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1cdcf98b9479df166ebb42e0d57dcece23e53751bdb535d71086a4aad3bedb9e
|
| 3 |
size 814647162
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:abdff6153a7eb893e8cec9e7179db9e14b6c114d35d35782f9954977f7dd1863
|
| 3 |
size 14244
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2a8d5a368b4e2efb2f49235ac9b3e52ed97f90c05247b4e0747718cbca6efeec
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -1,9 +1,9 @@
|
|
| 1 |
{
|
| 2 |
"best_metric": 0.5924220963172805,
|
| 3 |
"best_model_checkpoint": "/mimer/NOBACKUP/groups/naiss2023-6-290/stefano/models//PROTAC-Splitter-EncoderDecoder-lr_cosine-rand-smiles/checkpoint-70000",
|
| 4 |
-
"epoch":
|
| 5 |
"eval_steps": 2500,
|
| 6 |
-
"global_step":
|
| 7 |
"is_hyper_param_search": false,
|
| 8 |
"is_local_process_zero": true,
|
| 9 |
"is_world_process_zero": true,
|
|
@@ -1155,6 +1155,160 @@
|
|
| 1155 |
"eval_tanimoto_similarity": 0.0,
|
| 1156 |
"eval_valid": 0.9464412181303116,
|
| 1157 |
"step": 70000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1158 |
}
|
| 1159 |
],
|
| 1160 |
"logging_steps": 500,
|
|
@@ -1174,7 +1328,7 @@
|
|
| 1174 |
"attributes": {}
|
| 1175 |
}
|
| 1176 |
},
|
| 1177 |
-
"total_flos": 6.
|
| 1178 |
"train_batch_size": 128,
|
| 1179 |
"trial_name": null,
|
| 1180 |
"trial_params": null
|
|
|
|
| 1 |
{
|
| 2 |
"best_metric": 0.5924220963172805,
|
| 3 |
"best_model_checkpoint": "/mimer/NOBACKUP/groups/naiss2023-6-290/stefano/models//PROTAC-Splitter-EncoderDecoder-lr_cosine-rand-smiles/checkpoint-70000",
|
| 4 |
+
"epoch": 7.397908857762872,
|
| 5 |
"eval_steps": 2500,
|
| 6 |
+
"global_step": 75000,
|
| 7 |
"is_hyper_param_search": false,
|
| 8 |
"is_local_process_zero": true,
|
| 9 |
"is_world_process_zero": true,
|
|
|
|
| 1155 |
"eval_tanimoto_similarity": 0.0,
|
| 1156 |
"eval_valid": 0.9464412181303116,
|
| 1157 |
"step": 70000
|
| 1158 |
+
},
|
| 1159 |
+
{
|
| 1160 |
+
"epoch": 6.9540343262971,
|
| 1161 |
+
"grad_norm": 0.01884830743074417,
|
| 1162 |
+
"learning_rate": 1.001811555300422e-05,
|
| 1163 |
+
"loss": 0.0003,
|
| 1164 |
+
"step": 70500
|
| 1165 |
+
},
|
| 1166 |
+
{
|
| 1167 |
+
"epoch": 7.0033537186821855,
|
| 1168 |
+
"grad_norm": 0.007204363122582436,
|
| 1169 |
+
"learning_rate": 9.705293329559965e-06,
|
| 1170 |
+
"loss": 0.0004,
|
| 1171 |
+
"step": 71000
|
| 1172 |
+
},
|
| 1173 |
+
{
|
| 1174 |
+
"epoch": 7.052673111067271,
|
| 1175 |
+
"grad_norm": 0.009515893645584583,
|
| 1176 |
+
"learning_rate": 9.396866661960307e-06,
|
| 1177 |
+
"loss": 0.0003,
|
| 1178 |
+
"step": 71500
|
| 1179 |
+
},
|
| 1180 |
+
{
|
| 1181 |
+
"epoch": 7.101992503452357,
|
| 1182 |
+
"grad_norm": 0.01400610152631998,
|
| 1183 |
+
"learning_rate": 9.091675648786607e-06,
|
| 1184 |
+
"loss": 0.0003,
|
| 1185 |
+
"step": 72000
|
| 1186 |
+
},
|
| 1187 |
+
{
|
| 1188 |
+
"epoch": 7.151311895837443,
|
| 1189 |
+
"grad_norm": 0.010973923839628696,
|
| 1190 |
+
"learning_rate": 8.790417638516349e-06,
|
| 1191 |
+
"loss": 0.0003,
|
| 1192 |
+
"step": 72500
|
| 1193 |
+
},
|
| 1194 |
+
{
|
| 1195 |
+
"epoch": 7.151311895837443,
|
| 1196 |
+
"eval_all_ligands_equal": 0.5918909348441926,
|
| 1197 |
+
"eval_e3_equal": 0.8251593484419264,
|
| 1198 |
+
"eval_e3_graph_edit_distance": Infinity,
|
| 1199 |
+
"eval_e3_graph_edit_distance_norm": Infinity,
|
| 1200 |
+
"eval_e3_has_attachment_point(s)": 0.9886685552407932,
|
| 1201 |
+
"eval_e3_heavy_atoms_difference": 0.3155099150141643,
|
| 1202 |
+
"eval_e3_heavy_atoms_difference_norm": 0.004674876264079149,
|
| 1203 |
+
"eval_e3_tanimoto_similarity": 0.0,
|
| 1204 |
+
"eval_e3_valid": 0.9886685552407932,
|
| 1205 |
+
"eval_has_all_attachment_points": 0.9888456090651558,
|
| 1206 |
+
"eval_has_three_substructures": 0.9991147308781869,
|
| 1207 |
+
"eval_heavy_atoms_difference": 4.57542492917847,
|
| 1208 |
+
"eval_heavy_atoms_difference_norm": 0.06105317584065338,
|
| 1209 |
+
"eval_linker_equal": 0.8426876770538244,
|
| 1210 |
+
"eval_linker_graph_edit_distance": 3.718130311614731e+61,
|
| 1211 |
+
"eval_linker_graph_edit_distance_norm": Infinity,
|
| 1212 |
+
"eval_linker_has_attachment_point(s)": 0.9962818696883853,
|
| 1213 |
+
"eval_linker_heavy_atoms_difference": 0.26044617563739375,
|
| 1214 |
+
"eval_linker_heavy_atoms_difference_norm": 0.004330713276040957,
|
| 1215 |
+
"eval_linker_tanimoto_similarity": 0.0,
|
| 1216 |
+
"eval_linker_valid": 0.9962818696883853,
|
| 1217 |
+
"eval_loss": 0.39214199781417847,
|
| 1218 |
+
"eval_num_fragments": 3.0001770538243626,
|
| 1219 |
+
"eval_poi_equal": 0.7898371104815864,
|
| 1220 |
+
"eval_poi_graph_edit_distance": Infinity,
|
| 1221 |
+
"eval_poi_graph_edit_distance_norm": Infinity,
|
| 1222 |
+
"eval_poi_has_attachment_point(s)": 0.9601628895184136,
|
| 1223 |
+
"eval_poi_heavy_atoms_difference": 1.192723087818697,
|
| 1224 |
+
"eval_poi_heavy_atoms_difference_norm": 0.035486140958842484,
|
| 1225 |
+
"eval_poi_tanimoto_similarity": 0.0,
|
| 1226 |
+
"eval_poi_valid": 0.9601628895184136,
|
| 1227 |
+
"eval_reassembly": 0.5992386685552408,
|
| 1228 |
+
"eval_reassembly_nostereo": 0.630842776203966,
|
| 1229 |
+
"eval_runtime": 2302.3208,
|
| 1230 |
+
"eval_samples_per_second": 4.906,
|
| 1231 |
+
"eval_steps_per_second": 0.077,
|
| 1232 |
+
"eval_tanimoto_similarity": 0.0,
|
| 1233 |
+
"eval_valid": 0.9479461756373938,
|
| 1234 |
+
"step": 72500
|
| 1235 |
+
},
|
| 1236 |
+
{
|
| 1237 |
+
"epoch": 7.200631288222529,
|
| 1238 |
+
"grad_norm": 0.003939173649996519,
|
| 1239 |
+
"learning_rate": 8.493167110937786e-06,
|
| 1240 |
+
"loss": 0.0003,
|
| 1241 |
+
"step": 73000
|
| 1242 |
+
},
|
| 1243 |
+
{
|
| 1244 |
+
"epoch": 7.249950680607615,
|
| 1245 |
+
"grad_norm": 0.006046623457223177,
|
| 1246 |
+
"learning_rate": 8.199997555072267e-06,
|
| 1247 |
+
"loss": 0.0003,
|
| 1248 |
+
"step": 73500
|
| 1249 |
+
},
|
| 1250 |
+
{
|
| 1251 |
+
"epoch": 7.299270072992701,
|
| 1252 |
+
"grad_norm": 0.008457995019853115,
|
| 1253 |
+
"learning_rate": 7.911555290403444e-06,
|
| 1254 |
+
"loss": 0.0003,
|
| 1255 |
+
"step": 74000
|
| 1256 |
+
},
|
| 1257 |
+
{
|
| 1258 |
+
"epoch": 7.348589465377787,
|
| 1259 |
+
"grad_norm": 0.0126716373488307,
|
| 1260 |
+
"learning_rate": 7.626755570937758e-06,
|
| 1261 |
+
"loss": 0.0003,
|
| 1262 |
+
"step": 74500
|
| 1263 |
+
},
|
| 1264 |
+
{
|
| 1265 |
+
"epoch": 7.397908857762872,
|
| 1266 |
+
"grad_norm": 0.0033882916904985905,
|
| 1267 |
+
"learning_rate": 7.346251025449738e-06,
|
| 1268 |
+
"loss": 0.0003,
|
| 1269 |
+
"step": 75000
|
| 1270 |
+
},
|
| 1271 |
+
{
|
| 1272 |
+
"epoch": 7.397908857762872,
|
| 1273 |
+
"eval_all_ligands_equal": 0.5922450424929179,
|
| 1274 |
+
"eval_e3_equal": 0.8269298866855525,
|
| 1275 |
+
"eval_e3_graph_edit_distance": Infinity,
|
| 1276 |
+
"eval_e3_graph_edit_distance_norm": Infinity,
|
| 1277 |
+
"eval_e3_has_attachment_point(s)": 0.9876062322946175,
|
| 1278 |
+
"eval_e3_heavy_atoms_difference": 0.2445113314447592,
|
| 1279 |
+
"eval_e3_heavy_atoms_difference_norm": 0.0028633304101074964,
|
| 1280 |
+
"eval_e3_tanimoto_similarity": 0.0,
|
| 1281 |
+
"eval_e3_valid": 0.9876062322946175,
|
| 1282 |
+
"eval_has_all_attachment_points": 0.9893767705382436,
|
| 1283 |
+
"eval_has_three_substructures": 0.9987606232294618,
|
| 1284 |
+
"eval_heavy_atoms_difference": 4.683958923512748,
|
| 1285 |
+
"eval_heavy_atoms_difference_norm": 0.06305476454593091,
|
| 1286 |
+
"eval_linker_equal": 0.8430417847025495,
|
| 1287 |
+
"eval_linker_graph_edit_distance": 2.8328611898017e+61,
|
| 1288 |
+
"eval_linker_graph_edit_distance_norm": Infinity,
|
| 1289 |
+
"eval_linker_has_attachment_point(s)": 0.9971671388101983,
|
| 1290 |
+
"eval_linker_heavy_atoms_difference": 0.24026203966005666,
|
| 1291 |
+
"eval_linker_heavy_atoms_difference_norm": 0.004181593662072319,
|
| 1292 |
+
"eval_linker_tanimoto_similarity": 0.0,
|
| 1293 |
+
"eval_linker_valid": 0.9971671388101983,
|
| 1294 |
+
"eval_loss": 0.39461877942085266,
|
| 1295 |
+
"eval_num_fragments": 2.9998229461756374,
|
| 1296 |
+
"eval_poi_equal": 0.7895715297450425,
|
| 1297 |
+
"eval_poi_graph_edit_distance": Infinity,
|
| 1298 |
+
"eval_poi_graph_edit_distance_norm": Infinity,
|
| 1299 |
+
"eval_poi_has_attachment_point(s)": 0.9584808781869688,
|
| 1300 |
+
"eval_poi_heavy_atoms_difference": 1.2901912181303117,
|
| 1301 |
+
"eval_poi_heavy_atoms_difference_norm": 0.03941144643806612,
|
| 1302 |
+
"eval_poi_tanimoto_similarity": 0.0,
|
| 1303 |
+
"eval_poi_valid": 0.9584808781869688,
|
| 1304 |
+
"eval_reassembly": 0.5990616147308782,
|
| 1305 |
+
"eval_reassembly_nostereo": 0.6306657223796034,
|
| 1306 |
+
"eval_runtime": 2312.2916,
|
| 1307 |
+
"eval_samples_per_second": 4.885,
|
| 1308 |
+
"eval_steps_per_second": 0.077,
|
| 1309 |
+
"eval_tanimoto_similarity": 0.0,
|
| 1310 |
+
"eval_valid": 0.9463526912181303,
|
| 1311 |
+
"step": 75000
|
| 1312 |
}
|
| 1313 |
],
|
| 1314 |
"logging_steps": 500,
|
|
|
|
| 1328 |
"attributes": {}
|
| 1329 |
}
|
| 1330 |
},
|
| 1331 |
+
"total_flos": 6.546932506690821e+17,
|
| 1332 |
"train_batch_size": 128,
|
| 1333 |
"trial_name": null,
|
| 1334 |
"trial_params": null
|