ribesstefano commited on
Commit
d5ac0b8
·
verified ·
1 Parent(s): 57f3528

Training in progress, step 5000, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5e7fe164acee2bf98394cc1f6ca77bde3bf4fe3c18a172150d217aa0744f7c0d
3
  size 409608164
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4f84b63c76ad39c4d29b5e1779cdb4ddf62f0fcbbfc8c6195f3d5135f1c7187
3
  size 409608164
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:982416f84073374fbfc9bc102c3b314f16c390ffafe0595ec3c0a1bc9bb2bdbc
3
  size 814647162
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf2ca9e924d1cab355d6dcbab707f5dbf8b39eed6e13d75f60b419650e16b97c
3
  size 814647162
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:59e8ca36bfab9e84d90a7d949d509b7af9d968ff1c66c18555967285cddf14a3
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b925556f82b124035f3ca7135a752041c7e1c8d324e6a65157a89e3b81097bc3
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d150c531f1bb84bb58605a639401cc62d9ee0f1aeab46fc43a18748a772f2c54
3
  size 1192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4adbc58e93a831eb642bd288aafadcc9d5456925c59a14e4d584eec75bb8c5c3
3
  size 1192
last-checkpoint/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.39628811312417145,
3
- "best_model_checkpoint": "/mimer/NOBACKUP/groups/naiss2023-6-290/stefano/models//PROTAC-Splitter-EncoderDecoder-lr_reduce-opt25/trial-number=0-learning_rate=2.0e-05-warmup_ratio=0.060-min_lr=0.000-factor=0.910/checkpoint-5000",
4
  "epoch": 0.49319392385085814,
5
  "eval_steps": 2500,
6
  "global_step": 5000,
@@ -10,114 +10,114 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.049319392385085814,
13
- "grad_norm": 0.9932323098182678,
14
- "learning_rate": 1.9906996673933362e-05,
15
- "loss": 1.3472,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.09863878477017163,
20
- "grad_norm": 0.6675044894218445,
21
- "learning_rate": 1.9906996673933362e-05,
22
- "loss": 0.3791,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 0.14795817715525744,
27
- "grad_norm": 0.5713032484054565,
28
- "learning_rate": 1.9906996673933362e-05,
29
- "loss": 0.197,
30
  "step": 1500
31
  },
32
  {
33
  "epoch": 0.19727756954034326,
34
- "grad_norm": 0.4924110472202301,
35
- "learning_rate": 1.9906996673933362e-05,
36
- "loss": 0.1224,
37
  "step": 2000
38
  },
39
  {
40
  "epoch": 0.24659696192542907,
41
- "grad_norm": 0.38072213530540466,
42
- "learning_rate": 1.9906996673933362e-05,
43
- "loss": 0.0814,
44
  "step": 2500
45
  },
46
  {
47
  "epoch": 0.2959163543105149,
48
- "grad_norm": 0.2933690547943115,
49
- "learning_rate": 1.9906996673933362e-05,
50
- "loss": 0.0578,
51
  "step": 3000
52
  },
53
  {
54
  "epoch": 0.3452357466956007,
55
- "grad_norm": 0.24898405373096466,
56
- "learning_rate": 1.9906996673933362e-05,
57
- "loss": 0.0432,
58
  "step": 3500
59
  },
60
  {
61
  "epoch": 0.3945551390806865,
62
- "grad_norm": 0.27284932136535645,
63
- "learning_rate": 1.9906996673933362e-05,
64
- "loss": 0.0338,
65
  "step": 4000
66
  },
67
  {
68
  "epoch": 0.4438745314657723,
69
- "grad_norm": 0.24178475141525269,
70
- "learning_rate": 1.9906996673933362e-05,
71
- "loss": 0.027,
72
  "step": 4500
73
  },
74
  {
75
  "epoch": 0.49319392385085814,
76
- "grad_norm": 0.2615422010421753,
77
- "learning_rate": 1.9906996673933362e-05,
78
- "loss": 0.0224,
79
  "step": 5000
80
  },
81
  {
82
  "epoch": 0.49319392385085814,
83
- "eval_all_ligands_equal": 0.39628811312417145,
84
- "eval_e3_equal": 0.7779054352629253,
85
  "eval_e3_graph_edit_distance": 9.999999999999999e+63,
86
  "eval_e3_graph_edit_distance_norm": 1.0,
87
- "eval_e3_has_attachment_point(s)": 0.9931064958020327,
88
- "eval_e3_heavy_atoms_difference": 0.30676093680954486,
89
- "eval_e3_heavy_atoms_difference_norm": 0.002422775502318104,
90
  "eval_e3_tanimoto_similarity": 0.0,
91
- "eval_e3_valid": 0.9931064958020327,
92
- "eval_has_all_attachment_points": 0.9843570481661511,
93
- "eval_has_three_substructures": 0.9992929739284137,
94
- "eval_heavy_atoms_difference": 8.062218294299603,
95
- "eval_heavy_atoms_difference_norm": 0.10429584967389881,
96
- "eval_linker_equal": 0.5711886875828546,
97
  "eval_linker_graph_edit_distance": 9.999999999999999e+63,
98
  "eval_linker_graph_edit_distance_norm": 1.0,
99
- "eval_linker_has_attachment_point(s)": 0.9961997348652232,
100
- "eval_linker_heavy_atoms_difference": 0.9341581970835174,
101
- "eval_linker_heavy_atoms_difference_norm": 0.024806250123980716,
102
  "eval_linker_tanimoto_similarity": 0.0,
103
- "eval_linker_valid": 0.9961997348652232,
104
- "eval_loss": 0.28600096702575684,
105
- "eval_num_fragments": 2.999646486964207,
106
- "eval_poi_equal": 0.70234202386213,
107
  "eval_poi_graph_edit_distance": 9.999999999999999e+63,
108
  "eval_poi_graph_edit_distance_norm": 1.0,
109
- "eval_poi_has_attachment_point(s)": 0.9204595669465312,
110
- "eval_poi_heavy_atoms_difference": 2.6359699513919574,
111
- "eval_poi_heavy_atoms_difference_norm": 0.07909068566841335,
112
  "eval_poi_tanimoto_similarity": 0.0,
113
- "eval_poi_valid": 0.9204595669465312,
114
- "eval_reassembly": 0.40247459125055235,
115
- "eval_reassembly_nostereo": 0.4217410517012815,
116
- "eval_runtime": 1470.3159,
117
- "eval_samples_per_second": 7.696,
118
- "eval_steps_per_second": 0.12,
119
  "eval_tanimoto_similarity": 0.0,
120
- "eval_valid": 0.9122403888643393,
121
  "step": 5000
122
  }
123
  ],
@@ -140,11 +140,11 @@
140
  },
141
  "total_flos": 4.33139477262336e+16,
142
  "train_batch_size": 128,
143
- "trial_name": "trial-number=0-learning_rate=2.0e-05-warmup_ratio=0.060-min_lr=0.000-factor=0.910",
144
  "trial_params": {
145
- "factor": 0.91,
146
- "learning_rate": 1.9906996673933362e-05,
147
- "min_lr": 2.910635913133059e-09,
148
  "warmup_ratio": 0.06
149
  }
150
  }
 
1
  {
2
+ "best_metric": 0.4479010163499779,
3
+ "best_model_checkpoint": "/mimer/NOBACKUP/groups/naiss2023-6-290/stefano/models//PROTAC-Splitter-EncoderDecoder-lr_reduce-opt25/trial-number=1-learning_rate=2.5e-05-warmup_ratio=0.060-min_lr=0.000-factor=0.810/checkpoint-5000",
4
  "epoch": 0.49319392385085814,
5
  "eval_steps": 2500,
6
  "global_step": 5000,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.049319392385085814,
13
+ "grad_norm": 0.8631236553192139,
14
+ "learning_rate": 2.4519131356633107e-05,
15
+ "loss": 1.2428,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.09863878477017163,
20
+ "grad_norm": 0.6576346158981323,
21
+ "learning_rate": 2.4519131356633107e-05,
22
+ "loss": 0.3154,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 0.14795817715525744,
27
+ "grad_norm": 0.5040571093559265,
28
+ "learning_rate": 2.4519131356633107e-05,
29
+ "loss": 0.1531,
30
  "step": 1500
31
  },
32
  {
33
  "epoch": 0.19727756954034326,
34
+ "grad_norm": 0.47591033577919006,
35
+ "learning_rate": 2.4519131356633107e-05,
36
+ "loss": 0.0904,
37
  "step": 2000
38
  },
39
  {
40
  "epoch": 0.24659696192542907,
41
+ "grad_norm": 0.3052867352962494,
42
+ "learning_rate": 2.4519131356633107e-05,
43
+ "loss": 0.0588,
44
  "step": 2500
45
  },
46
  {
47
  "epoch": 0.2959163543105149,
48
+ "grad_norm": 0.26361268758773804,
49
+ "learning_rate": 2.4519131356633107e-05,
50
+ "loss": 0.0418,
51
  "step": 3000
52
  },
53
  {
54
  "epoch": 0.3452357466956007,
55
+ "grad_norm": 0.23498503863811493,
56
+ "learning_rate": 2.4519131356633107e-05,
57
+ "loss": 0.0308,
58
  "step": 3500
59
  },
60
  {
61
  "epoch": 0.3945551390806865,
62
+ "grad_norm": 0.2148304432630539,
63
+ "learning_rate": 2.4519131356633107e-05,
64
+ "loss": 0.0245,
65
  "step": 4000
66
  },
67
  {
68
  "epoch": 0.4438745314657723,
69
+ "grad_norm": 0.19326996803283691,
70
+ "learning_rate": 2.4519131356633107e-05,
71
+ "loss": 0.0193,
72
  "step": 4500
73
  },
74
  {
75
  "epoch": 0.49319392385085814,
76
+ "grad_norm": 0.23251751065254211,
77
+ "learning_rate": 2.4519131356633107e-05,
78
+ "loss": 0.0162,
79
  "step": 5000
80
  },
81
  {
82
  "epoch": 0.49319392385085814,
83
+ "eval_all_ligands_equal": 0.4479010163499779,
84
+ "eval_e3_equal": 0.7840035351303579,
85
  "eval_e3_graph_edit_distance": 9.999999999999999e+63,
86
  "eval_e3_graph_edit_distance_norm": 1.0,
87
+ "eval_e3_has_attachment_point(s)": 0.9891294741493593,
88
+ "eval_e3_heavy_atoms_difference": 0.4326999558108705,
89
+ "eval_e3_heavy_atoms_difference_norm": 0.00617409936456833,
90
  "eval_e3_tanimoto_similarity": 0.0,
91
+ "eval_e3_valid": 0.9891294741493593,
92
+ "eval_has_all_attachment_points": 0.9788775961113566,
93
+ "eval_has_three_substructures": 0.9994697304463102,
94
+ "eval_heavy_atoms_difference": 8.114007954043306,
95
+ "eval_heavy_atoms_difference_norm": 0.10592343628762439,
96
+ "eval_linker_equal": 0.636411842686699,
97
  "eval_linker_graph_edit_distance": 9.999999999999999e+63,
98
  "eval_linker_graph_edit_distance_norm": 1.0,
99
+ "eval_linker_has_attachment_point(s)": 0.9965532479010164,
100
+ "eval_linker_heavy_atoms_difference": 0.6443658859920459,
101
+ "eval_linker_heavy_atoms_difference_norm": 0.010009960469603861,
102
  "eval_linker_tanimoto_similarity": 0.0,
103
+ "eval_linker_valid": 0.9965532479010164,
104
+ "eval_loss": 0.2841632664203644,
105
+ "eval_num_fragments": 3.0001767565178965,
106
+ "eval_poi_equal": 0.7266460450729121,
107
  "eval_poi_graph_edit_distance": 9.999999999999999e+63,
108
  "eval_poi_graph_edit_distance_norm": 1.0,
109
+ "eval_poi_has_attachment_point(s)": 0.9194874060980999,
110
+ "eval_poi_heavy_atoms_difference": 2.440300486080424,
111
+ "eval_poi_heavy_atoms_difference_norm": 0.07726015738826272,
112
  "eval_poi_tanimoto_similarity": 0.0,
113
+ "eval_poi_valid": 0.9194874060980999,
114
+ "eval_reassembly": 0.4547945205479452,
115
+ "eval_reassembly_nostereo": 0.4756517896597437,
116
+ "eval_runtime": 1574.3525,
117
+ "eval_samples_per_second": 7.187,
118
+ "eval_steps_per_second": 0.112,
119
  "eval_tanimoto_similarity": 0.0,
120
+ "eval_valid": 0.9072912063632347,
121
  "step": 5000
122
  }
123
  ],
 
140
  },
141
  "total_flos": 4.33139477262336e+16,
142
  "train_batch_size": 128,
143
+ "trial_name": "trial-number=1-learning_rate=2.5e-05-warmup_ratio=0.060-min_lr=0.000-factor=0.810",
144
  "trial_params": {
145
+ "factor": 0.81,
146
+ "learning_rate": 2.4519131356633107e-05,
147
+ "min_lr": 4.1003934714656736e-09,
148
  "warmup_ratio": 0.06
149
  }
150
  }
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed9fa2c5779e79b2d5ae66e6d1c4f9a70b8ce9f13125f8a9d13bcd0dfdaa4af9
3
  size 7480
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3eec7615192e1bb866379e3b01579890ccadb1f12990ad30b73a3999ff22d577
3
  size 7480