ribesstefano commited on
Commit
ed2409f
·
verified ·
1 Parent(s): 22a04bf

Training in progress, step 90000, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bade3186c939746aee4449e0ff57101ff4b77afbea832800d563cd2a9dff5c23
3
  size 409608164
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b81440045302c1eefa2e9bb46e7e8805c428a04de6a24fe9f46587ea87bfcca5
3
  size 409608164
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ab2838167b6f207e5ff9462a8152a1096f09984f229962c877b90f52c09efede
3
  size 814647162
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38443ec18070df18bce237a22d7bb5dd387c0d4bdddae00cc86604fb8052b6af
3
  size 814647162
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:74e388ca8334252df148488d1991df78557ce10af3baa0d6ba3c2b6ef12523fe
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:786a7eab19dbd8ac17ba3425052b6357a24dca38614d2d72a333d8bc2f3e9ec5
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bc672e72b4f6931672a9ebc2cb446a053ea93c3be41c5f8f873f2559810a72c6
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0dbdf033488efc02bdb5bbd298068b0b31fd085c69e24df4fc9494f6089deaa4
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.5959631728045326,
3
  "best_model_checkpoint": "/mimer/NOBACKUP/groups/naiss2023-6-290/stefano/models//PROTAC-Splitter-EncoderDecoder-lr_cosine-rand-smiles/checkpoint-85000",
4
- "epoch": 8.384296705464589,
5
  "eval_steps": 2500,
6
- "global_step": 85000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -1617,6 +1617,160 @@
1617
  "eval_tanimoto_similarity": 0.0,
1618
  "eval_valid": 0.9502478753541076,
1619
  "step": 85000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1620
  }
1621
  ],
1622
  "logging_steps": 500,
@@ -1636,7 +1790,7 @@
1636
  "attributes": {}
1637
  }
1638
  },
1639
- "total_flos": 7.419926048624763e+17,
1640
  "train_batch_size": 128,
1641
  "trial_name": null,
1642
  "trial_params": null
 
1
  {
2
  "best_metric": 0.5959631728045326,
3
  "best_model_checkpoint": "/mimer/NOBACKUP/groups/naiss2023-6-290/stefano/models//PROTAC-Splitter-EncoderDecoder-lr_cosine-rand-smiles/checkpoint-85000",
4
+ "epoch": 8.877490629315448,
5
  "eval_steps": 2500,
6
+ "global_step": 90000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
1617
  "eval_tanimoto_similarity": 0.0,
1618
  "eval_valid": 0.9502478753541076,
1619
  "step": 85000
1620
+ },
1621
+ {
1622
+ "epoch": 8.433616097849674,
1623
+ "grad_norm": 0.011240696534514427,
1624
+ "learning_rate": 2.5622964623348843e-06,
1625
+ "loss": 0.0002,
1626
+ "step": 85500
1627
+ },
1628
+ {
1629
+ "epoch": 8.48293549023476,
1630
+ "grad_norm": 0.01842450723052025,
1631
+ "learning_rate": 2.3917244156542534e-06,
1632
+ "loss": 0.0002,
1633
+ "step": 86000
1634
+ },
1635
+ {
1636
+ "epoch": 8.532254882619846,
1637
+ "grad_norm": 0.005196568090468645,
1638
+ "learning_rate": 2.2267417957134883e-06,
1639
+ "loss": 0.0002,
1640
+ "step": 86500
1641
+ },
1642
+ {
1643
+ "epoch": 8.581574275004932,
1644
+ "grad_norm": 0.009838773868978024,
1645
+ "learning_rate": 2.0673893910399504e-06,
1646
+ "loss": 0.0002,
1647
+ "step": 87000
1648
+ },
1649
+ {
1650
+ "epoch": 8.630893667390017,
1651
+ "grad_norm": 0.04019368812441826,
1652
+ "learning_rate": 1.914008280031923e-06,
1653
+ "loss": 0.0002,
1654
+ "step": 87500
1655
+ },
1656
+ {
1657
+ "epoch": 8.630893667390017,
1658
+ "eval_all_ligands_equal": 0.5953434844192634,
1659
+ "eval_e3_equal": 0.8263101983002833,
1660
+ "eval_e3_graph_edit_distance": Infinity,
1661
+ "eval_e3_graph_edit_distance_norm": Infinity,
1662
+ "eval_e3_has_attachment_point(s)": 0.9887570821529745,
1663
+ "eval_e3_heavy_atoms_difference": 0.1730701133144476,
1664
+ "eval_e3_heavy_atoms_difference_norm": 0.0008003837390301783,
1665
+ "eval_e3_tanimoto_similarity": 0.0,
1666
+ "eval_e3_valid": 0.9887570821529745,
1667
+ "eval_has_all_attachment_points": 0.9884029745042493,
1668
+ "eval_has_three_substructures": 0.9995573654390935,
1669
+ "eval_heavy_atoms_difference": 4.526203966005665,
1670
+ "eval_heavy_atoms_difference_norm": 0.061568743782646304,
1671
+ "eval_linker_equal": 0.8501239376770539,
1672
+ "eval_linker_graph_edit_distance": Infinity,
1673
+ "eval_linker_graph_edit_distance_norm": Infinity,
1674
+ "eval_linker_has_attachment_point(s)": 0.9972556657223796,
1675
+ "eval_linker_heavy_atoms_difference": 0.20635623229461755,
1676
+ "eval_linker_heavy_atoms_difference_norm": 0.0013172185920579528,
1677
+ "eval_linker_tanimoto_similarity": 0.0,
1678
+ "eval_linker_valid": 0.9972556657223796,
1679
+ "eval_loss": 0.3990042209625244,
1680
+ "eval_num_fragments": 3.0000885269121813,
1681
+ "eval_poi_equal": 0.7899256373937678,
1682
+ "eval_poi_graph_edit_distance": Infinity,
1683
+ "eval_poi_graph_edit_distance_norm": Infinity,
1684
+ "eval_poi_has_attachment_point(s)": 0.9604284702549575,
1685
+ "eval_poi_heavy_atoms_difference": 1.170325779036827,
1686
+ "eval_poi_heavy_atoms_difference_norm": 0.03487419309053563,
1687
+ "eval_poi_tanimoto_similarity": 0.0,
1688
+ "eval_poi_valid": 0.9604284702549575,
1689
+ "eval_reassembly": 0.6017174220963173,
1690
+ "eval_reassembly_nostereo": 0.632878895184136,
1691
+ "eval_runtime": 2317.1407,
1692
+ "eval_samples_per_second": 4.875,
1693
+ "eval_steps_per_second": 0.076,
1694
+ "eval_tanimoto_similarity": 0.0,
1695
+ "eval_valid": 0.9478576487252125,
1696
+ "step": 87500
1697
+ },
1698
+ {
1699
+ "epoch": 8.680213059775104,
1700
+ "grad_norm": 0.009999396279454231,
1701
+ "learning_rate": 1.7660216417237113e-06,
1702
+ "loss": 0.0002,
1703
+ "step": 88000
1704
+ },
1705
+ {
1706
+ "epoch": 8.72953245216019,
1707
+ "grad_norm": 0.0032589335460215807,
1708
+ "learning_rate": 1.6237791221752203e-06,
1709
+ "loss": 0.0002,
1710
+ "step": 88500
1711
+ },
1712
+ {
1713
+ "epoch": 8.778851844545276,
1714
+ "grad_norm": 0.007267610169947147,
1715
+ "learning_rate": 1.4873158878961374e-06,
1716
+ "loss": 0.0002,
1717
+ "step": 89000
1718
+ },
1719
+ {
1720
+ "epoch": 8.82817123693036,
1721
+ "grad_norm": 0.02816702425479889,
1722
+ "learning_rate": 1.3566656765878621e-06,
1723
+ "loss": 0.0002,
1724
+ "step": 89500
1725
+ },
1726
+ {
1727
+ "epoch": 8.877490629315448,
1728
+ "grad_norm": 0.009792421944439411,
1729
+ "learning_rate": 1.2318607888025413e-06,
1730
+ "loss": 0.0002,
1731
+ "step": 90000
1732
+ },
1733
+ {
1734
+ "epoch": 8.877490629315448,
1735
+ "eval_all_ligands_equal": 0.5956090651558074,
1736
+ "eval_e3_equal": 0.8270184135977338,
1737
+ "eval_e3_graph_edit_distance": Infinity,
1738
+ "eval_e3_graph_edit_distance_norm": Infinity,
1739
+ "eval_e3_has_attachment_point(s)": 0.9861898016997167,
1740
+ "eval_e3_heavy_atoms_difference": 0.2705382436260623,
1741
+ "eval_e3_heavy_atoms_difference_norm": 0.0048639786608157655,
1742
+ "eval_e3_tanimoto_similarity": 0.0,
1743
+ "eval_e3_valid": 0.9861898016997167,
1744
+ "eval_has_all_attachment_points": 0.9884029745042493,
1745
+ "eval_has_three_substructures": 0.9995573654390935,
1746
+ "eval_heavy_atoms_difference": 4.702195467422096,
1747
+ "eval_heavy_atoms_difference_norm": 0.06408037436572298,
1748
+ "eval_linker_equal": 0.8497698300283286,
1749
+ "eval_linker_graph_edit_distance": 3.009915014164306e+61,
1750
+ "eval_linker_graph_edit_distance_norm": 0.02778354797312324,
1751
+ "eval_linker_has_attachment_point(s)": 0.9969900849858357,
1752
+ "eval_linker_heavy_atoms_difference": 0.1989199716713881,
1753
+ "eval_linker_heavy_atoms_difference_norm": 0.00136169255914937,
1754
+ "eval_linker_tanimoto_similarity": 0.0,
1755
+ "eval_linker_valid": 0.9969900849858357,
1756
+ "eval_loss": 0.39773058891296387,
1757
+ "eval_num_fragments": 3.000265580736544,
1758
+ "eval_poi_equal": 0.7905453257790368,
1759
+ "eval_poi_graph_edit_distance": Infinity,
1760
+ "eval_poi_graph_edit_distance_norm": Infinity,
1761
+ "eval_poi_has_attachment_point(s)": 0.9607825779036827,
1762
+ "eval_poi_heavy_atoms_difference": 1.1535056657223797,
1763
+ "eval_poi_heavy_atoms_difference_norm": 0.03463791665241003,
1764
+ "eval_poi_tanimoto_similarity": 0.0,
1765
+ "eval_poi_valid": 0.9607825779036827,
1766
+ "eval_reassembly": 0.6021600566572238,
1767
+ "eval_reassembly_nostereo": 0.6329674220963173,
1768
+ "eval_runtime": 2308.9117,
1769
+ "eval_samples_per_second": 4.892,
1770
+ "eval_steps_per_second": 0.077,
1771
+ "eval_tanimoto_similarity": 0.0,
1772
+ "eval_valid": 0.9456444759206799,
1773
+ "step": 90000
1774
  }
1775
  ],
1776
  "logging_steps": 500,
 
1790
  "attributes": {}
1791
  }
1792
  },
1793
+ "total_flos": 7.856150564898939e+17,
1794
  "train_batch_size": 128,
1795
  "trial_name": null,
1796
  "trial_params": null