rootxhacker commited on
Commit
025c665
·
verified ·
1 Parent(s): ddb7fd4

Training in progress, step 10500, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5a0635af77a0cc188290373b523679a526e8c1ad75d8c7f25b922fea9cf62dca
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4324a3a5915156493f27435981bc5e067e17329d248df8e005af28872089db08
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1bf901e73d41ea0ccfa16c6684d24d585b1f05ef9f57a4524e8694a26b9940a3
3
  size 1544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:586643082c797c6471cec4d99035ab6336a6eec2692a30ba5ac6aa1ea78f1ad3
3
  size 1544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4b950c496923243d0912e84a1eb84cb370513a822a8463c038d022e062e515bc
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:435157f2e32de040f237ef44fcb2f7d2ce0740bd523e00f2682e862fe6e5b77b
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2b4e6f78506ab09c8a3ff311a2dfeb7a6190585c49701c5bd2fcc763c2b50448
3
  size 14180
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:371a8ee92df296caadab094d1243e6f6a8e33531055d940b9b2beb58c3296d37
3
  size 14180
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f2a8c76f206a59cf071ae08cd5fd0af4dd2719f5d4bfbabc67d57af26f56bb51
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5b29e642bf24d79ebcf705888b6c986c0f26a1dd38cc2f292d82caae0977305
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dca9e86a8e1c5a776637e4448f160d7ddd557ac645e78f5bee2fc465ee6ebde3
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d497e82650965830e0a6f7b87b60635133c5dcd48d2ca0d74cebf5c5827dfab0
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 9500,
3
  "best_metric": 4.357193470001221,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-9500",
5
- "epoch": 0.7691716021844474,
6
  "eval_steps": 250,
7
- "global_step": 10000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -1728,6 +1728,92 @@
1728
  "eval_samples_per_second": 53.935,
1729
  "eval_steps_per_second": 13.484,
1730
  "step": 10000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1731
  }
1732
  ],
1733
  "logging_steps": 50,
 
2
  "best_global_step": 9500,
3
  "best_metric": 4.357193470001221,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-9500",
5
+ "epoch": 0.8076301822936697,
6
  "eval_steps": 250,
7
+ "global_step": 10500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
1728
  "eval_samples_per_second": 53.935,
1729
  "eval_steps_per_second": 13.484,
1730
  "step": 10000
1731
+ },
1732
+ {
1733
+ "epoch": 0.7730174601953695,
1734
+ "grad_norm": 3.882775068283081,
1735
+ "learning_rate": 0.00015044541983741527,
1736
+ "loss": 4.5207,
1737
+ "step": 10050
1738
+ },
1739
+ {
1740
+ "epoch": 0.7768633182062918,
1741
+ "grad_norm": 5.814795017242432,
1742
+ "learning_rate": 0.0001501856998155988,
1743
+ "loss": 4.2462,
1744
+ "step": 10100
1745
+ },
1746
+ {
1747
+ "epoch": 0.780709176217214,
1748
+ "grad_norm": 4.733581066131592,
1749
+ "learning_rate": 0.00014992597979378232,
1750
+ "loss": 4.5563,
1751
+ "step": 10150
1752
+ },
1753
+ {
1754
+ "epoch": 0.7845550342281363,
1755
+ "grad_norm": 4.805403232574463,
1756
+ "learning_rate": 0.00014966625977196583,
1757
+ "loss": 4.4353,
1758
+ "step": 10200
1759
+ },
1760
+ {
1761
+ "epoch": 0.7884008922390585,
1762
+ "grad_norm": 5.814332008361816,
1763
+ "learning_rate": 0.00014940653975014935,
1764
+ "loss": 4.4004,
1765
+ "step": 10250
1766
+ },
1767
+ {
1768
+ "epoch": 0.7884008922390585,
1769
+ "eval_loss": 4.41144323348999,
1770
+ "eval_runtime": 18.5402,
1771
+ "eval_samples_per_second": 53.937,
1772
+ "eval_steps_per_second": 13.484,
1773
+ "step": 10250
1774
+ },
1775
+ {
1776
+ "epoch": 0.7922467502499808,
1777
+ "grad_norm": 5.321393013000488,
1778
+ "learning_rate": 0.00014914681972833286,
1779
+ "loss": 4.4383,
1780
+ "step": 10300
1781
+ },
1782
+ {
1783
+ "epoch": 0.796092608260903,
1784
+ "grad_norm": 3.681452751159668,
1785
+ "learning_rate": 0.00014888709970651637,
1786
+ "loss": 4.5094,
1787
+ "step": 10350
1788
+ },
1789
+ {
1790
+ "epoch": 0.7999384662718253,
1791
+ "grad_norm": 4.766401767730713,
1792
+ "learning_rate": 0.0001486273796846999,
1793
+ "loss": 4.3104,
1794
+ "step": 10400
1795
+ },
1796
+ {
1797
+ "epoch": 0.8037843242827475,
1798
+ "grad_norm": 4.676774024963379,
1799
+ "learning_rate": 0.00014836765966288342,
1800
+ "loss": 4.516,
1801
+ "step": 10450
1802
+ },
1803
+ {
1804
+ "epoch": 0.8076301822936697,
1805
+ "grad_norm": 3.623643159866333,
1806
+ "learning_rate": 0.00014810793964106694,
1807
+ "loss": 4.5146,
1808
+ "step": 10500
1809
+ },
1810
+ {
1811
+ "epoch": 0.8076301822936697,
1812
+ "eval_loss": 4.398375034332275,
1813
+ "eval_runtime": 18.4969,
1814
+ "eval_samples_per_second": 54.063,
1815
+ "eval_steps_per_second": 13.516,
1816
+ "step": 10500
1817
  }
1818
  ],
1819
  "logging_steps": 50,