rootxhacker committed on
Commit
c4956fb
·
verified ·
1 Parent(s): faed739

Training in progress, step 6000, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4eb8910307bec61db122da2594e6b3f530d868dc95f89d2ca698471ef1bf7e40
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d3519cd9f54111b61d5c7bda32b6503a50d9a901f0867b18c77e1c8775d34cc
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7f7c3bd2e2b53a0436de47612a1d9d71e57d2e478df8b52acc7aec65dc000186
3
  size 1736
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc8be5680951e9b7e427f6500eddc8c10ce019d345c9c9f83581fc8bb331d518
3
  size 1736
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:42be51fbf276340c9331b95a10d361ad5f54ac5fddd8d3003ab5a2b3205b1bf3
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fead462933224306a9b42a0eb2433085db43c13976438f5d79faccec086ccd4f
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:edba3e2e11b49613ce2a377ec116d91655a77025fcd35863ca859fcc236283bd
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f460ca4efaa2c47b577474097b3561bee10506073f07d444922fddb74fb1bc7b
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ee231d5124e1faa72bb59e0d3351580448c9875eebe2a58142e26f5eeab5354c
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:faa0523a11b32ac61978a5b91bfe471f27b6d880dfaedd29cb6e6516dad00d0b
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c1402f998a531b2d9e639df3a0d0bab3a51ee695db29df819edf5370824d49f4
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ee9289020d6b3ecd17f692689ed65a2fe5f50143b40afcd424248034cb8eabc
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 5250,
3
- "best_metric": 1.4721767902374268,
4
- "best_model_checkpoint": "./ar-diffusion-checkpoints-progressive-attention/checkpoint-5000",
5
- "epoch": 0.42304438120144605,
6
  "eval_steps": 250,
7
- "global_step": 5500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -954,6 +954,92 @@
954
  "eval_samples_per_second": 59.336,
955
  "eval_steps_per_second": 14.834,
956
  "step": 5500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
957
  }
958
  ],
959
  "logging_steps": 50,
 
1
  {
2
+ "best_global_step": 6000,
3
+ "best_metric": 1.4524279832839966,
4
+ "best_model_checkpoint": "./ar-diffusion-checkpoints-progressive-attention/checkpoint-6000",
5
+ "epoch": 0.4615029613106684,
6
  "eval_steps": 250,
7
+ "global_step": 6000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
954
  "eval_samples_per_second": 59.336,
955
  "eval_steps_per_second": 14.834,
956
  "step": 5500
957
+ },
958
+ {
959
+ "epoch": 0.4268902392123683,
960
+ "grad_norm": 1.1347377300262451,
961
+ "learning_rate": 0.00017379424979871699,
962
+ "loss": 1.4507,
963
+ "step": 5550
964
+ },
965
+ {
966
+ "epoch": 0.43073609722329054,
967
+ "grad_norm": 1.5237597227096558,
968
+ "learning_rate": 0.0001735345297769005,
969
+ "loss": 1.4066,
970
+ "step": 5600
971
+ },
972
+ {
973
+ "epoch": 0.4345819552342128,
974
+ "grad_norm": 1.0041602849960327,
975
+ "learning_rate": 0.00017327480975508404,
976
+ "loss": 1.4724,
977
+ "step": 5650
978
+ },
979
+ {
980
+ "epoch": 0.43842781324513497,
981
+ "grad_norm": 1.3285658359527588,
982
+ "learning_rate": 0.00017301508973326755,
983
+ "loss": 1.5599,
984
+ "step": 5700
985
+ },
986
+ {
987
+ "epoch": 0.4422736712560572,
988
+ "grad_norm": 0.7520576119422913,
989
+ "learning_rate": 0.00017275536971145106,
990
+ "loss": 1.4572,
991
+ "step": 5750
992
+ },
993
+ {
994
+ "epoch": 0.4422736712560572,
995
+ "eval_loss": 1.4671169519424438,
996
+ "eval_runtime": 16.9411,
997
+ "eval_samples_per_second": 59.028,
998
+ "eval_steps_per_second": 14.757,
999
+ "step": 5750
1000
+ },
1001
+ {
1002
+ "epoch": 0.44611952926697945,
1003
+ "grad_norm": 1.737941861152649,
1004
+ "learning_rate": 0.00017249564968963458,
1005
+ "loss": 1.5221,
1006
+ "step": 5800
1007
+ },
1008
+ {
1009
+ "epoch": 0.4499653872779017,
1010
+ "grad_norm": 1.5023373365402222,
1011
+ "learning_rate": 0.0001722359296678181,
1012
+ "loss": 1.5291,
1013
+ "step": 5850
1014
+ },
1015
+ {
1016
+ "epoch": 0.45381124528882394,
1017
+ "grad_norm": 1.2984132766723633,
1018
+ "learning_rate": 0.00017197620964600163,
1019
+ "loss": 1.4288,
1020
+ "step": 5900
1021
+ },
1022
+ {
1023
+ "epoch": 0.4576571032997462,
1024
+ "grad_norm": 1.1742748022079468,
1025
+ "learning_rate": 0.00017171648962418514,
1026
+ "loss": 1.4943,
1027
+ "step": 5950
1028
+ },
1029
+ {
1030
+ "epoch": 0.4615029613106684,
1031
+ "grad_norm": 1.8346530199050903,
1032
+ "learning_rate": 0.00017145676960236866,
1033
+ "loss": 1.489,
1034
+ "step": 6000
1035
+ },
1036
+ {
1037
+ "epoch": 0.4615029613106684,
1038
+ "eval_loss": 1.4524279832839966,
1039
+ "eval_runtime": 16.8863,
1040
+ "eval_samples_per_second": 59.22,
1041
+ "eval_steps_per_second": 14.805,
1042
+ "step": 6000
1043
  }
1044
  ],
1045
  "logging_steps": 50,