rootxhacker commited on
Commit
cb565e4
·
verified ·
1 Parent(s): be50834

Training in progress, step 33500, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7a1f3a37b9195f9fe5315c1a417cc9c4c1837b6b4960ab692b3988674668e641
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ba4032c8806316e646178801ef99b592ee64fdf0f498f16c746612f51bc00e7
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3523599b620af8d4d35f82aaf704dae1a9541799dcba2ac70510840b2a4877a5
3
  size 1544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2455ad53c45645477aed9b3759432e9e9c8407e4084a49e013986abc8fc7f7ca
3
  size 1544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b004e01986e4ffc28df93cce958d9d9b3e3c05bd2e39ed3961cf317990155cfc
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd6f8832ec1dc1733a71a36aefc780b32e10bd6c5f99ceb18e8b4625154891f2
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0849d6e61493156c95f17fe6b7e25f79c73daada8cac211ebd8c78fd56fdbe07
3
  size 14180
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30531950e4a0b77af65f33843a2ce8e4c0089055b9101a61e4068183a61f16f1
3
  size 14180
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:99769539adfb817adf246fb69dd78f4ed98ef4d44e4b95e77847af02938c82df
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a62584d395be4cf3f57783efb5aff341de6c6d4775795a1ae162154552c4daf8
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2ba7f7caed94fa0fdab770ae562d792042367a76a376e41d1e68e45e9207a740
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:301e3a937444954f3e90b7bce620ef6813e91f5ce01811f0bf70549ea9c3cae1
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 30000,
3
  "best_metric": 0.9945911169052124,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-30000",
5
- "epoch": 2.5382662872086765,
6
  "eval_steps": 250,
7
- "global_step": 33000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -5684,6 +5684,92 @@
5684
  "eval_samples_per_second": 57.647,
5685
  "eval_steps_per_second": 14.412,
5686
  "step": 33000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5687
  }
5688
  ],
5689
  "logging_steps": 50,
 
2
  "best_global_step": 30000,
3
  "best_metric": 0.9945911169052124,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-30000",
5
+ "epoch": 2.576724867317899,
6
  "eval_steps": 250,
7
+ "global_step": 33500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
5684
  "eval_samples_per_second": 57.647,
5685
  "eval_steps_per_second": 14.412,
5686
  "step": 33000
5687
+ },
5688
+ {
5689
+ "epoch": 2.5421121452195985,
5690
+ "grad_norm": 0.7536977529525757,
5691
+ "learning_rate": 3.100018180401527e-05,
5692
+ "loss": 0.9818,
5693
+ "step": 33050
5694
+ },
5695
+ {
5696
+ "epoch": 2.5459580032305205,
5697
+ "grad_norm": 1.3777302503585815,
5698
+ "learning_rate": 3.074046178219879e-05,
5699
+ "loss": 0.953,
5700
+ "step": 33100
5701
+ },
5702
+ {
5703
+ "epoch": 2.549803861241443,
5704
+ "grad_norm": 0.9286239743232727,
5705
+ "learning_rate": 3.048074176038231e-05,
5706
+ "loss": 1.028,
5707
+ "step": 33150
5708
+ },
5709
+ {
5710
+ "epoch": 2.5536497192523653,
5711
+ "grad_norm": 0.6741893291473389,
5712
+ "learning_rate": 3.022102173856583e-05,
5713
+ "loss": 0.9693,
5714
+ "step": 33200
5715
+ },
5716
+ {
5717
+ "epoch": 2.5574955772632872,
5718
+ "grad_norm": 1.3020586967468262,
5719
+ "learning_rate": 2.9961301716749346e-05,
5720
+ "loss": 0.9673,
5721
+ "step": 33250
5722
+ },
5723
+ {
5724
+ "epoch": 2.5574955772632872,
5725
+ "eval_loss": 1.0041394233703613,
5726
+ "eval_runtime": 17.32,
5727
+ "eval_samples_per_second": 57.737,
5728
+ "eval_steps_per_second": 14.434,
5729
+ "step": 33250
5730
+ },
5731
+ {
5732
+ "epoch": 2.5613414352742097,
5733
+ "grad_norm": 1.4816234111785889,
5734
+ "learning_rate": 2.9701581694932862e-05,
5735
+ "loss": 0.9964,
5736
+ "step": 33300
5737
+ },
5738
+ {
5739
+ "epoch": 2.565187293285132,
5740
+ "grad_norm": 0.8813285827636719,
5741
+ "learning_rate": 2.9441861673116382e-05,
5742
+ "loss": 0.966,
5743
+ "step": 33350
5744
+ },
5745
+ {
5746
+ "epoch": 2.569033151296054,
5747
+ "grad_norm": 1.0042293071746826,
5748
+ "learning_rate": 2.9182141651299898e-05,
5749
+ "loss": 0.9254,
5750
+ "step": 33400
5751
+ },
5752
+ {
5753
+ "epoch": 2.5728790093069764,
5754
+ "grad_norm": 1.5775707960128784,
5755
+ "learning_rate": 2.892242162948342e-05,
5756
+ "loss": 1.0215,
5757
+ "step": 33450
5758
+ },
5759
+ {
5760
+ "epoch": 2.576724867317899,
5761
+ "grad_norm": 1.0266311168670654,
5762
+ "learning_rate": 2.8662701607666937e-05,
5763
+ "loss": 0.9323,
5764
+ "step": 33500
5765
+ },
5766
+ {
5767
+ "epoch": 2.576724867317899,
5768
+ "eval_loss": 1.0002070665359497,
5769
+ "eval_runtime": 17.2317,
5770
+ "eval_samples_per_second": 58.033,
5771
+ "eval_steps_per_second": 14.508,
5772
+ "step": 33500
5773
  }
5774
  ],
5775
  "logging_steps": 50,