rootxhacker commited on
Commit
760f2a1
·
verified ·
1 Parent(s): 9708600

Training in progress, step 4500, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7b1420e5f67ba76bfd4febfb8166681a03c08ca555de4aa6aed11752038beb7c
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32736256c22dee581cce726cace4ad49e7d2340e9e0d45e70e795a7c7d75017f
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:631f5d8920185c1643d4b91793959905c6ffb5cfdb99578fa1feeb9561f6cc11
3
  size 1544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41608b990c978ab6d8dc1c26793cb750782238b85c3400b76fa4199137903300
3
  size 1544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b56e183e85858df2561ffd8210747bca3130019aa445c6931bdecb14ee1c1463
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0abbf9e53e670e94b4d6c9f0b871f16259814e74491593da1bf6db0fb9680155
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ba374ceeab3c18ecca1a51999f0124017113854b9f36714acb5b3cbd2a2d7ce
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:271210047536fd837cd0fd091596a0f630f6e94e0fa870a34b128422c282005c
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:56099c2856f5340cf7eae161f2a31dbe463e29390c14dc50fb171114345187df
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51de76fc3d194041ce1d9d52ff2b3fc00cdee2e0aeb7b6d8e431343a71a85eb4
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:97c85fac85989286832186f4fae10d665a033afecb7b12aeb8bf5a4a199aa56c
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da9784da0d0932d47262fa459292b039ea021966742bee090e5b53abad4765f5
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 3500,
3
  "best_metric": 4.520543098449707,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-3500",
5
- "epoch": 0.30766864087377893,
6
  "eval_steps": 250,
7
- "global_step": 4000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -696,6 +696,92 @@
696
  "eval_samples_per_second": 54.279,
697
  "eval_steps_per_second": 13.57,
698
  "step": 4000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
699
  }
700
  ],
701
  "logging_steps": 50,
 
2
  "best_global_step": 3500,
3
  "best_metric": 4.520543098449707,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-3500",
5
+ "epoch": 0.3461272209830013,
6
  "eval_steps": 250,
7
+ "global_step": 4500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
696
  "eval_samples_per_second": 54.279,
697
  "eval_steps_per_second": 13.57,
698
  "step": 4000
699
+ },
700
+ {
701
+ "epoch": 0.3115144988847012,
702
+ "grad_norm": 5.374965190887451,
703
+ "learning_rate": 0.00018159623925408412,
704
+ "loss": 4.5327,
705
+ "step": 4050
706
+ },
707
+ {
708
+ "epoch": 0.3153603568956234,
709
+ "grad_norm": 4.99652624130249,
710
+ "learning_rate": 0.00018133651923226763,
711
+ "loss": 4.3966,
712
+ "step": 4100
713
+ },
714
+ {
715
+ "epoch": 0.31920621490654566,
716
+ "grad_norm": 6.257124423980713,
717
+ "learning_rate": 0.00018107679921045114,
718
+ "loss": 4.5792,
719
+ "step": 4150
720
+ },
721
+ {
722
+ "epoch": 0.3230520729174679,
723
+ "grad_norm": 8.056533813476562,
724
+ "learning_rate": 0.00018081707918863465,
725
+ "loss": 4.6401,
726
+ "step": 4200
727
+ },
728
+ {
729
+ "epoch": 0.32689793092839015,
730
+ "grad_norm": 4.024567127227783,
731
+ "learning_rate": 0.00018055735916681817,
732
+ "loss": 4.5516,
733
+ "step": 4250
734
+ },
735
+ {
736
+ "epoch": 0.32689793092839015,
737
+ "eval_loss": 4.558110237121582,
738
+ "eval_runtime": 18.5343,
739
+ "eval_samples_per_second": 53.954,
740
+ "eval_steps_per_second": 13.488,
741
+ "step": 4250
742
+ },
743
+ {
744
+ "epoch": 0.33074378893931233,
745
+ "grad_norm": 2.4326066970825195,
746
+ "learning_rate": 0.0001802976391450017,
747
+ "loss": 4.5761,
748
+ "step": 4300
749
+ },
750
+ {
751
+ "epoch": 0.3345896469502346,
752
+ "grad_norm": 2.7615299224853516,
753
+ "learning_rate": 0.00018003791912318522,
754
+ "loss": 4.4291,
755
+ "step": 4350
756
+ },
757
+ {
758
+ "epoch": 0.3384355049611568,
759
+ "grad_norm": 3.9387362003326416,
760
+ "learning_rate": 0.00017977819910136873,
761
+ "loss": 4.5422,
762
+ "step": 4400
763
+ },
764
+ {
765
+ "epoch": 0.34228136297207906,
766
+ "grad_norm": 23.72602653503418,
767
+ "learning_rate": 0.00017951847907955227,
768
+ "loss": 4.4379,
769
+ "step": 4450
770
+ },
771
+ {
772
+ "epoch": 0.3461272209830013,
773
+ "grad_norm": 2.968930959701538,
774
+ "learning_rate": 0.0001792639534581721,
775
+ "loss": 4.433,
776
+ "step": 4500
777
+ },
778
+ {
779
+ "epoch": 0.3461272209830013,
780
+ "eval_loss": 4.5359063148498535,
781
+ "eval_runtime": 18.5422,
782
+ "eval_samples_per_second": 53.931,
783
+ "eval_steps_per_second": 13.483,
784
+ "step": 4500
785
  }
786
  ],
787
  "logging_steps": 50,