rootxhacker commited on
Commit
bb69b24
·
verified ·
1 Parent(s): 067ba33

Training in progress, step 27500, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c71cb6762a3f2359c9b24c07c0f2c18222a0855ef4122d25dd24f1be773077c
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35ce5e6c86a1bf47cdce58143c5b09c73002dd5d89b9322534b522adf2b979c2
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c7562e2e11d39589f1d1677624c9cbfb42e6035b41d3ee891b0f53a0cc6bfe79
3
  size 1544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5105319d30175c31c325f622351d24750b6ebc93a4a760e15dcddafd219a41e3
3
  size 1544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dc1dfd01f40336797b539a0d0ca763264a6fc70cdf83f8431ae379e9a2d8dff9
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:537fd28e956b28024f32059bbc52f49d60f5e4fb3a227aae07af0b56eace7847
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a7cb9cecde71619f5455094db9dbc10b01ced14b7fff166fcfd1f46df6e480f1
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e5855dbe60c612d06e5ce5a68c9b6c059c395e1394e85fd59ba8464398cb7a8
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e2a94b30a1039d003ca39bb6fcc94430e37b0c6c69456a996151d312d106dd61
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7eb460d7eba992c8af886ac0898482ee899dab9ae84de674b2941e35c95d2bc1
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1412b21a67b3e14f57e3f3d27ac855c98641b3c473e09eb37b8289635d633513
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d3faad18edd2356e2cb54ce0b6a6c9de80399948e06a3d1f3780847487f93c5
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 24500,
3
- "best_metric": 1.445096731185913,
4
- "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-24500",
5
- "epoch": 2.076763325898008,
6
  "eval_steps": 250,
7
- "global_step": 27000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -4652,6 +4652,92 @@
4652
  "eval_samples_per_second": 55.662,
4653
  "eval_steps_per_second": 13.915,
4654
  "step": 27000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4655
  }
4656
  ],
4657
  "logging_steps": 50,
 
1
  {
2
+ "best_global_step": 27500,
3
+ "best_metric": 1.0159448385238647,
4
+ "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-27500",
5
+ "epoch": 2.11522190600723,
6
  "eval_steps": 250,
7
+ "global_step": 27500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
4652
  "eval_samples_per_second": 55.662,
4653
  "eval_steps_per_second": 13.915,
4654
  "step": 27000
4655
+ },
4656
+ {
4657
+ "epoch": 2.0806091839089302,
4658
+ "grad_norm": 0.9695401191711426,
4659
+ "learning_rate": 6.216139002155676e-05,
4660
+ "loss": 1.4943,
4661
+ "step": 27050
4662
+ },
4663
+ {
4664
+ "epoch": 2.084455041919852,
4665
+ "grad_norm": 1.243717074394226,
4666
+ "learning_rate": 6.190166999974029e-05,
4667
+ "loss": 1.4199,
4668
+ "step": 27100
4669
+ },
4670
+ {
4671
+ "epoch": 2.0883008999307746,
4672
+ "grad_norm": 1.6151024103164673,
4673
+ "learning_rate": 6.16419499779238e-05,
4674
+ "loss": 1.4248,
4675
+ "step": 27150
4676
+ },
4677
+ {
4678
+ "epoch": 2.0921467579416966,
4679
+ "grad_norm": 1.7448607683181763,
4680
+ "learning_rate": 6.138222995610731e-05,
4681
+ "loss": 1.3944,
4682
+ "step": 27200
4683
+ },
4684
+ {
4685
+ "epoch": 2.095992615952619,
4686
+ "grad_norm": 3.0997345447540283,
4687
+ "learning_rate": 6.112250993429084e-05,
4688
+ "loss": 1.4174,
4689
+ "step": 27250
4690
+ },
4691
+ {
4692
+ "epoch": 2.095992615952619,
4693
+ "eval_loss": 1.4659229516983032,
4694
+ "eval_runtime": 18.0653,
4695
+ "eval_samples_per_second": 55.355,
4696
+ "eval_steps_per_second": 13.839,
4697
+ "step": 27250
4698
+ },
4699
+ {
4700
+ "epoch": 2.0998384739635414,
4701
+ "grad_norm": 1.637845754623413,
4702
+ "learning_rate": 6.086278991247436e-05,
4703
+ "loss": 1.446,
4704
+ "step": 27300
4705
+ },
4706
+ {
4707
+ "epoch": 2.1036843319744634,
4708
+ "grad_norm": 1.4263664484024048,
4709
+ "learning_rate": 6.060306989065787e-05,
4710
+ "loss": 0.9793,
4711
+ "step": 27350
4712
+ },
4713
+ {
4714
+ "epoch": 2.1075301899853858,
4715
+ "grad_norm": 0.8709418773651123,
4716
+ "learning_rate": 6.034334986884139e-05,
4717
+ "loss": 0.9715,
4718
+ "step": 27400
4719
+ },
4720
+ {
4721
+ "epoch": 2.111376047996308,
4722
+ "grad_norm": 0.8483341336250305,
4723
+ "learning_rate": 6.008362984702491e-05,
4724
+ "loss": 0.9163,
4725
+ "step": 27450
4726
+ },
4727
+ {
4728
+ "epoch": 2.11522190600723,
4729
+ "grad_norm": 2.070937156677246,
4730
+ "learning_rate": 5.9823909825208425e-05,
4731
+ "loss": 1.0047,
4732
+ "step": 27500
4733
+ },
4734
+ {
4735
+ "epoch": 2.11522190600723,
4736
+ "eval_loss": 1.0159448385238647,
4737
+ "eval_runtime": 17.7021,
4738
+ "eval_samples_per_second": 56.49,
4739
+ "eval_steps_per_second": 14.123,
4740
+ "step": 27500
4741
  }
4742
  ],
4743
  "logging_steps": 50,