rootxhacker commited on
Commit
782c8d3
·
verified ·
1 Parent(s): 27db481

Training in progress, step 32500, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:19d9bd7de028454d166b4a1c6d6f3145ed67ff36482f791a79118ea7b7d201ab
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d47a059c4465cb96ca8cf7f1905ca26df8afde99f0c2208111a3832ed682273e
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a3efe4a639c0cf535238d781f181b5f7410e28e813293a3ad08dd1b3c0569ebd
3
  size 1544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:789a7c970269f3838d005c341e4869fd88818ad8ae5141deea1681f158455f61
3
  size 1544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e4f5b2ce31636fea31b4a89764e7b37be4b908e5ead9294fd64eb17613e89d11
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01682574d44e97467301d5779733da7210577aa9e9ec38e6d369a4e1bb9c71a7
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7f48c0047bbeb15d4e945ddf8a422e66a19ddd71e12c9b8b2e5a3e449379fb78
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e10cec93434f8ec9066e53d88256d0df13c4dfad53975c2a473bada794e39de4
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b918fd89981e331e86195be60fa3132ecc53927ce3bb181201004c9e6a502ae5
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe23086b61822081f0f874226d60c752bbd88420dba9100921fe74a8fe8db57f
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e779fea59867c3454c83f513ec8ab50e6683297addf1c5a422af8000a78db3f7
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16e4c0e7d997f50c97bce12877fd963ff1e035235b3d794e37197e971fb5ab23
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 30000,
3
  "best_metric": 0.9945911169052124,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-30000",
5
- "epoch": 2.4613491269902315,
6
  "eval_steps": 250,
7
- "global_step": 32000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -5512,6 +5512,92 @@
5512
  "eval_samples_per_second": 57.871,
5513
  "eval_steps_per_second": 14.468,
5514
  "step": 32000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5515
  }
5516
  ],
5517
  "logging_steps": 50,
 
2
  "best_global_step": 30000,
3
  "best_metric": 0.9945911169052124,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-30000",
5
+ "epoch": 2.4998077070994538,
6
  "eval_steps": 250,
7
+ "global_step": 32500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
5512
  "eval_samples_per_second": 57.871,
5513
  "eval_steps_per_second": 14.468,
5514
  "step": 32000
5515
+ },
5516
+ {
5517
+ "epoch": 2.465194985001154,
5518
+ "grad_norm": 0.999718964099884,
5519
+ "learning_rate": 3.619458224034491e-05,
5520
+ "loss": 0.9725,
5521
+ "step": 32050
5522
+ },
5523
+ {
5524
+ "epoch": 2.469040843012076,
5525
+ "grad_norm": 2.740297794342041,
5526
+ "learning_rate": 3.5934862218528425e-05,
5527
+ "loss": 0.9838,
5528
+ "step": 32100
5529
+ },
5530
+ {
5531
+ "epoch": 2.4728867010229982,
5532
+ "grad_norm": 1.199425458908081,
5533
+ "learning_rate": 3.5675142196711945e-05,
5534
+ "loss": 0.9807,
5535
+ "step": 32150
5536
+ },
5537
+ {
5538
+ "epoch": 2.4767325590339206,
5539
+ "grad_norm": 0.7113758325576782,
5540
+ "learning_rate": 3.5415422174895465e-05,
5541
+ "loss": 1.0046,
5542
+ "step": 32200
5543
+ },
5544
+ {
5545
+ "epoch": 2.4805784170448426,
5546
+ "grad_norm": 0.9929390549659729,
5547
+ "learning_rate": 3.5155702153078984e-05,
5548
+ "loss": 0.9692,
5549
+ "step": 32250
5550
+ },
5551
+ {
5552
+ "epoch": 2.4805784170448426,
5553
+ "eval_loss": 1.002519965171814,
5554
+ "eval_runtime": 17.3042,
5555
+ "eval_samples_per_second": 57.789,
5556
+ "eval_steps_per_second": 14.447,
5557
+ "step": 32250
5558
+ },
5559
+ {
5560
+ "epoch": 2.484424275055765,
5561
+ "grad_norm": 0.8170703649520874,
5562
+ "learning_rate": 3.48959821312625e-05,
5563
+ "loss": 0.982,
5564
+ "step": 32300
5565
+ },
5566
+ {
5567
+ "epoch": 2.488270133066687,
5568
+ "grad_norm": 0.8909692168235779,
5569
+ "learning_rate": 3.463626210944602e-05,
5570
+ "loss": 0.9953,
5571
+ "step": 32350
5572
+ },
5573
+ {
5574
+ "epoch": 2.4921159910776094,
5575
+ "grad_norm": 1.806539535522461,
5576
+ "learning_rate": 3.4376542087629536e-05,
5577
+ "loss": 1.0069,
5578
+ "step": 32400
5579
+ },
5580
+ {
5581
+ "epoch": 2.495961849088532,
5582
+ "grad_norm": 1.4509518146514893,
5583
+ "learning_rate": 3.4116822065813056e-05,
5584
+ "loss": 0.9642,
5585
+ "step": 32450
5586
+ },
5587
+ {
5588
+ "epoch": 2.4998077070994538,
5589
+ "grad_norm": 1.0312175750732422,
5590
+ "learning_rate": 3.3857102043996575e-05,
5591
+ "loss": 0.9921,
5592
+ "step": 32500
5593
+ },
5594
+ {
5595
+ "epoch": 2.4998077070994538,
5596
+ "eval_loss": 0.9993879199028015,
5597
+ "eval_runtime": 17.3389,
5598
+ "eval_samples_per_second": 57.674,
5599
+ "eval_steps_per_second": 14.418,
5600
+ "step": 32500
5601
  }
5602
  ],
5603
  "logging_steps": 50,