rootxhacker commited on
Commit
9a5e25b
·
verified ·
1 Parent(s): 7f03de6

Training in progress, step 26000, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a05a340cb4a65f48636e96ed4fd91629d922458e974787fca1ba7f6545c46cb6
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:354784630980b3e128043f599d1fa81d4eaeefccc49f9c73ac417f4b9affdc81
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe554b76c07e1e707d896c2ee3a20371f26db4350a7a78776a0cbae8a2db2c39
3
  size 1544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a382cd1d7b1cfe5578921e4a35263f149f5e86ef7359d296d8b1f906cce62a74
3
  size 1544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d55ae62412810c5314e1159d09e99db512bb7ac1a37d12bf0208475b2b472ef4
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fbdd51e862aa846114442fbe4fc73ff82d5222c26562144ee40037d5d63ab0b6
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dc69f04c57ac233f68440607df3025c3f527f698c64e56350e0ea45b99be0781
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35c260873e53de579d314af7f23d76fd9a02c023129e1ca7c8f1d3d5f4fae1d0
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ce31cedb3c2765a684ec6f8057f362dc008c191e855761ff2fb30ba5f1fb29d
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bfd4827b4f5f4123b9a08cd207611b32b5022ac9c327a327659c2a44bd51e209
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ec634d9549d9c3645447089832de3b53917dd1ce5acd38abf0faed5b1df6f1af
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f5beeb269815e15f5dc6759e189a2780818b22a064798960c77eef6918e2b17
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 24500,
3
  "best_metric": 1.445096731185913,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-24500",
5
- "epoch": 1.9613875855703409,
6
  "eval_steps": 250,
7
- "global_step": 25500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -4394,6 +4394,92 @@
4394
  "eval_samples_per_second": 53.848,
4395
  "eval_steps_per_second": 13.462,
4396
  "step": 25500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4397
  }
4398
  ],
4399
  "logging_steps": 50,
 
2
  "best_global_step": 24500,
3
  "best_metric": 1.445096731185913,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-24500",
5
+ "epoch": 1.9998461656795632,
6
  "eval_steps": 250,
7
+ "global_step": 26000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
4394
  "eval_samples_per_second": 53.848,
4395
  "eval_steps_per_second": 13.462,
4396
  "step": 25500
4397
+ },
4398
+ {
4399
+ "epoch": 1.9652334435812628,
4400
+ "grad_norm": 1.808030128479004,
4401
+ "learning_rate": 6.994779627561489e-05,
4402
+ "loss": 1.4254,
4403
+ "step": 25550
4404
+ },
4405
+ {
4406
+ "epoch": 1.9690793015921852,
4407
+ "grad_norm": 1.634099006652832,
4408
+ "learning_rate": 6.96880762537984e-05,
4409
+ "loss": 1.3325,
4410
+ "step": 25600
4411
+ },
4412
+ {
4413
+ "epoch": 1.9729251596031074,
4414
+ "grad_norm": 0.8857108354568481,
4415
+ "learning_rate": 6.942835623198193e-05,
4416
+ "loss": 1.3983,
4417
+ "step": 25650
4418
+ },
4419
+ {
4420
+ "epoch": 1.9767710176140296,
4421
+ "grad_norm": 1.6114498376846313,
4422
+ "learning_rate": 6.916863621016545e-05,
4423
+ "loss": 1.3348,
4424
+ "step": 25700
4425
+ },
4426
+ {
4427
+ "epoch": 1.980616875624952,
4428
+ "grad_norm": 1.4415462017059326,
4429
+ "learning_rate": 6.890891618834895e-05,
4430
+ "loss": 1.4617,
4431
+ "step": 25750
4432
+ },
4433
+ {
4434
+ "epoch": 1.980616875624952,
4435
+ "eval_loss": 1.4457746744155884,
4436
+ "eval_runtime": 17.9567,
4437
+ "eval_samples_per_second": 55.689,
4438
+ "eval_steps_per_second": 13.922,
4439
+ "step": 25750
4440
+ },
4441
+ {
4442
+ "epoch": 1.984462733635874,
4443
+ "grad_norm": 1.9614554643630981,
4444
+ "learning_rate": 6.864919616653248e-05,
4445
+ "loss": 1.3813,
4446
+ "step": 25800
4447
+ },
4448
+ {
4449
+ "epoch": 1.9883085916467964,
4450
+ "grad_norm": 1.2938437461853027,
4451
+ "learning_rate": 6.8389476144716e-05,
4452
+ "loss": 1.4047,
4453
+ "step": 25850
4454
+ },
4455
+ {
4456
+ "epoch": 1.9921544496577186,
4457
+ "grad_norm": 2.1129326820373535,
4458
+ "learning_rate": 6.812975612289952e-05,
4459
+ "loss": 1.4362,
4460
+ "step": 25900
4461
+ },
4462
+ {
4463
+ "epoch": 1.9960003076686408,
4464
+ "grad_norm": 0.8634279370307922,
4465
+ "learning_rate": 6.787003610108303e-05,
4466
+ "loss": 1.4805,
4467
+ "step": 25950
4468
+ },
4469
+ {
4470
+ "epoch": 1.9998461656795632,
4471
+ "grad_norm": 2.995699405670166,
4472
+ "learning_rate": 6.761031607926656e-05,
4473
+ "loss": 1.5073,
4474
+ "step": 26000
4475
+ },
4476
+ {
4477
+ "epoch": 1.9998461656795632,
4478
+ "eval_loss": 1.453719973564148,
4479
+ "eval_runtime": 18.0595,
4480
+ "eval_samples_per_second": 55.373,
4481
+ "eval_steps_per_second": 13.843,
4482
+ "step": 26000
4483
  }
4484
  ],
4485
  "logging_steps": 50,