rootxhacker commited on
Commit
54f0ca1
·
verified ·
1 Parent(s): 0d05826

Training in progress, step 32000, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7dc19b8d0d5f9136639755d9316a3022b8c82a5289f75b8c2a154ea24a7ec37d
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19d9bd7de028454d166b4a1c6d6f3145ed67ff36482f791a79118ea7b7d201ab
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:77557a289798db28dd4dc90cd32e22abe79a243a7d8657956d33bce4d7666e79
3
  size 1544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3efe4a639c0cf535238d781f181b5f7410e28e813293a3ad08dd1b3c0569ebd
3
  size 1544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4263d1c23e4d38ddf0a4a29df3a3b188cb0c869be730f51b663c9aae88580c07
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4f5b2ce31636fea31b4a89764e7b37be4b908e5ead9294fd64eb17613e89d11
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:34336c82053d260113435e2b759b35a50c0eba98515a30dfe9d41e121f34b323
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f48c0047bbeb15d4e945ddf8a422e66a19ddd71e12c9b8b2e5a3e449379fb78
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d859bf97583170267785e1e8320d8e4f984a79e2c33679e5f98c773a6e6e145a
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b918fd89981e331e86195be60fa3132ecc53927ce3bb181201004c9e6a502ae5
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d10804979bf6e76891746681a7665a759c1b00ee5b7dc26a2cd76065e4556d2b
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e779fea59867c3454c83f513ec8ab50e6683297addf1c5a422af8000a78db3f7
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 30000,
3
  "best_metric": 0.9945911169052124,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-30000",
5
- "epoch": 2.422890546881009,
6
  "eval_steps": 250,
7
- "global_step": 31500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -5426,6 +5426,92 @@
5426
  "eval_samples_per_second": 58.456,
5427
  "eval_steps_per_second": 14.614,
5428
  "step": 31500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5429
  }
5430
  ],
5431
  "logging_steps": 50,
 
2
  "best_global_step": 30000,
3
  "best_metric": 0.9945911169052124,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-30000",
5
+ "epoch": 2.4613491269902315,
6
  "eval_steps": 250,
7
+ "global_step": 32000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
5426
  "eval_samples_per_second": 58.456,
5427
  "eval_steps_per_second": 14.614,
5428
  "step": 31500
5429
+ },
5430
+ {
5431
+ "epoch": 2.4267364048919315,
5432
+ "grad_norm": 1.3409994840621948,
5433
+ "learning_rate": 3.879178245850973e-05,
5434
+ "loss": 0.9546,
5435
+ "step": 31550
5436
+ },
5437
+ {
5438
+ "epoch": 2.4305822629028535,
5439
+ "grad_norm": 1.482633352279663,
5440
+ "learning_rate": 3.853206243669324e-05,
5441
+ "loss": 1.0155,
5442
+ "step": 31600
5443
+ },
5444
+ {
5445
+ "epoch": 2.434428120913776,
5446
+ "grad_norm": 1.0458152294158936,
5447
+ "learning_rate": 3.827234241487677e-05,
5448
+ "loss": 0.989,
5449
+ "step": 31650
5450
+ },
5451
+ {
5452
+ "epoch": 2.4382739789246983,
5453
+ "grad_norm": 0.9805555939674377,
5454
+ "learning_rate": 3.801262239306028e-05,
5455
+ "loss": 0.9125,
5456
+ "step": 31700
5457
+ },
5458
+ {
5459
+ "epoch": 2.4421198369356203,
5460
+ "grad_norm": 1.5680670738220215,
5461
+ "learning_rate": 3.77529023712438e-05,
5462
+ "loss": 0.9713,
5463
+ "step": 31750
5464
+ },
5465
+ {
5466
+ "epoch": 2.4421198369356203,
5467
+ "eval_loss": 0.9981379508972168,
5468
+ "eval_runtime": 17.3284,
5469
+ "eval_samples_per_second": 57.709,
5470
+ "eval_steps_per_second": 14.427,
5471
+ "step": 31750
5472
+ },
5473
+ {
5474
+ "epoch": 2.4459656949465427,
5475
+ "grad_norm": 1.0316798686981201,
5476
+ "learning_rate": 3.749318234942732e-05,
5477
+ "loss": 0.9689,
5478
+ "step": 31800
5479
+ },
5480
+ {
5481
+ "epoch": 2.4498115529574647,
5482
+ "grad_norm": 0.6630721092224121,
5483
+ "learning_rate": 3.7233462327610834e-05,
5484
+ "loss": 0.9772,
5485
+ "step": 31850
5486
+ },
5487
+ {
5488
+ "epoch": 2.453657410968387,
5489
+ "grad_norm": 1.1662702560424805,
5490
+ "learning_rate": 3.6973742305794354e-05,
5491
+ "loss": 1.0165,
5492
+ "step": 31900
5493
+ },
5494
+ {
5495
+ "epoch": 2.457503268979309,
5496
+ "grad_norm": 1.0451244115829468,
5497
+ "learning_rate": 3.671402228397787e-05,
5498
+ "loss": 1.0233,
5499
+ "step": 31950
5500
+ },
5501
+ {
5502
+ "epoch": 2.4613491269902315,
5503
+ "grad_norm": 0.9077771306037903,
5504
+ "learning_rate": 3.645430226216139e-05,
5505
+ "loss": 0.9797,
5506
+ "step": 32000
5507
+ },
5508
+ {
5509
+ "epoch": 2.4613491269902315,
5510
+ "eval_loss": 0.9961766004562378,
5511
+ "eval_runtime": 17.2799,
5512
+ "eval_samples_per_second": 57.871,
5513
+ "eval_steps_per_second": 14.468,
5514
+ "step": 32000
5515
  }
5516
  ],
5517
  "logging_steps": 50,