rootxhacker committed on
Commit
c154a37
·
verified ·
1 Parent(s): 1a25af7

Training in progress, step 14500, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:13e9082dd993ab0c4dc4999c1db1ee4781bb37e4ef2b3309b62916fe0af14e9e
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5de88d64234be7632faf6ed628466ea75cb72606709e8a9670ff3263d20b99b2
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3b05a5a771bbfa42b5ce6876a4e742b487145ad1b23810ea34ba9924b54cc834
3
  size 1544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac7a2ed0ceb2c14c05b2e472c85dab7e8d15b84be1a5716c1b4854657649f724
3
  size 1544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c567148d53eafd6022545201901938ff6ac986ce6ba91de6582e61fe1a67fdf3
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:941a4797b295e526292ea21153bdb7a4de0cee47eeeefcced80807826927615e
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5de168b313b50f7920582863eb6c48735221da70f052aa0c3517b7e8965981bd
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8ea42701e6bd5369fc7af2447cde260122e2711abf45d46209ed918523c1a2c
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6148534a27a25fb6f834b4dad22172177ef760e29ec4f90db326b0fc73929937
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:217ca02994358ecc2a1db89215641d4738177464b90707bbe2cb909f480a3316
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3d4b25db822a02d6858ac9bb141ed0e837701c9de7d32c7960967feccd1d18fc
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9bd4c9fae5d6170e75be05d4525938eac243e67e0a631b43205d6ab8dd428bda
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 13750,
3
  "best_metric": 1.5073590278625488,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-13000",
5
- "epoch": 1.0768402430582262,
6
  "eval_steps": 250,
7
- "global_step": 14000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -2416,6 +2416,92 @@
2416
  "eval_samples_per_second": 56.077,
2417
  "eval_steps_per_second": 14.019,
2418
  "step": 14000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2419
  }
2420
  ],
2421
  "logging_steps": 50,
 
2
  "best_global_step": 13750,
3
  "best_metric": 1.5073590278625488,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-13000",
5
+ "epoch": 1.1152988231674485,
6
  "eval_steps": 250,
7
+ "global_step": 14500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
2416
  "eval_samples_per_second": 56.077,
2417
  "eval_steps_per_second": 14.019,
2418
  "step": 14000
2419
+ },
2420
+ {
2421
+ "epoch": 1.0806861010691486,
2422
+ "grad_norm": 2.1172475814819336,
2423
+ "learning_rate": 0.00012966781809209673,
2424
+ "loss": 1.4055,
2425
+ "step": 14050
2426
+ },
2427
+ {
2428
+ "epoch": 1.0845319590800708,
2429
+ "grad_norm": 1.196999430656433,
2430
+ "learning_rate": 0.00012940809807028024,
2431
+ "loss": 1.464,
2432
+ "step": 14100
2433
+ },
2434
+ {
2435
+ "epoch": 1.088377817090993,
2436
+ "grad_norm": 1.3582040071487427,
2437
+ "learning_rate": 0.00012914837804846375,
2438
+ "loss": 1.4502,
2439
+ "step": 14150
2440
+ },
2441
+ {
2442
+ "epoch": 1.0922236751019152,
2443
+ "grad_norm": 1.6588162183761597,
2444
+ "learning_rate": 0.0001288886580266473,
2445
+ "loss": 1.5174,
2446
+ "step": 14200
2447
+ },
2448
+ {
2449
+ "epoch": 1.0960695331128374,
2450
+ "grad_norm": 1.7531650066375732,
2451
+ "learning_rate": 0.0001286289380048308,
2452
+ "loss": 1.505,
2453
+ "step": 14250
2454
+ },
2455
+ {
2456
+ "epoch": 1.0960695331128374,
2457
+ "eval_loss": 1.5160688161849976,
2458
+ "eval_runtime": 17.764,
2459
+ "eval_samples_per_second": 56.294,
2460
+ "eval_steps_per_second": 14.073,
2461
+ "step": 14250
2462
+ },
2463
+ {
2464
+ "epoch": 1.0999153911237598,
2465
+ "grad_norm": 1.868784785270691,
2466
+ "learning_rate": 0.00012836921798301432,
2467
+ "loss": 1.5544,
2468
+ "step": 14300
2469
+ },
2470
+ {
2471
+ "epoch": 1.103761249134682,
2472
+ "grad_norm": 1.9493080377578735,
2473
+ "learning_rate": 0.00012810949796119783,
2474
+ "loss": 1.533,
2475
+ "step": 14350
2476
+ },
2477
+ {
2478
+ "epoch": 1.1076071071456042,
2479
+ "grad_norm": 0.7309526801109314,
2480
+ "learning_rate": 0.00012784977793938135,
2481
+ "loss": 1.4672,
2482
+ "step": 14400
2483
+ },
2484
+ {
2485
+ "epoch": 1.1114529651565264,
2486
+ "grad_norm": 1.3281447887420654,
2487
+ "learning_rate": 0.00012759005791756486,
2488
+ "loss": 1.3874,
2489
+ "step": 14450
2490
+ },
2491
+ {
2492
+ "epoch": 1.1152988231674485,
2493
+ "grad_norm": 1.0158611536026,
2494
+ "learning_rate": 0.0001273303378957484,
2495
+ "loss": 1.4966,
2496
+ "step": 14500
2497
+ },
2498
+ {
2499
+ "epoch": 1.1152988231674485,
2500
+ "eval_loss": 1.5160739421844482,
2501
+ "eval_runtime": 17.6672,
2502
+ "eval_samples_per_second": 56.602,
2503
+ "eval_steps_per_second": 14.151,
2504
+ "step": 14500
2505
  }
2506
  ],
2507
  "logging_steps": 50,