rootxhacker commited on
Commit
a1d7113
·
verified ·
1 Parent(s): 4ea6931

Training in progress, step 38000, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e3c4fec3fcfea21f991151e26f507a7695fb23bd8b856b2b2f700a67bb497070
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fd57c393f47a10fedc0eeb53eea073bec9f5d74a93432c74ef773c66fc48524
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:af333093453e4833a3b8e0d94d92ddd95f295c0d87e9e98a54a6ad3c390330e9
3
  size 1736
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9bd9ca616ae823c9a3f8ca31216995734a05d8ab02efa11d199d90e7767f414c
3
  size 1736
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c332c5ce1f57e169c0226452b69be2dc4fb900c8955ca04e773762307c8e5eb4
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7db25f3289aeb2b9363ef193bde6f97fc98f831d0d2faf2aba478e02c7461eb7
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ddcf88ff022861d1e6c33a55560d1a3aa75a31ecba95d857fc1b29571146d9d8
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fe094da8ad1e1bf555c74dca2c7341b574c5a3cf7d8c3a98ff15eda79c695fe
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f7b74025bac6cdf338bbaffce8798d5ebfeba84e2c0590feb5feb5210c2d2221
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da55266e7e44775541aba7dfea6ddb4ce98b63d56ca8b7cf213a395f32135776
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4f59e689571d05ebe27330dcd7978075e538dfc70e5b33155dcbd08ae7037e11
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82bb4fe5bf3e8542933d8cb52c350875b68d38b60b96f875a9ab6b9538329c08
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 31000,
3
  "best_metric": 0.7226839661598206,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-31000",
5
- "epoch": 2.8843935081916774,
6
  "eval_steps": 250,
7
- "global_step": 37500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -6458,6 +6458,92 @@
6458
  "eval_samples_per_second": 55.754,
6459
  "eval_steps_per_second": 13.939,
6460
  "step": 37500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6461
  }
6462
  ],
6463
  "logging_steps": 50,
 
2
  "best_global_step": 31000,
3
  "best_metric": 0.7226839661598206,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-31000",
5
+ "epoch": 2.9228520883008997,
6
  "eval_steps": 250,
7
+ "global_step": 38000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
6458
  "eval_samples_per_second": 55.754,
6459
  "eval_steps_per_second": 13.939,
6460
  "step": 37500
6461
+ },
6462
+ {
6463
+ "epoch": 2.8882393662026,
6464
+ "grad_norm": 0.6858485341072083,
6465
+ "learning_rate": 7.6201854400955775e-06,
6466
+ "loss": 0.7132,
6467
+ "step": 37550
6468
+ },
6469
+ {
6470
+ "epoch": 2.892085224213522,
6471
+ "grad_norm": 0.7138088345527649,
6472
+ "learning_rate": 7.3604654182790955e-06,
6473
+ "loss": 0.7082,
6474
+ "step": 37600
6475
+ },
6476
+ {
6477
+ "epoch": 2.895931082224444,
6478
+ "grad_norm": 0.4927150309085846,
6479
+ "learning_rate": 7.100745396462613e-06,
6480
+ "loss": 0.7551,
6481
+ "step": 37650
6482
+ },
6483
+ {
6484
+ "epoch": 2.8997769402353666,
6485
+ "grad_norm": 0.879112720489502,
6486
+ "learning_rate": 6.841025374646131e-06,
6487
+ "loss": 0.7228,
6488
+ "step": 37700
6489
+ },
6490
+ {
6491
+ "epoch": 2.903622798246289,
6492
+ "grad_norm": 1.2699699401855469,
6493
+ "learning_rate": 6.58130535282965e-06,
6494
+ "loss": 0.7208,
6495
+ "step": 37750
6496
+ },
6497
+ {
6498
+ "epoch": 2.903622798246289,
6499
+ "eval_loss": 0.7685362696647644,
6500
+ "eval_runtime": 17.9674,
6501
+ "eval_samples_per_second": 55.656,
6502
+ "eval_steps_per_second": 13.914,
6503
+ "step": 37750
6504
+ },
6505
+ {
6506
+ "epoch": 2.907468656257211,
6507
+ "grad_norm": 0.7341476082801819,
6508
+ "learning_rate": 6.321585331013168e-06,
6509
+ "loss": 0.761,
6510
+ "step": 37800
6511
+ },
6512
+ {
6513
+ "epoch": 2.9113145142681334,
6514
+ "grad_norm": 0.8890082836151123,
6515
+ "learning_rate": 6.061865309196686e-06,
6516
+ "loss": 0.6837,
6517
+ "step": 37850
6518
+ },
6519
+ {
6520
+ "epoch": 2.9151603722790553,
6521
+ "grad_norm": 0.5546180009841919,
6522
+ "learning_rate": 5.802145287380204e-06,
6523
+ "loss": 0.7126,
6524
+ "step": 37900
6525
+ },
6526
+ {
6527
+ "epoch": 2.9190062302899777,
6528
+ "grad_norm": 0.7684674263000488,
6529
+ "learning_rate": 5.542425265563723e-06,
6530
+ "loss": 0.6765,
6531
+ "step": 37950
6532
+ },
6533
+ {
6534
+ "epoch": 2.9228520883008997,
6535
+ "grad_norm": 0.8968291282653809,
6536
+ "learning_rate": 5.2827052437472405e-06,
6537
+ "loss": 0.6839,
6538
+ "step": 38000
6539
+ },
6540
+ {
6541
+ "epoch": 2.9228520883008997,
6542
+ "eval_loss": 0.7687397003173828,
6543
+ "eval_runtime": 17.8165,
6544
+ "eval_samples_per_second": 56.128,
6545
+ "eval_steps_per_second": 14.032,
6546
+ "step": 38000
6547
  }
6548
  ],
6549
  "logging_steps": 50,