rootxhacker commited on
Commit
39fd32e
·
verified ·
1 Parent(s): 8adf1a2

Training in progress, step 19500, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:31847bb52936d686e74359d3478c14923c1ebe168be3dabe55eeb97e094e4e4d
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1fd7698db7af5ca1d96c523abf1ce3ed39dad6f1ef364885f5698168d5072eab
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a28811b9b6f21f7c3eb8dd1560ffdbc347e72ba020959bb8f5bc088d847bdc83
3
  size 1544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d356319b5cb8614b773ad954915afabc933d54cfb874f3f02d0e30cd4ce665d3
3
  size 1544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:40965b88e5eb22bf8d3caa10525eb8f13ed0f07bce8d46631079916b2bb29747
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a96cf13c25e993c5a75039856a7a5ef57f09af02fd14f8120fb00ff3c830655
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3c57dd490464340c9b3aa212b9d3844b50cfd1f6b44323e804e87459d3ff333e
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa7c19bbb017976e63ac5e9fec3eea0eda0cf5868e0275e6b00fde078e2c850d
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dbc432474a75821e9b2dae49e65dbd5211090e2d95ceeb48957adde037f27b78
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f8f3437cd7c6266ef3d6b26d1f23a26258ce02afba475c3dabc69b494e62bdf
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:68cdaa34d552da65c658445f52e286a15f93a5093fe3daa82953914a2ad847cc
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51597cfa5b705f0eeeef37eec7f4e933d1fd3032aa1f165769969345026a8d82
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 18750,
3
  "best_metric": 1.4757392406463623,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-15500",
5
- "epoch": 1.4614260441504499,
6
  "eval_steps": 250,
7
- "global_step": 19000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -3276,6 +3276,92 @@
3276
  "eval_samples_per_second": 56.258,
3277
  "eval_steps_per_second": 14.065,
3278
  "step": 19000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3279
  }
3280
  ],
3281
  "logging_steps": 50,
 
2
  "best_global_step": 18750,
3
  "best_metric": 1.4757392406463623,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-15500",
5
+ "epoch": 1.4998846242596724,
6
  "eval_steps": 250,
7
+ "global_step": 19500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
3276
  "eval_samples_per_second": 56.258,
3277
  "eval_steps_per_second": 14.065,
3278
  "step": 19000
3279
+ },
3280
+ {
3281
+ "epoch": 1.4652719021613723,
3282
+ "grad_norm": 1.2875189781188965,
3283
+ "learning_rate": 0.00010370101031088487,
3284
+ "loss": 1.4826,
3285
+ "step": 19050
3286
+ },
3287
+ {
3288
+ "epoch": 1.4691177601722945,
3289
+ "grad_norm": 1.7036223411560059,
3290
+ "learning_rate": 0.00010344129028906839,
3291
+ "loss": 1.4392,
3292
+ "step": 19100
3293
+ },
3294
+ {
3295
+ "epoch": 1.4729636181832166,
3296
+ "grad_norm": 1.537514328956604,
3297
+ "learning_rate": 0.0001031815702672519,
3298
+ "loss": 1.4846,
3299
+ "step": 19150
3300
+ },
3301
+ {
3302
+ "epoch": 1.476809476194139,
3303
+ "grad_norm": 0.9159242510795593,
3304
+ "learning_rate": 0.00010292185024543543,
3305
+ "loss": 1.4668,
3306
+ "step": 19200
3307
+ },
3308
+ {
3309
+ "epoch": 1.480655334205061,
3310
+ "grad_norm": 3.47868013381958,
3311
+ "learning_rate": 0.00010266213022361894,
3312
+ "loss": 1.493,
3313
+ "step": 19250
3314
+ },
3315
+ {
3316
+ "epoch": 1.480655334205061,
3317
+ "eval_loss": 1.4858986139297485,
3318
+ "eval_runtime": 17.7738,
3319
+ "eval_samples_per_second": 56.263,
3320
+ "eval_steps_per_second": 14.066,
3321
+ "step": 19250
3322
+ },
3323
+ {
3324
+ "epoch": 1.4845011922159834,
3325
+ "grad_norm": 1.467437505722046,
3326
+ "learning_rate": 0.00010240241020180246,
3327
+ "loss": 1.4639,
3328
+ "step": 19300
3329
+ },
3330
+ {
3331
+ "epoch": 1.4883470502269056,
3332
+ "grad_norm": 1.2710049152374268,
3333
+ "learning_rate": 0.00010214269017998598,
3334
+ "loss": 1.4244,
3335
+ "step": 19350
3336
+ },
3337
+ {
3338
+ "epoch": 1.4921929082378278,
3339
+ "grad_norm": 2.0059661865234375,
3340
+ "learning_rate": 0.0001018829701581695,
3341
+ "loss": 1.4258,
3342
+ "step": 19400
3343
+ },
3344
+ {
3345
+ "epoch": 1.4960387662487502,
3346
+ "grad_norm": 1.7536308765411377,
3347
+ "learning_rate": 0.00010162325013635301,
3348
+ "loss": 1.396,
3349
+ "step": 19450
3350
+ },
3351
+ {
3352
+ "epoch": 1.4998846242596724,
3353
+ "grad_norm": 0.9684279561042786,
3354
+ "learning_rate": 0.00010136353011453655,
3355
+ "loss": 1.4598,
3356
+ "step": 19500
3357
+ },
3358
+ {
3359
+ "epoch": 1.4998846242596724,
3360
+ "eval_loss": 1.4841110706329346,
3361
+ "eval_runtime": 17.9151,
3362
+ "eval_samples_per_second": 55.819,
3363
+ "eval_steps_per_second": 13.955,
3364
+ "step": 19500
3365
  }
3366
  ],
3367
  "logging_steps": 50,