rootxhacker commited on
Commit
bb99f2e
·
verified ·
1 Parent(s): 29e4604

Training in progress, step 2500, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:37e7ac0622b34136a1adc5dda670dd8f06fe9699327bbef64e2b847e41d62d45
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e10a7c8bb0d516328a4f08fb821bc0e53102e1b0a0d8ea1d6c8cc3bce9dca90
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8d5aaec88b2f521c4d19280ee5a843dca115995f362a0926fa7ff5637694cc6d
3
  size 1736
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fdb38bb607b4da045b51a34cfbf7428a4bf481a4b7dcfcd083d72647f444c879
3
  size 1736
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bc0f99b2f4c37e6bd3da61564f89d37dedf31c888089686d20000b137615abc8
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d026d37c2efc698996a40494d349ec54a4ff40c81599ec63f15410e52a0e87f
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4da9c3920b2d28ca98d344913f643342e405b080bfc26edfe880e644c5be7370
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:100aab8649e7180e1ab3ef8feaab197f99e31e9f728f5189c5431d80dbc2eacd
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:43c2f44953ece167e5bd34ec80ca4bdfcda9e945ce63675d98939409afdb1cb3
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:996af29fdb07e722f1f70dd9ba54354e5a4baf4f673aef8bef5139d74d107a73
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:951a13f6b06bce52a2ba9f7d2d8f60254ac5cc4c021e67355429cc5c41426dfb
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d57c57de49427b666f955c0cc0173da1ca9651de809c40ac268e017db320996
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 2000,
3
- "best_metric": 1.60262131690979,
4
- "best_model_checkpoint": "./ar-diffusion-checkpoints-progressive-attention/checkpoint-2000",
5
- "epoch": 0.15383432043688947,
6
  "eval_steps": 250,
7
- "global_step": 2000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -352,6 +352,92 @@
352
  "eval_samples_per_second": 59.349,
353
  "eval_steps_per_second": 14.837,
354
  "step": 2000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
355
  }
356
  ],
357
  "logging_steps": 50,
 
1
  {
2
+ "best_global_step": 2500,
3
+ "best_metric": 1.5644338130950928,
4
+ "best_model_checkpoint": "./ar-diffusion-checkpoints-progressive-attention/checkpoint-2500",
5
+ "epoch": 0.19229290054611184,
6
  "eval_steps": 250,
7
+ "global_step": 2500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
352
  "eval_samples_per_second": 59.349,
353
  "eval_steps_per_second": 14.837,
354
  "step": 2000
355
+ },
356
+ {
357
+ "epoch": 0.1576801784478117,
358
+ "grad_norm": 0.8268172740936279,
359
+ "learning_rate": 0.0001919746513258707,
360
+ "loss": 1.6329,
361
+ "step": 2050
362
+ },
363
+ {
364
+ "epoch": 0.16152603645873395,
365
+ "grad_norm": 1.3260400295257568,
366
+ "learning_rate": 0.00019171493130405425,
367
+ "loss": 1.6029,
368
+ "step": 2100
369
+ },
370
+ {
371
+ "epoch": 0.16537189446965617,
372
+ "grad_norm": 1.9381955862045288,
373
+ "learning_rate": 0.00019145521128223776,
374
+ "loss": 1.5311,
375
+ "step": 2150
376
+ },
377
+ {
378
+ "epoch": 0.1692177524805784,
379
+ "grad_norm": 1.0509984493255615,
380
+ "learning_rate": 0.00019119549126042127,
381
+ "loss": 1.5224,
382
+ "step": 2200
383
+ },
384
+ {
385
+ "epoch": 0.17306361049150065,
386
+ "grad_norm": 0.8311214447021484,
387
+ "learning_rate": 0.0001909357712386048,
388
+ "loss": 1.5033,
389
+ "step": 2250
390
+ },
391
+ {
392
+ "epoch": 0.17306361049150065,
393
+ "eval_loss": 1.5902116298675537,
394
+ "eval_runtime": 16.992,
395
+ "eval_samples_per_second": 58.851,
396
+ "eval_steps_per_second": 14.713,
397
+ "step": 2250
398
+ },
399
+ {
400
+ "epoch": 0.1769094685024229,
401
+ "grad_norm": 1.4311176538467407,
402
+ "learning_rate": 0.0001906760512167883,
403
+ "loss": 1.6188,
404
+ "step": 2300
405
+ },
406
+ {
407
+ "epoch": 0.18075532651334514,
408
+ "grad_norm": 1.2279688119888306,
409
+ "learning_rate": 0.0001904163311949718,
410
+ "loss": 1.5018,
411
+ "step": 2350
412
+ },
413
+ {
414
+ "epoch": 0.18460118452426735,
415
+ "grad_norm": 1.7099772691726685,
416
+ "learning_rate": 0.00019015661117315535,
417
+ "loss": 1.5609,
418
+ "step": 2400
419
+ },
420
+ {
421
+ "epoch": 0.1884470425351896,
422
+ "grad_norm": 1.3446159362792969,
423
+ "learning_rate": 0.00018989689115133887,
424
+ "loss": 1.6171,
425
+ "step": 2450
426
+ },
427
+ {
428
+ "epoch": 0.19229290054611184,
429
+ "grad_norm": 1.4243688583374023,
430
+ "learning_rate": 0.00018963717112952238,
431
+ "loss": 1.5512,
432
+ "step": 2500
433
+ },
434
+ {
435
+ "epoch": 0.19229290054611184,
436
+ "eval_loss": 1.5644338130950928,
437
+ "eval_runtime": 16.8277,
438
+ "eval_samples_per_second": 59.426,
439
+ "eval_steps_per_second": 14.856,
440
+ "step": 2500
441
  }
442
  ],
443
  "logging_steps": 50,