rootxhacker commited on
Commit
bda29c9
·
verified ·
1 Parent(s): 314beaf

Training in progress, step 2500, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5284a72c66df303e073df72ce9f1ae1e29ea633668e40d9822a8ccaa64add555
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2b4cbe8b1b80bab80643ae95440812326a8a6e7bccc79e0f31fd0b001f92483
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e8358e2ab5d7859161edb7560d72769c1dccae73dcd94f8bb280a6f4c6a418e5
3
  size 1544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:683cb6e78851437b6d551b60a7733fd0cf8a96582a781e0a27157158ccd47347
3
  size 1544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b7c9308b4bec49af406c284201ce7a6649c508431fa62b7fd440c998b6a016ca
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:142ce534c6cf070debd44d21ea1fe5c477f0438570d559dbda8928fe80687677
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2512ba1bd332fd1303d75224b66504a865cf77c5c151bdcdfcda52c23dbe2db6
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74818f2f3daacf3c0fca3dde38a211872e713dacdefaa18d7435559b30dc197d
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b71627c700396d7041b5a8f195ae9cbb8512fe53c30c6da53a207b7194343ba8
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21c1bf6c47692563bb8660483ef35d0f3e0d75e9fd318c04f77453b710e51e5c
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2d83848f1b1bfd2394c14189ddfec57565343ac6855bbb1685fedf0549ec3643
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eeeb94e0675525b5bb02698eb79efe748a90c2efeae2eda028133bdd4c5927c0
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 2000,
3
- "best_metric": 4.666446208953857,
4
- "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-2000",
5
- "epoch": 0.15383432043688947,
6
  "eval_steps": 250,
7
- "global_step": 2000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -352,6 +352,92 @@
352
  "eval_samples_per_second": 54.414,
353
  "eval_steps_per_second": 13.604,
354
  "step": 2000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
355
  }
356
  ],
357
  "logging_steps": 50,
 
1
  {
2
+ "best_global_step": 2500,
3
+ "best_metric": 4.597048282623291,
4
+ "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-2500",
5
+ "epoch": 0.19229290054611184,
6
  "eval_steps": 250,
7
+ "global_step": 2500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
352
  "eval_samples_per_second": 54.414,
353
  "eval_steps_per_second": 13.604,
354
  "step": 2000
355
+ },
356
+ {
357
+ "epoch": 0.1576801784478117,
358
+ "grad_norm": 6.46567964553833,
359
+ "learning_rate": 0.00019198504012674338,
360
+ "loss": 4.8124,
361
+ "step": 2050
362
+ },
363
+ {
364
+ "epoch": 0.16152603645873395,
365
+ "grad_norm": 4.300732135772705,
366
+ "learning_rate": 0.0001917253201049269,
367
+ "loss": 4.7302,
368
+ "step": 2100
369
+ },
370
+ {
371
+ "epoch": 0.16537189446965617,
372
+ "grad_norm": 4.140190601348877,
373
+ "learning_rate": 0.0001914656000831104,
374
+ "loss": 4.6498,
375
+ "step": 2150
376
+ },
377
+ {
378
+ "epoch": 0.1692177524805784,
379
+ "grad_norm": 3.221662998199463,
380
+ "learning_rate": 0.00019120588006129395,
381
+ "loss": 4.6428,
382
+ "step": 2200
383
+ },
384
+ {
385
+ "epoch": 0.17306361049150065,
386
+ "grad_norm": 2.6079111099243164,
387
+ "learning_rate": 0.00019094616003947746,
388
+ "loss": 4.6115,
389
+ "step": 2250
390
+ },
391
+ {
392
+ "epoch": 0.17306361049150065,
393
+ "eval_loss": 4.661706924438477,
394
+ "eval_runtime": 18.7413,
395
+ "eval_samples_per_second": 53.358,
396
+ "eval_steps_per_second": 13.34,
397
+ "step": 2250
398
+ },
399
+ {
400
+ "epoch": 0.1769094685024229,
401
+ "grad_norm": 4.190133094787598,
402
+ "learning_rate": 0.00019068644001766095,
403
+ "loss": 4.7041,
404
+ "step": 2300
405
+ },
406
+ {
407
+ "epoch": 0.18075532651334514,
408
+ "grad_norm": 5.242035388946533,
409
+ "learning_rate": 0.0001904267199958445,
410
+ "loss": 4.6656,
411
+ "step": 2350
412
+ },
413
+ {
414
+ "epoch": 0.18460118452426735,
415
+ "grad_norm": 6.203541278839111,
416
+ "learning_rate": 0.000190166999974028,
417
+ "loss": 4.6835,
418
+ "step": 2400
419
+ },
420
+ {
421
+ "epoch": 0.1884470425351896,
422
+ "grad_norm": 2.8591034412384033,
423
+ "learning_rate": 0.00018990727995221151,
424
+ "loss": 4.6751,
425
+ "step": 2450
426
+ },
427
+ {
428
+ "epoch": 0.19229290054611184,
429
+ "grad_norm": 5.204433441162109,
430
+ "learning_rate": 0.00018964755993039505,
431
+ "loss": 4.7301,
432
+ "step": 2500
433
+ },
434
+ {
435
+ "epoch": 0.19229290054611184,
436
+ "eval_loss": 4.597048282623291,
437
+ "eval_runtime": 18.5098,
438
+ "eval_samples_per_second": 54.025,
439
+ "eval_steps_per_second": 13.506,
440
+ "step": 2500
441
  }
442
  ],
443
  "logging_steps": 50,