rootxhacker commited on
Commit
e460a2c
·
verified ·
1 Parent(s): 5f18928

Training in progress, step 6000, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:97249c47c6b32ef65b151737e7f96c260e5a23f9fbe742a453b5f4d81d690726
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:436b6e968fb5604005fd81ad87662f85c94593110929c806420ee474d7f3d4b3
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f4be1866ad2b89ce10f9d86783f55773d8feaaccbe73932e4a09243f667cbcc5
3
  size 1544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb28ed3ffec69fef5de4a3f116c672c7bdb8dcd8d1d63a0a351fcf8d1d424c2d
3
  size 1544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:62aa10d649cc73207a70cc479a1f297dd3d4ee8f4046bf419864ec2fcc09094e
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee9b798a96c2e7a3a2a1ab191f1fff2b3926ef156d5382c2afa2a8f948173117
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:452f9d1449e365d91136837164af087a289325b1bf94b381d6eeb9d18ffa0513
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12c22be93200b6ea29a5a43fdc896fd16b0e2c374bfcbb275fb907bb85c40cd3
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:91bbcbbac469a768b1f8fb700c511addacfb7e81974f1cc808de5a03588fc9f9
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b6618d641c818c3995a5b603cd6e606d1c4f3e865f138e046dbb16cc25967da
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:66663104f3ba703edc4ec090a0702d7a9699150cb3c08b7ab9b0c3768767d04b
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3428e4135cd17a5056c02e50b97a6e67b768ec92eede0a8846febe18ebcfa82
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 5000,
3
  "best_metric": 4.465761661529541,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-5000",
5
- "epoch": 0.42304438120144605,
6
  "eval_steps": 250,
7
- "global_step": 5500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -954,6 +954,92 @@
954
  "eval_samples_per_second": 53.707,
955
  "eval_steps_per_second": 13.427,
956
  "step": 5500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
957
  }
958
  ],
959
  "logging_steps": 50,
 
2
  "best_global_step": 5000,
3
  "best_metric": 4.465761661529541,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-5000",
5
+ "epoch": 0.4615029613106684,
6
  "eval_steps": 250,
7
+ "global_step": 6000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
954
  "eval_samples_per_second": 53.707,
955
  "eval_steps_per_second": 13.427,
956
  "step": 5500
957
+ },
958
+ {
959
+ "epoch": 0.4268902392123683,
960
+ "grad_norm": 4.2113752365112305,
961
+ "learning_rate": 0.00017380983300002597,
962
+ "loss": 4.5454,
963
+ "step": 5550
964
+ },
965
+ {
966
+ "epoch": 0.43073609722329054,
967
+ "grad_norm": 4.782048225402832,
968
+ "learning_rate": 0.0001735501129782095,
969
+ "loss": 4.4705,
970
+ "step": 5600
971
+ },
972
+ {
973
+ "epoch": 0.4345819552342128,
974
+ "grad_norm": 2.6753036975860596,
975
+ "learning_rate": 0.00017329039295639303,
976
+ "loss": 4.4592,
977
+ "step": 5650
978
+ },
979
+ {
980
+ "epoch": 0.43842781324513497,
981
+ "grad_norm": 5.012415885925293,
982
+ "learning_rate": 0.00017303067293457654,
983
+ "loss": 4.623,
984
+ "step": 5700
985
+ },
986
+ {
987
+ "epoch": 0.4422736712560572,
988
+ "grad_norm": 3.0666699409484863,
989
+ "learning_rate": 0.00017277095291276005,
990
+ "loss": 4.4325,
991
+ "step": 5750
992
+ },
993
+ {
994
+ "epoch": 0.4422736712560572,
995
+ "eval_loss": 4.489352703094482,
996
+ "eval_runtime": 18.4948,
997
+ "eval_samples_per_second": 54.069,
998
+ "eval_steps_per_second": 13.517,
999
+ "step": 5750
1000
+ },
1001
+ {
1002
+ "epoch": 0.44611952926697945,
1003
+ "grad_norm": 6.8570876121521,
1004
+ "learning_rate": 0.00017251123289094357,
1005
+ "loss": 4.5179,
1006
+ "step": 5800
1007
+ },
1008
+ {
1009
+ "epoch": 0.4499653872779017,
1010
+ "grad_norm": 7.190755844116211,
1011
+ "learning_rate": 0.00017225151286912708,
1012
+ "loss": 4.5877,
1013
+ "step": 5850
1014
+ },
1015
+ {
1016
+ "epoch": 0.45381124528882394,
1017
+ "grad_norm": 4.404886722564697,
1018
+ "learning_rate": 0.00017199179284731062,
1019
+ "loss": 4.4072,
1020
+ "step": 5900
1021
+ },
1022
+ {
1023
+ "epoch": 0.4576571032997462,
1024
+ "grad_norm": 3.0543084144592285,
1025
+ "learning_rate": 0.00017173207282549413,
1026
+ "loss": 4.4656,
1027
+ "step": 5950
1028
+ },
1029
+ {
1030
+ "epoch": 0.4615029613106684,
1031
+ "grad_norm": 6.7454514503479,
1032
+ "learning_rate": 0.00017147235280367764,
1033
+ "loss": 4.5688,
1034
+ "step": 6000
1035
+ },
1036
+ {
1037
+ "epoch": 0.4615029613106684,
1038
+ "eval_loss": 4.480144023895264,
1039
+ "eval_runtime": 18.5584,
1040
+ "eval_samples_per_second": 53.884,
1041
+ "eval_steps_per_second": 13.471,
1042
+ "step": 6000
1043
  }
1044
  ],
1045
  "logging_steps": 50,