rootxhacker commited on
Commit
97a6581
·
verified ·
1 Parent(s): 8ea3bcb

Training in progress, step 6500, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:436b6e968fb5604005fd81ad87662f85c94593110929c806420ee474d7f3d4b3
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df74840f90de2e67e9907cab52791a6dd441f2b7df4dee24f3d27614fb7c4e81
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cb28ed3ffec69fef5de4a3f116c672c7bdb8dcd8d1d63a0a351fcf8d1d424c2d
3
  size 1544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35f6e0128f9fd6473636f2b7fa321fba2a34670190a7fcccacc9997f0e6e3efd
3
  size 1544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ee9b798a96c2e7a3a2a1ab191f1fff2b3926ef156d5382c2afa2a8f948173117
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e91da0cfbee4e888038757b7189ea413722951a4530435531acf1f53d94aedfd
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:12c22be93200b6ea29a5a43fdc896fd16b0e2c374bfcbb275fb907bb85c40cd3
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44c02dc0791054ba042a754ce4b193305b8c58f3c6ec32c6d59f64ae1e19274a
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4b6618d641c818c3995a5b603cd6e606d1c4f3e865f138e046dbb16cc25967da
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96851dceb7a310a70f7ecfde20fb5205a7253860759d2b8ce0924be746e3091f
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e3428e4135cd17a5056c02e50b97a6e67b768ec92eede0a8846febe18ebcfa82
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18b7addcef54bd827fd6d26a7fd7e8fd6d6f1182cd34f05f02a7c070592639be
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 5000,
3
  "best_metric": 4.465761661529541,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-5000",
5
- "epoch": 0.4615029613106684,
6
  "eval_steps": 250,
7
- "global_step": 6000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -1040,6 +1040,92 @@
1040
  "eval_samples_per_second": 53.884,
1041
  "eval_steps_per_second": 13.471,
1042
  "step": 6000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1043
  }
1044
  ],
1045
  "logging_steps": 50,
 
2
  "best_global_step": 5000,
3
  "best_metric": 4.465761661529541,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-5000",
5
+ "epoch": 0.4999615414198908,
6
  "eval_steps": 250,
7
+ "global_step": 6500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
1040
  "eval_samples_per_second": 53.884,
1041
  "eval_steps_per_second": 13.471,
1042
  "step": 6000
1043
+ },
1044
+ {
1045
+ "epoch": 0.46534881932159067,
1046
+ "grad_norm": 5.5196661949157715,
1047
+ "learning_rate": 0.00017121263278186118,
1048
+ "loss": 4.5703,
1049
+ "step": 6050
1050
+ },
1051
+ {
1052
+ "epoch": 0.4691946773325129,
1053
+ "grad_norm": 4.253966331481934,
1054
+ "learning_rate": 0.00017095291276004467,
1055
+ "loss": 4.6012,
1056
+ "step": 6100
1057
+ },
1058
+ {
1059
+ "epoch": 0.4730405353434351,
1060
+ "grad_norm": 2.459376096725464,
1061
+ "learning_rate": 0.00017069319273822818,
1062
+ "loss": 4.5002,
1063
+ "step": 6150
1064
+ },
1065
+ {
1066
+ "epoch": 0.47688639335435734,
1067
+ "grad_norm": 4.933450698852539,
1068
+ "learning_rate": 0.00017043347271641172,
1069
+ "loss": 4.5703,
1070
+ "step": 6200
1071
+ },
1072
+ {
1073
+ "epoch": 0.4807322513652796,
1074
+ "grad_norm": 4.511186599731445,
1075
+ "learning_rate": 0.00017017375269459524,
1076
+ "loss": 4.4665,
1077
+ "step": 6250
1078
+ },
1079
+ {
1080
+ "epoch": 0.4807322513652796,
1081
+ "eval_loss": 4.485811233520508,
1082
+ "eval_runtime": 18.522,
1083
+ "eval_samples_per_second": 53.99,
1084
+ "eval_steps_per_second": 13.497,
1085
+ "step": 6250
1086
+ },
1087
+ {
1088
+ "epoch": 0.4845781093762018,
1089
+ "grad_norm": 5.634074687957764,
1090
+ "learning_rate": 0.00016991403267277875,
1091
+ "loss": 4.4616,
1092
+ "step": 6300
1093
+ },
1094
+ {
1095
+ "epoch": 0.48842396738712407,
1096
+ "grad_norm": 3.319650650024414,
1097
+ "learning_rate": 0.0001696543126509623,
1098
+ "loss": 4.4836,
1099
+ "step": 6350
1100
+ },
1101
+ {
1102
+ "epoch": 0.4922698253980463,
1103
+ "grad_norm": 3.306976079940796,
1104
+ "learning_rate": 0.00016939459262914577,
1105
+ "loss": 4.5256,
1106
+ "step": 6400
1107
+ },
1108
+ {
1109
+ "epoch": 0.49611568340896856,
1110
+ "grad_norm": 4.1797308921813965,
1111
+ "learning_rate": 0.0001691348726073293,
1112
+ "loss": 4.3822,
1113
+ "step": 6450
1114
+ },
1115
+ {
1116
+ "epoch": 0.4999615414198908,
1117
+ "grad_norm": 3.2349929809570312,
1118
+ "learning_rate": 0.00016887515258551283,
1119
+ "loss": 4.4384,
1120
+ "step": 6500
1121
+ },
1122
+ {
1123
+ "epoch": 0.4999615414198908,
1124
+ "eval_loss": 4.485826015472412,
1125
+ "eval_runtime": 18.614,
1126
+ "eval_samples_per_second": 53.723,
1127
+ "eval_steps_per_second": 13.431,
1128
+ "step": 6500
1129
  }
1130
  ],
1131
  "logging_steps": 50,