rootxhacker commited on
Commit
81327e1
·
verified ·
1 Parent(s): c905b03

Training in progress, step 13500, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e2d7fcaf2efe42ffb5f3c9e028de2d4020155b47fd00969c045a7b96f9a500e0
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:474b67c549b3ac63215af64bfd5c3e231be24980b37242c9f744a9bc612f0008
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:828b8db8ad6923c1cf715c1424f34fe8d45d1942c07709d2ed3e3b91c7b41825
3
  size 1544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0480e511efe20f590b2d821022731b40382edf3655bca705228ed05b63128830
3
  size 1544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:81731a2aece3051885d7289cef2d696a33b091ba71fd2ad97dba80506614db51
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1a8b91d626d80e48ce9e4448a6fbe135ae118d67810182f7182aa5d1211e998
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dbf8948534182fde8a4da31776a53cc78337e1e18ed4b526e2ee8ca99eff5731
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81ec269cbd23a3955804ddaef963a9e0d68f2087a109e239da5baed50032493e
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d1a2f8fe642f01391ef2e54fcf96a41d1f8399b7293ea1f181058d0539b5b33d
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b7a18a05122b0a199bfed591a89a0565feeaa299af76bd8309bbdc13d5d6b59
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:69b23dccdca16565cb13b99c2e00b6827579e6c2cc8759c8f2106a0579d096c8
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba4610d4a5272883eace09557947e58aa9c641822afa7ad93c2a7f7af7024f8b
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 13000,
3
  "best_metric": 1.5119102001190186,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-13000",
5
- "epoch": 0.9999230828397816,
6
  "eval_steps": 250,
7
- "global_step": 13000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -2244,6 +2244,92 @@
2244
  "eval_samples_per_second": 56.404,
2245
  "eval_steps_per_second": 14.101,
2246
  "step": 13000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2247
  }
2248
  ],
2249
  "logging_steps": 50,
 
2
  "best_global_step": 13000,
3
  "best_metric": 1.5119102001190186,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-13000",
5
+ "epoch": 1.038381662949004,
6
  "eval_steps": 250,
7
+ "global_step": 13500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
2244
  "eval_samples_per_second": 56.404,
2245
  "eval_steps_per_second": 14.101,
2246
  "step": 13000
2247
+ },
2248
+ {
2249
+ "epoch": 1.0037689408507038,
2250
+ "grad_norm": 1.4789248704910278,
2251
+ "learning_rate": 0.00013486221852842636,
2252
+ "loss": 1.4551,
2253
+ "step": 13050
2254
+ },
2255
+ {
2256
+ "epoch": 1.007614798861626,
2257
+ "grad_norm": 1.3270663022994995,
2258
+ "learning_rate": 0.00013460249850660988,
2259
+ "loss": 1.4776,
2260
+ "step": 13100
2261
+ },
2262
+ {
2263
+ "epoch": 1.0114606568725482,
2264
+ "grad_norm": 1.3546854257583618,
2265
+ "learning_rate": 0.0001343427784847934,
2266
+ "loss": 1.5807,
2267
+ "step": 13150
2268
+ },
2269
+ {
2270
+ "epoch": 1.0153065148834706,
2271
+ "grad_norm": 1.303915023803711,
2272
+ "learning_rate": 0.0001340830584629769,
2273
+ "loss": 1.4309,
2274
+ "step": 13200
2275
+ },
2276
+ {
2277
+ "epoch": 1.0191523728943928,
2278
+ "grad_norm": 0.8854748606681824,
2279
+ "learning_rate": 0.00013382333844116044,
2280
+ "loss": 1.4395,
2281
+ "step": 13250
2282
+ },
2283
+ {
2284
+ "epoch": 1.0191523728943928,
2285
+ "eval_loss": 1.5238608121871948,
2286
+ "eval_runtime": 17.7588,
2287
+ "eval_samples_per_second": 56.31,
2288
+ "eval_steps_per_second": 14.077,
2289
+ "step": 13250
2290
+ },
2291
+ {
2292
+ "epoch": 1.022998230905315,
2293
+ "grad_norm": 1.5649653673171997,
2294
+ "learning_rate": 0.00013356361841934395,
2295
+ "loss": 1.5022,
2296
+ "step": 13300
2297
+ },
2298
+ {
2299
+ "epoch": 1.0268440889162371,
2300
+ "grad_norm": 1.6031616926193237,
2301
+ "learning_rate": 0.0001333038983975275,
2302
+ "loss": 1.4315,
2303
+ "step": 13350
2304
+ },
2305
+ {
2306
+ "epoch": 1.0306899469271595,
2307
+ "grad_norm": 1.3788844347000122,
2308
+ "learning_rate": 0.00013304417837571098,
2309
+ "loss": 1.578,
2310
+ "step": 13400
2311
+ },
2312
+ {
2313
+ "epoch": 1.0345358049380817,
2314
+ "grad_norm": 1.4347171783447266,
2315
+ "learning_rate": 0.0001327844583538945,
2316
+ "loss": 1.3993,
2317
+ "step": 13450
2318
+ },
2319
+ {
2320
+ "epoch": 1.038381662949004,
2321
+ "grad_norm": 1.9777193069458008,
2322
+ "learning_rate": 0.00013252473833207803,
2323
+ "loss": 1.4331,
2324
+ "step": 13500
2325
+ },
2326
+ {
2327
+ "epoch": 1.038381662949004,
2328
+ "eval_loss": 1.5231057405471802,
2329
+ "eval_runtime": 17.8114,
2330
+ "eval_samples_per_second": 56.144,
2331
+ "eval_steps_per_second": 14.036,
2332
+ "step": 13500
2333
  }
2334
  ],
2335
  "logging_steps": 50,