Transformers
PyTorch
English
pixel
pretraining
plip commited on
Commit
ded1b5a
·
1 Parent(s): 2bf164d

Training in progress, step 180000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6f9a70132918b6ab165a91d577d712613356dca52075d5c7c05f34314005b476
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f5acc2861e7396e81698a045ce779c528c1589b7b78bde65686da82c4408ddb
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:04e4608999d97a58a30e39361b70b419f5aef3e2535ed3ca55c26e98dfa526a2
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d48649d1b881cb101c25c27c14decb38dce780e3aea5787ee35216eccf1c8fd9
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ef92b44093f62f1441b173acbe3fd1139e94c5c223ed6a54381a9d3cb2f5c022
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd995b6d6c5baa6e5ed73d97b87a49724ad2e0d0f8e35c78d6e562318a4660ea
3
  size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:161efcaf59347006251947d35ba8e577aead293e95ee199281ec31fb424a8671
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6650ce86ed3c7c5c7fbe55b75f320b30724b552ef56b063389bed584cfcfd3a4
3
+ size 14439
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a5b4db0eb85867b5e22ab5799a8329f0f5930ac32c5205c1b81fbef9bb0ad0ab
3
- size 14439
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca377902b93ec16a61eb5ef6b00da3d0b2f00ee9310c5dd7863b3027def19ecc
3
+ size 14503
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed9a9a05da89d28b0f8404cc60f79e71945e2a52c47886846fb03eae29b9b7e7
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0979b9f8cf08248ef7cf31dc7f9e5488be3d1a638741d1d3e358d69c0f25d13d
3
  size 14503
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7e6e6dbb6845e268a54a5a558c86918603b34b6bae9a32a1510a924b34f03635
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdbc1873940bd05dec6fa8ddeee78ddbd4cf0afa60b7658d7e729096721589da
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.59593507108281,
5
- "global_step": 170000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -1264,11 +1264,85 @@
1264
  "eval_samples_per_second": 850.656,
1265
  "eval_steps_per_second": 13.611,
1266
  "step": 170000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1267
  }
1268
  ],
1269
  "max_steps": 1000000,
1270
  "num_train_epochs": 16,
1271
- "total_flos": 1.191703123379604e+22,
1272
  "trial_name": null,
1273
  "trial_params": null
1274
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.7486371340876814,
5
+ "global_step": 180000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
1264
  "eval_samples_per_second": 850.656,
1265
  "eval_steps_per_second": 13.611,
1266
  "step": 170000
1267
+ },
1268
+ {
1269
+ "epoch": 2.61,
1270
+ "learning_rate": 0.00014447046094149437,
1271
+ "loss": 0.3221,
1272
+ "step": 171000
1273
+ },
1274
+ {
1275
+ "epoch": 2.63,
1276
+ "learning_rate": 0.00014437993399594003,
1277
+ "loss": 0.3216,
1278
+ "step": 172000
1279
+ },
1280
+ {
1281
+ "epoch": 2.64,
1282
+ "learning_rate": 0.0001442887030017421,
1283
+ "loss": 0.3217,
1284
+ "step": 173000
1285
+ },
1286
+ {
1287
+ "epoch": 2.66,
1288
+ "learning_rate": 0.00014419676895658807,
1289
+ "loss": 0.3208,
1290
+ "step": 174000
1291
+ },
1292
+ {
1293
+ "epoch": 2.67,
1294
+ "learning_rate": 0.000144104132865854,
1295
+ "loss": 0.3207,
1296
+ "step": 175000
1297
+ },
1298
+ {
1299
+ "epoch": 2.67,
1300
+ "eval_runtime": 1.0679,
1301
+ "eval_samples_per_second": 936.423,
1302
+ "eval_steps_per_second": 14.983,
1303
+ "step": 175000
1304
+ },
1305
+ {
1306
+ "epoch": 2.69,
1307
+ "learning_rate": 0.0001440107957425933,
1308
+ "loss": 0.3203,
1309
+ "step": 176000
1310
+ },
1311
+ {
1312
+ "epoch": 2.7,
1313
+ "learning_rate": 0.0001439167586075258,
1314
+ "loss": 0.3201,
1315
+ "step": 177000
1316
+ },
1317
+ {
1318
+ "epoch": 2.72,
1319
+ "learning_rate": 0.0001438220224890265,
1320
+ "loss": 0.3191,
1321
+ "step": 178000
1322
+ },
1323
+ {
1324
+ "epoch": 2.73,
1325
+ "learning_rate": 0.00014372658842311449,
1326
+ "loss": 0.3195,
1327
+ "step": 179000
1328
+ },
1329
+ {
1330
+ "epoch": 2.75,
1331
+ "learning_rate": 0.00014363045745344137,
1332
+ "loss": 0.3191,
1333
+ "step": 180000
1334
+ },
1335
+ {
1336
+ "epoch": 2.75,
1337
+ "eval_runtime": 1.0169,
1338
+ "eval_samples_per_second": 983.42,
1339
+ "eval_steps_per_second": 15.735,
1340
+ "step": 180000
1341
  }
1342
  ],
1343
  "max_steps": 1000000,
1344
  "num_train_epochs": 16,
1345
+ "total_flos": 1.261803384409951e+22,
1346
  "trial_name": null,
1347
  "trial_params": null
1348
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:04e4608999d97a58a30e39361b70b419f5aef3e2535ed3ca55c26e98dfa526a2
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d48649d1b881cb101c25c27c14decb38dce780e3aea5787ee35216eccf1c8fd9
3
  size 449471589