Transformers
PyTorch
English
pixel
pretraining
plip commited on
Commit
7b801db
·
1 Parent(s): b13ced3

Training in progress, step 200000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a79698e8ce41155df8f2ac96cd99d16ef6b016cb4ff277c5445301a3db1fa101
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67589357f5095310d4686130056aa06ce9ae4e2fa5ce926bd48f51088af92af7
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:16799df5e196079b65225695fe6105fc300cf5157671e1537af93401d1b8d74a
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f8355919230d3848ec5ca15fcb85fb31871fa61b50484347e59854072226bac
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8d372c7ec90718e7e982db780f8d7b62ea26c5068bb213efc91ce4e4dbff2188
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56696dbd8b022c9a375dc483a2ed57d389284babd22e89c40b8de9038eb3703d
3
  size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:200bd99b77ad19fc80e27fc902aca5e36eebe6570a18efbc020b994d75bc6fba
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0c18c513645e98f74c56b9e9e177b503e18704a58f67fc3838ebaa773205ef1
3
  size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c0f78dbe211932d0c37e15c11f906dcb55aae5aedb42250507005f499cf4150e
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7657a362d765d540acd9b7e721a68b7cd2eb75cf243194edc5a268c52185c5f
3
  size 14503
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fb7cd6974be7a03bcf0342d3707956fc7f1e60ef89c3b2bd3445ff8c5a29e4db
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17cd85c4bd32b953041cb6ed12687d174e095b2b2edce062be3f66f2a0041ec7
3
  size 14503
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4347385b2c0f1e2d9aeca7fb88e1c942d1dae99e52563bdfa6c48a7a4a2bf97f
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82157ec414d7845758afa3fc7a8ceafcaf8d618c9a8c5350ea190a69bffb0ab4
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.9013391970925526,
5
- "global_step": 190000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -1412,11 +1412,85 @@
1412
  "eval_samples_per_second": 988.212,
1413
  "eval_steps_per_second": 15.811,
1414
  "step": 190000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1415
  }
1416
  ],
1417
  "max_steps": 1000000,
1418
  "num_train_epochs": 16,
1419
- "total_flos": 1.3319036454402982e+22,
1420
  "trial_name": null,
1421
  "trial_params": null
1422
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 3.054041260097424,
5
+ "global_step": 200000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
1412
  "eval_samples_per_second": 988.212,
1413
  "eval_steps_per_second": 15.811,
1414
  "step": 190000
1415
+ },
1416
+ {
1417
+ "epoch": 2.92,
1418
+ "learning_rate": 0.00014252732722876176,
1419
+ "loss": 0.3149,
1420
+ "step": 191000
1421
+ },
1422
+ {
1423
+ "epoch": 2.93,
1424
+ "learning_rate": 0.0001424229175812373,
1425
+ "loss": 0.3149,
1426
+ "step": 192000
1427
+ },
1428
+ {
1429
+ "epoch": 2.95,
1430
+ "learning_rate": 0.00014231782528668717,
1431
+ "loss": 0.3146,
1432
+ "step": 193000
1433
+ },
1434
+ {
1435
+ "epoch": 2.96,
1436
+ "learning_rate": 0.00014221205149438394,
1437
+ "loss": 0.3145,
1438
+ "step": 194000
1439
+ },
1440
+ {
1441
+ "epoch": 2.98,
1442
+ "learning_rate": 0.0001421055973610528,
1443
+ "loss": 0.3138,
1444
+ "step": 195000
1445
+ },
1446
+ {
1447
+ "epoch": 2.98,
1448
+ "eval_runtime": 1.0908,
1449
+ "eval_samples_per_second": 916.734,
1450
+ "eval_steps_per_second": 14.668,
1451
+ "step": 195000
1452
+ },
1453
+ {
1454
+ "epoch": 2.99,
1455
+ "learning_rate": 0.00014199846405085913,
1456
+ "loss": 0.3137,
1457
+ "step": 196000
1458
+ },
1459
+ {
1460
+ "epoch": 3.01,
1461
+ "learning_rate": 0.00014189065273539564,
1462
+ "loss": 0.3135,
1463
+ "step": 197000
1464
+ },
1465
+ {
1466
+ "epoch": 3.02,
1467
+ "learning_rate": 0.00014178216459366958,
1468
+ "loss": 0.3137,
1469
+ "step": 198000
1470
+ },
1471
+ {
1472
+ "epoch": 3.04,
1473
+ "learning_rate": 0.00014167300081208988,
1474
+ "loss": 0.3131,
1475
+ "step": 199000
1476
+ },
1477
+ {
1478
+ "epoch": 3.05,
1479
+ "learning_rate": 0.00014156316258445421,
1480
+ "loss": 0.3125,
1481
+ "step": 200000
1482
+ },
1483
+ {
1484
+ "epoch": 3.05,
1485
+ "eval_runtime": 1.1346,
1486
+ "eval_samples_per_second": 881.333,
1487
+ "eval_steps_per_second": 14.101,
1488
+ "step": 200000
1489
  }
1490
  ],
1491
  "max_steps": 1000000,
1492
  "num_train_epochs": 16,
1493
+ "total_flos": 1.4020032494024966e+22,
1494
  "trial_name": null,
1495
  "trial_params": null
1496
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:16799df5e196079b65225695fe6105fc300cf5157671e1537af93401d1b8d74a
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f8355919230d3848ec5ca15fcb85fb31871fa61b50484347e59854072226bac
3
  size 449471589