Transformers
PyTorch
English
pixel
pretraining
plip commited on
Commit
812b067
·
1 Parent(s): a2b6150

Training in progress, step 950000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a56a8f0ae8b5b9f2aec995742da47ff25dfe07ebb15ec7ee61db4a763d8289c8
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70e10dc58492fed71483adf6f5b8363903e23bef03e170ace087681ebc08713a
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c00c6557048c11e66b95589de29730bca35a40598e37017f064297cb592c4f93
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b779e5dbc65f9055978747a6483cc3aacc9d67baf238821e25b63cb286556c36
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8e8be78115c1d7a8b7fd3ba012ea9e0890f7c8e7c74970d79909bd336b578ec4
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c593a167703dbaf9947d32973b51a125779553f32e153671a91b63abf7f7876
3
  size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a534ad0e2fa8f314cc3ae9bccc570e59499e6b5c546b12853d32ae75d416e0e6
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3c374b98251ab1768e65aa1b6a7f148a712a2ce1b1f2f903e4af64c54752379
3
  size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a2825291049da8c0b63497c412e6d53ce0d529ebee7d30f4f47c2a1d271fc14d
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:891f782320602223f61f367a6458f228c51432918fe313542e407d34511dfc6d
3
+ size 14567
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:087eacd702285507c39ac952397dc9f6dae700c001504f218d7b716e9f249005
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9286b15801381b7a96fc2895ff30b4645bc69f0722e3eeae374fcb4eb7890f47
3
  size 14503
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3dab84d4b75593cd9349f424c4371ea8ac2493751bc544a294c8ef74a18b08e9
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76d771b6aa86b6db5c1d3a18a5ba01d5f7ff8a339c98c29586734738700dc44c
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 14.353993922457892,
5
- "global_step": 940000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -6962,11 +6962,85 @@
6962
  "eval_samples_per_second": 1269.803,
6963
  "eval_steps_per_second": 20.317,
6964
  "step": 940000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6965
  }
6966
  ],
6967
  "max_steps": 1000000,
6968
  "num_train_epochs": 16,
6969
- "total_flos": 6.589415337898549e+22,
6970
  "trial_name": null,
6971
  "trial_params": null
6972
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 14.506695985462764,
5
+ "global_step": 950000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
6962
  "eval_samples_per_second": 1269.803,
6963
  "eval_steps_per_second": 20.317,
6964
  "step": 940000
6965
+ },
6966
+ {
6967
+ "epoch": 14.37,
6968
+ "learning_rate": 1.1328147928906494e-05,
6969
+ "loss": 0.2287,
6970
+ "step": 941000
6971
+ },
6972
+ {
6973
+ "epoch": 14.38,
6974
+ "learning_rate": 1.1283644453421678e-05,
6975
+ "loss": 0.2289,
6976
+ "step": 942000
6977
+ },
6978
+ {
6979
+ "epoch": 14.4,
6980
+ "learning_rate": 1.1239892448991798e-05,
6981
+ "loss": 0.2284,
6982
+ "step": 943000
6983
+ },
6984
+ {
6985
+ "epoch": 14.42,
6986
+ "learning_rate": 1.1196892394081743e-05,
6987
+ "loss": 0.2287,
6988
+ "step": 944000
6989
+ },
6990
+ {
6991
+ "epoch": 14.43,
6992
+ "learning_rate": 1.1154644758933235e-05,
6993
+ "loss": 0.2285,
6994
+ "step": 945000
6995
+ },
6996
+ {
6997
+ "epoch": 14.43,
6998
+ "eval_runtime": 0.7294,
6999
+ "eval_samples_per_second": 1370.909,
7000
+ "eval_steps_per_second": 21.935,
7001
+ "step": 945000
7002
+ },
7003
+ {
7004
+ "epoch": 14.45,
7005
+ "learning_rate": 1.1113150005559644e-05,
7006
+ "loss": 0.2283,
7007
+ "step": 946000
7008
+ },
7009
+ {
7010
+ "epoch": 14.46,
7011
+ "learning_rate": 1.1072408587740942e-05,
7012
+ "loss": 0.2282,
7013
+ "step": 947000
7014
+ },
7015
+ {
7016
+ "epoch": 14.48,
7017
+ "learning_rate": 1.1032420951018755e-05,
7018
+ "loss": 0.228,
7019
+ "step": 948000
7020
+ },
7021
+ {
7022
+ "epoch": 14.49,
7023
+ "learning_rate": 1.0993187532691458e-05,
7024
+ "loss": 0.2281,
7025
+ "step": 949000
7026
+ },
7027
+ {
7028
+ "epoch": 14.51,
7029
+ "learning_rate": 1.0954708761809438e-05,
7030
+ "loss": 0.2281,
7031
+ "step": 950000
7032
+ },
7033
+ {
7034
+ "epoch": 14.51,
7035
+ "eval_runtime": 0.7692,
7036
+ "eval_samples_per_second": 1300.007,
7037
+ "eval_steps_per_second": 20.8,
7038
+ "step": 950000
7039
  }
7040
  ],
7041
  "max_steps": 1000000,
7042
  "num_train_epochs": 16,
7043
+ "total_flos": 6.659515598928896e+22,
7044
  "trial_name": null,
7045
  "trial_params": null
7046
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c00c6557048c11e66b95589de29730bca35a40598e37017f064297cb592c4f93
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b779e5dbc65f9055978747a6483cc3aacc9d67baf238821e25b63cb286556c36
3
  size 449471589