Transformers
PyTorch
English
pixel
pretraining
plip commited on
Commit
9bc180e
·
1 Parent(s): 56aeb80

Training in progress, step 830000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ece7b379c7a5a58ecf06bad11ca4cf9bd52de11683f133c698a0cd46d58e7f3f
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d676bdecf6cef07d6d1557838930ff920f76201e2414575a644361d9ebd0ca5
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:83c02b97525bdc0170d693b11906b5064b3417228255adea84f3fccd20f429d1
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c181b3b0e0340fe0f0c6e90ca26f9e2021277f659fa06f6c810cab95d243c9f
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:471be9073ca16931b802d54b255e23b3102b1be6c0e243832ecda5d9de213243
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10fb0b6575db7cc3fd463d26671f67a57f4c817b1f162f6dd70df0ba155fea6a
3
  size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c26d9707c692819517328265ab4fd028c1ec91f8e531a3899c963382192856e1
3
- size 14567
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b966173ec2647fe3f9ce64251f9ba275015c518c4e11801d8a5787cb53077e4
3
+ size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2f7ef808d3e0c55b070bb63a51ac31108dc6594c932f2329575c64f0ec5d34a6
3
- size 14439
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:626675f0b56b6320753b402844bd4c05cb33ef3bdd886b37ae3b7133c13f9441
3
+ size 14503
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3915824192442b74d4af5e3ad4160d4a09adeeec3fcac9fa02d181a6969e8279
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25a0cb16e446a0582e61cafe4a89816af44798dc1964f3425f293eb3e6cf9c2b
3
  size 14503
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c63a65d51252613e1cd5f3ab255f2a8e56d55631776ee22be37789c5802ebbf2
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b44f4d1ea700e774f5dee0343ba4324675c77c29852dd54fec6a281d849ccd3b
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 12.521569166399438,
5
- "global_step": 820000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -6074,11 +6074,85 @@
6074
  "eval_samples_per_second": 1609.99,
6075
  "eval_steps_per_second": 25.76,
6076
  "step": 820000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6077
  }
6078
  ],
6079
  "max_steps": 1000000,
6080
  "num_train_epochs": 16,
6081
- "total_flos": 5.748213519670681e+22,
6082
  "trial_name": null,
6083
  "trial_params": null
6084
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 12.67427122940431,
5
+ "global_step": 830000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
6074
  "eval_samples_per_second": 1609.99,
6075
  "eval_steps_per_second": 25.76,
6076
  "step": 820000
6077
+ },
6078
+ {
6079
+ "epoch": 12.54,
6080
+ "learning_rate": 2.1909901420919184e-05,
6081
+ "loss": 0.2351,
6082
+ "step": 821000
6083
+ },
6084
+ {
6085
+ "epoch": 12.55,
6086
+ "learning_rate": 2.1781056286210997e-05,
6087
+ "loss": 0.235,
6088
+ "step": 822000
6089
+ },
6090
+ {
6091
+ "epoch": 12.57,
6092
+ "learning_rate": 2.1652847824543744e-05,
6093
+ "loss": 0.2347,
6094
+ "step": 823000
6095
+ },
6096
+ {
6097
+ "epoch": 12.58,
6098
+ "learning_rate": 2.1525277437984636e-05,
6099
+ "loss": 0.2348,
6100
+ "step": 824000
6101
+ },
6102
+ {
6103
+ "epoch": 12.6,
6104
+ "learning_rate": 2.1398346521623e-05,
6105
+ "loss": 0.2345,
6106
+ "step": 825000
6107
+ },
6108
+ {
6109
+ "epoch": 12.6,
6110
+ "eval_runtime": 0.7605,
6111
+ "eval_samples_per_second": 1314.934,
6112
+ "eval_steps_per_second": 21.039,
6113
+ "step": 825000
6114
+ },
6115
+ {
6116
+ "epoch": 12.61,
6117
+ "learning_rate": 2.1272056463554978e-05,
6118
+ "loss": 0.2343,
6119
+ "step": 826000
6120
+ },
6121
+ {
6122
+ "epoch": 12.63,
6123
+ "learning_rate": 2.114640864486845e-05,
6124
+ "loss": 0.2346,
6125
+ "step": 827000
6126
+ },
6127
+ {
6128
+ "epoch": 12.64,
6129
+ "learning_rate": 2.1021404439627775e-05,
6130
+ "loss": 0.2344,
6131
+ "step": 828000
6132
+ },
6133
+ {
6134
+ "epoch": 12.66,
6135
+ "learning_rate": 2.089704521485896e-05,
6136
+ "loss": 0.2344,
6137
+ "step": 829000
6138
+ },
6139
+ {
6140
+ "epoch": 12.67,
6141
+ "learning_rate": 2.0773332330534513e-05,
6142
+ "loss": 0.2343,
6143
+ "step": 830000
6144
+ },
6145
+ {
6146
+ "epoch": 12.67,
6147
+ "eval_runtime": 0.7327,
6148
+ "eval_samples_per_second": 1364.889,
6149
+ "eval_steps_per_second": 21.838,
6150
+ "step": 830000
6151
  }
6152
  ],
6153
  "max_steps": 1000000,
6154
  "num_train_epochs": 16,
6155
+ "total_flos": 5.818313780701028e+22,
6156
  "trial_name": null,
6157
  "trial_params": null
6158
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:83c02b97525bdc0170d693b11906b5064b3417228255adea84f3fccd20f429d1
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c181b3b0e0340fe0f0c6e90ca26f9e2021277f659fa06f6c810cab95d243c9f
3
  size 449471589