Transformers
PyTorch
English
pixel
pretraining
plip commited on
Commit
6a33a43
·
1 Parent(s): fa2a4d4

Training in progress, step 700000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:03c116c94691fe83930a5993880bd8c0998a3e0ec38012be8fad0b40e1c29568
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fca1ce8e1321c185070051c404827dfc693fe55a6777dd0acded04344c9c30fd
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b2b586adc3a504918e31f8a9a7e0f4be94f03956b7f0114b4da9476acb22a6ef
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab594cbb8d871dbbf2b25c376be7c8da151b2a99217825751fae78b7561f2ad5
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:33a77fe6605383afb833ca53fc48599ad56cfe3eec3e43ed5ccdec337bfa0ca8
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e22039e8547ad63b2ace49f210f4357ab45439130e9ce4cde64ab4d788dae45
3
+ size 14439
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:815de40461412919a5889eec61609965c9d2866910047894a4dc0f6b20abb0b4
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0035334d6d79118a4fbb19f853805075e8cbb76d056e9372535b5cc2b4046af0
3
  size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f4ae17687fd76755d54219d89fc11c8946b10678e74c0c01048fa01e50274084
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:523d1db2472a9cc3cbeb9c091f0349bda45803d7d0a416b91c4a707a5260de91
3
  size 14503
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c17905fc96ebc0f02fa95bfe12b431ac787bae4299fa05067fe9a564d5bb62cc
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89bdfe288c33ce02d82b7c3c74d7eb542a7bb82b47a44b8ec4cd489dc5c385c0
3
  size 14503
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b4ee1c07d4ce16af70500d9164050fdd6814fe5b1c70d5ddc9dc0d403bb72893
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8867e21d1b6a1acf6d7736261e75716fa7b5040d081c92aba0073b066f2ada16
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 10.536442347336113,
5
- "global_step": 690000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -5112,11 +5112,85 @@
5112
  "eval_samples_per_second": 1199.26,
5113
  "eval_steps_per_second": 19.188,
5114
  "step": 690000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5115
  }
5116
  ],
5117
  "max_steps": 1000000,
5118
  "num_train_epochs": 16,
5119
- "total_flos": 4.8369114404124654e+22,
5120
  "trial_name": null,
5121
  "trial_params": null
5122
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 10.689144410340983,
5
+ "global_step": 700000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
5112
  "eval_samples_per_second": 1199.26,
5113
  "eval_steps_per_second": 19.188,
5114
  "step": 690000
5115
+ },
5116
+ {
5117
+ "epoch": 10.55,
5118
+ "learning_rate": 4.347445648076057e-05,
5119
+ "loss": 0.2463,
5120
+ "step": 691000
5121
+ },
5122
+ {
5123
+ "epoch": 10.57,
5124
+ "learning_rate": 4.327718256369826e-05,
5125
+ "loss": 0.2458,
5126
+ "step": 692000
5127
+ },
5128
+ {
5129
+ "epoch": 10.58,
5130
+ "learning_rate": 4.3080310241483885e-05,
5131
+ "loss": 0.2451,
5132
+ "step": 693000
5133
+ },
5134
+ {
5135
+ "epoch": 10.6,
5136
+ "learning_rate": 4.2883841667081675e-05,
5137
+ "loss": 0.2454,
5138
+ "step": 694000
5139
+ },
5140
+ {
5141
+ "epoch": 10.61,
5142
+ "learning_rate": 4.268777898904044e-05,
5143
+ "loss": 0.2455,
5144
+ "step": 695000
5145
+ },
5146
+ {
5147
+ "epoch": 10.61,
5148
+ "eval_runtime": 0.794,
5149
+ "eval_samples_per_second": 1259.505,
5150
+ "eval_steps_per_second": 20.152,
5151
+ "step": 695000
5152
+ },
5153
+ {
5154
+ "epoch": 10.63,
5155
+ "learning_rate": 4.2492124351470214e-05,
5156
+ "loss": 0.2453,
5157
+ "step": 696000
5158
+ },
5159
+ {
5160
+ "epoch": 10.64,
5161
+ "learning_rate": 4.2296879894018835e-05,
5162
+ "loss": 0.2449,
5163
+ "step": 697000
5164
+ },
5165
+ {
5166
+ "epoch": 10.66,
5167
+ "learning_rate": 4.210204775184834e-05,
5168
+ "loss": 0.245,
5169
+ "step": 698000
5170
+ },
5171
+ {
5172
+ "epoch": 10.67,
5173
+ "learning_rate": 4.190763005561186e-05,
5174
+ "loss": 0.2447,
5175
+ "step": 699000
5176
+ },
5177
+ {
5178
+ "epoch": 10.69,
5179
+ "learning_rate": 4.171362893143013e-05,
5180
+ "loss": 0.2444,
5181
+ "step": 700000
5182
+ },
5183
+ {
5184
+ "epoch": 10.69,
5185
+ "eval_runtime": 0.7798,
5186
+ "eval_samples_per_second": 1282.444,
5187
+ "eval_steps_per_second": 20.519,
5188
+ "step": 700000
5189
  }
5190
  ],
5191
  "max_steps": 1000000,
5192
  "num_train_epochs": 16,
5193
+ "total_flos": 4.9070117014428126e+22,
5194
  "trial_name": null,
5195
  "trial_params": null
5196
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b2b586adc3a504918e31f8a9a7e0f4be94f03956b7f0114b4da9476acb22a6ef
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab594cbb8d871dbbf2b25c376be7c8da151b2a99217825751fae78b7561f2ad5
3
  size 449471589