Transformers
PyTorch
English
pixel
pretraining
plip commited on
Commit
30cea94
·
1 Parent(s): d57244a

Training in progress, step 290000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a09f2253c2da714db2381b4b6c94afe74f0c5bcca5dfab2a4d09f3bc77a1a830
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3a8513b0368f6cb2e3381f928e0aa14b5dd1d4d6e81f16afa2b1f5c07381ace
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f568156f561dbbcf7503a348dffb485dffe24e58ccf5c28c9e6be3fa82361daf
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34882c0a1ec238c2b1ad9048809a8c4ec0fe4694d212fa9d7361294be70895cf
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:59a9fce20181e682cc72fca21c2c1d9ae33919a24109d9c3b0015bbe48914330
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53d2183906572577bb72529bb7cea14ccb3598c2ad81bd496d1690556b2c2fad
3
  size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6f3a816674b62f2ebc9df81821d70aa6368f98c31e4a2d5592af6a40fe48198f
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e47c84ee1a7263145bb05e6bd38ff747cca1ce76d180b5d014131790082d04ac
3
  size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:913db27023ff5c862ac68d8593e062aa9da19c0798da56d43a2896de4cc6dca5
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5654423abeb0cd8c1ac599d51c54b19e61e2cbf655685c7b1d094b3f86c3ae14
3
  size 14503
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:77a839f0e74d399ee3f4539eaee8bff7b1db922601d5d69fcbfe490fd00b94d2
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75741429273458049dfadf451049de4bb7af88e4bb53df1b8babe07272a17a27
3
+ size 14439
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9756e1f2ce28cffe3ad2413091d8de7b6aa9409f983eeb48589ea2a1911fb547
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43486ecf7953ead4f44fd0913517d08c2421c80bd01545c2aa6edfd9bc952a2c
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 4.275657764136393,
5
- "global_step": 280000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -2078,11 +2078,85 @@
2078
  "eval_samples_per_second": 971.532,
2079
  "eval_steps_per_second": 15.545,
2080
  "step": 280000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2081
  }
2082
  ],
2083
  "max_steps": 1000000,
2084
  "num_train_epochs": 16,
2085
- "total_flos": 1.962804680577125e+22,
2086
  "trial_name": null,
2087
  "trial_params": null
2088
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 4.428359827141264,
5
+ "global_step": 290000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
2078
  "eval_samples_per_second": 971.532,
2079
  "eval_steps_per_second": 15.545,
2080
  "step": 280000
2081
+ },
2082
+ {
2083
+ "epoch": 4.29,
2084
+ "learning_rate": 0.00013054991184149905,
2085
+ "loss": 0.2946,
2086
+ "step": 281000
2087
+ },
2088
+ {
2089
+ "epoch": 4.31,
2090
+ "learning_rate": 0.00013038950654188476,
2091
+ "loss": 0.2942,
2092
+ "step": 282000
2093
+ },
2094
+ {
2095
+ "epoch": 4.32,
2096
+ "learning_rate": 0.00013022855019070005,
2097
+ "loss": 0.2941,
2098
+ "step": 283000
2099
+ },
2100
+ {
2101
+ "epoch": 4.34,
2102
+ "learning_rate": 0.0001300670445481378,
2103
+ "loss": 0.2937,
2104
+ "step": 284000
2105
+ },
2106
+ {
2107
+ "epoch": 4.35,
2108
+ "learning_rate": 0.0001299049913803978,
2109
+ "loss": 0.2937,
2110
+ "step": 285000
2111
+ },
2112
+ {
2113
+ "epoch": 4.35,
2114
+ "eval_runtime": 1.0469,
2115
+ "eval_samples_per_second": 955.197,
2116
+ "eval_steps_per_second": 15.283,
2117
+ "step": 285000
2118
+ },
2119
+ {
2120
+ "epoch": 4.37,
2121
+ "learning_rate": 0.00012974239245966754,
2122
+ "loss": 0.2934,
2123
+ "step": 286000
2124
+ },
2125
+ {
2126
+ "epoch": 4.38,
2127
+ "learning_rate": 0.0001295792495641028,
2128
+ "loss": 0.2962,
2129
+ "step": 287000
2130
+ },
2131
+ {
2132
+ "epoch": 4.4,
2133
+ "learning_rate": 0.00012941556447780813,
2134
+ "loss": 0.2931,
2135
+ "step": 288000
2136
+ },
2137
+ {
2138
+ "epoch": 4.41,
2139
+ "learning_rate": 0.0001292513389908174,
2140
+ "loss": 0.2931,
2141
+ "step": 289000
2142
+ },
2143
+ {
2144
+ "epoch": 4.43,
2145
+ "learning_rate": 0.0001290865748990742,
2146
+ "loss": 0.2932,
2147
+ "step": 290000
2148
+ },
2149
+ {
2150
+ "epoch": 4.43,
2151
+ "eval_runtime": 1.0143,
2152
+ "eval_samples_per_second": 985.898,
2153
+ "eval_steps_per_second": 15.774,
2154
+ "step": 290000
2155
  }
2156
  ],
2157
  "max_steps": 1000000,
2158
  "num_train_epochs": 16,
2159
+ "total_flos": 2.032904941607472e+22,
2160
  "trial_name": null,
2161
  "trial_params": null
2162
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f568156f561dbbcf7503a348dffb485dffe24e58ccf5c28c9e6be3fa82361daf
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34882c0a1ec238c2b1ad9048809a8c4ec0fe4694d212fa9d7361294be70895cf
3
  size 449471589