JuanPajero committed on
Commit
a683a0f
·
1 Parent(s): 73a26aa

Training in progress, step 12000

Browse files
{checkpoint-9000 → checkpoint-12000}/config.json RENAMED
File without changes
{checkpoint-9000 → checkpoint-12000}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:853a10b701c41859978527142af4efb610899026f2e0fa7952b243e513fbe8cd
3
  size 721687499
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53875c50949cb858b32b38afb434db1546fa61e5e5dcda9462f12c903fe9a8ea
3
  size 721687499
{checkpoint-9000 → checkpoint-12000}/preprocessor_config.json RENAMED
File without changes
{checkpoint-9000 → checkpoint-12000}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:81b0f74cc3edaa150bfa1b6a8d50d40730c767b06b515bfe1fe7ed56d12fa4bc
3
  size 377674359
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96d132744211d2c04695c3263e34a2f814f3d08d1bb925aff50c57941723e3b1
3
  size 377674359
{checkpoint-9000 → checkpoint-12000}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:95016d19f94268c2f81c3982cc7610459bc11c4070f1fc44c48b8e16ebb72e44
3
- size 14709
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24e705e7fbd74f4035ace4fa92507d51e4b05a05c88a5a0718de02484617fc51
3
+ size 14645
{checkpoint-9000 → checkpoint-12000}/scaler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:341b48166e5b847633c7df137f2c55412ed2c1d14b58e81d4d9b894963a415f1
3
  size 1383
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e174a76e0e352d264e5f92fd6a6b771293954f5541c746e7e66ccde440cbb3e
3
  size 1383
{checkpoint-9000 → checkpoint-12000}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e58b2aeb001747b91828136e7425c14c72edfc65e6905aea3a08554cc37fcafd
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:055259b9a818f446687e46aed4d609ba8d81f683861514ef91a50adacfd89299
3
  size 1465
{checkpoint-9000 → checkpoint-12000}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.6258692628650904,
5
- "global_step": 9000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -141,11 +141,56 @@
141
  "eval_steps_per_second": 1.891,
142
  "eval_wer": 0.355694020946573,
143
  "step": 9000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
144
  }
145
  ],
146
  "max_steps": 43140,
147
  "num_train_epochs": 3,
148
- "total_flos": 5.355539118047232e+18,
149
  "trial_name": null,
150
  "trial_params": null
151
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.8344923504867872,
5
+ "global_step": 12000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
141
  "eval_steps_per_second": 1.891,
142
  "eval_wer": 0.355694020946573,
143
  "step": 9000
144
+ },
145
+ {
146
+ "epoch": 0.7,
147
+ "learning_rate": 2.561273373512595e-05,
148
+ "loss": 0.4482,
149
+ "step": 10000
150
+ },
151
+ {
152
+ "epoch": 0.7,
153
+ "eval_loss": 0.7687897086143494,
154
+ "eval_runtime": 1333.2181,
155
+ "eval_samples_per_second": 14.947,
156
+ "eval_steps_per_second": 1.868,
157
+ "eval_wer": 0.343775176169449,
158
+ "step": 10000
159
+ },
160
+ {
161
+ "epoch": 0.76,
162
+ "learning_rate": 2.4840055632823366e-05,
163
+ "loss": 0.4311,
164
+ "step": 11000
165
+ },
166
+ {
167
+ "epoch": 0.76,
168
+ "eval_loss": 0.7420344948768616,
169
+ "eval_runtime": 1329.3248,
170
+ "eval_samples_per_second": 14.991,
171
+ "eval_steps_per_second": 1.874,
172
+ "eval_wer": 0.3233537972037243,
173
+ "step": 11000
174
+ },
175
+ {
176
+ "epoch": 0.83,
177
+ "learning_rate": 2.4067377530520787e-05,
178
+ "loss": 0.4272,
179
+ "step": 12000
180
+ },
181
+ {
182
+ "epoch": 0.83,
183
+ "eval_loss": 0.782776415348053,
184
+ "eval_runtime": 1318.9648,
185
+ "eval_samples_per_second": 15.109,
186
+ "eval_steps_per_second": 1.889,
187
+ "eval_wer": 0.33638421766487525,
188
+ "step": 12000
189
  }
190
  ],
191
  "max_steps": 43140,
192
  "num_train_epochs": 3,
193
+ "total_flos": 7.137862466936832e+18,
194
  "trial_name": null,
195
  "trial_params": null
196
  }
{checkpoint-9000 → checkpoint-12000}/training_args.bin RENAMED
File without changes
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6cf498c1fa08223b228f427a79968055619ec91d8255ce93830627bb36991315
3
  size 377674359
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96d132744211d2c04695c3263e34a2f814f3d08d1bb925aff50c57941723e3b1
3
  size 377674359
runs/Mar10_01-38-16_42fb38fbc845/events.out.tfevents.1773113504.42fb38fbc845.2655.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e8dfaedad67200afce2e8e06ba7e7c4adf7e54f74ecf1ab91b12f49039364881
3
- size 10271
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd2aab3b538cc43c0d6363401500d463f12630515cca37920b859769dcb3917c
3
+ size 10746