Basma2423 commited on
Commit
6e979d5
·
verified ·
1 Parent(s): 7d95240

Training in progress, step 11242

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6432e5d4dbcf96f5f64c6469ce31b0d5b3c9f01110150b82ee9cdadc1010e989
3
  size 667849236
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5fd5f2647fde284fadd8fe1b84d2385e1d8557c192a97d1bcb3b84b535022e3
3
  size 667849236
runs/May05_22-15-18_ip-10-192-11-107/events.out.tfevents.1746483320.ip-10-192-11-107.1742.3 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:acc24c92646c4300934b8e42a0af0a9a570793e89cf4cb7a4bf4d6430ecf6297
3
- size 8333
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c0c1ed8c78331621c33d91080f46daa3bfc44db1cd7f7208e0e1b80939a9db4
3
+ size 9425
trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 9636,
3
- "best_metric": 0.7073388677263619,
4
- "best_model_checkpoint": "checkpoints/checkpoint-9636",
5
- "epoch": 1.4999805424757753,
6
  "eval_steps": 1606,
7
- "global_step": 9636,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -213,6 +213,39 @@
213
  "eval_steps_per_second": 1.728,
214
  "eval_wer": 0.6740765765448399,
215
  "step": 9636
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
216
  }
217
  ],
218
  "logging_steps": 500,
@@ -232,7 +265,7 @@
232
  "attributes": {}
233
  }
234
  },
235
- "total_flos": 7.52077105281368e+17,
236
  "train_batch_size": 256,
237
  "trial_name": null,
238
  "trial_params": null
 
1
  {
2
+ "best_global_step": 11242,
3
+ "best_metric": 0.7068964281422255,
4
+ "best_model_checkpoint": "checkpoints/checkpoint-11242",
5
+ "epoch": 1.749970813713663,
6
  "eval_steps": 1606,
7
+ "global_step": 11242,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
213
  "eval_steps_per_second": 1.728,
214
  "eval_wer": 0.6740765765448399,
215
  "step": 9636
216
+ },
217
+ {
218
+ "epoch": 1.556640853017862,
219
+ "grad_norm": 0.031485334038734436,
220
+ "learning_rate": 4.587349950536374e-05,
221
+ "loss": 0.0492,
222
+ "step": 10000
223
+ },
224
+ {
225
+ "epoch": 1.6344709499163326,
226
+ "grad_norm": 0.031592607498168945,
227
+ "learning_rate": 4.46840328658421e-05,
228
+ "loss": 0.0481,
229
+ "step": 10500
230
+ },
231
+ {
232
+ "epoch": 1.7123010468148032,
233
+ "grad_norm": 0.031952131539583206,
234
+ "learning_rate": 4.336387097207617e-05,
235
+ "loss": 0.0468,
236
+ "step": 11000
237
+ },
238
+ {
239
+ "epoch": 1.749970813713663,
240
+ "eval_avg": 0.7068964281422255,
241
+ "eval_cer": 0.6539495257646198,
242
+ "eval_der": 0.7937636951733035,
243
+ "eval_loss": 0.036437951028347015,
244
+ "eval_runtime": 308.1694,
245
+ "eval_samples_per_second": 440.417,
246
+ "eval_steps_per_second": 1.723,
247
+ "eval_wer": 0.6729760634887532,
248
+ "step": 11242
249
  }
250
  ],
251
  "logging_steps": 500,
 
265
  "attributes": {}
266
  }
267
  },
268
+ "total_flos": 8.774232894949294e+17,
269
  "train_batch_size": 256,
270
  "trial_name": null,
271
  "trial_params": null