Basma2423 committed on
Commit
6c76d0e
·
verified ·
1 Parent(s): 4f153b2

Training in progress, step 9636

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d7d9179be7efa3d039286efbd45485bca053994cd099d18d9332ecc07e690565
3
  size 667849236
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6432e5d4dbcf96f5f64c6469ce31b0d5b3c9f01110150b82ee9cdadc1010e989
3
  size 667849236
runs/May05_22-15-18_ip-10-192-11-107/events.out.tfevents.1746483320.ip-10-192-11-107.1742.3 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4fa1b1793cd7a32a78d0adb81f839c2d36b48f7ef40f2b34aab870ba9924d01c
3
- size 7241
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:acc24c92646c4300934b8e42a0af0a9a570793e89cf4cb7a4bf4d6430ecf6297
3
+ size 8333
trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 8030,
3
- "best_metric": 0.7079419812877328,
4
- "best_model_checkpoint": "checkpoints/checkpoint-8030",
5
- "epoch": 1.2499902712378876,
6
  "eval_steps": 1606,
7
- "global_step": 8030,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -180,6 +180,39 @@
180
  "eval_steps_per_second": 1.728,
181
  "eval_wer": 0.6757794831111406,
182
  "step": 8030
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
183
  }
184
  ],
185
  "logging_steps": 500,
@@ -199,7 +232,7 @@
199
  "attributes": {}
200
  }
201
  },
202
- "total_flos": 6.267309210678067e+17,
203
  "train_batch_size": 256,
204
  "trial_name": null,
205
  "trial_params": null
 
1
  {
2
+ "best_global_step": 9636,
3
+ "best_metric": 0.7073388677263619,
4
+ "best_model_checkpoint": "checkpoints/checkpoint-9636",
5
+ "epoch": 1.4999805424757753,
6
  "eval_steps": 1606,
7
+ "global_step": 9636,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
180
  "eval_steps_per_second": 1.728,
181
  "eval_wer": 0.6757794831111406,
182
  "step": 8030
183
+ },
184
+ {
185
+ "epoch": 1.32315056232245,
186
+ "grad_norm": 0.035194575786590576,
187
+ "learning_rate": 4.8583398752382485e-05,
188
+ "loss": 0.0539,
189
+ "step": 8500
190
+ },
191
+ {
192
+ "epoch": 1.4009806592209206,
193
+ "grad_norm": 0.03347332403063774,
194
+ "learning_rate": 4.782967662255196e-05,
195
+ "loss": 0.0523,
196
+ "step": 9000
197
+ },
198
+ {
199
+ "epoch": 1.4788107561193913,
200
+ "grad_norm": 0.06645191460847855,
201
+ "learning_rate": 4.692437323847159e-05,
202
+ "loss": 0.0507,
203
+ "step": 9500
204
+ },
205
+ {
206
+ "epoch": 1.4999805424757753,
207
+ "eval_avg": 0.7073388677263619,
208
+ "eval_cer": 0.6541002942380697,
209
+ "eval_der": 0.7938397323961762,
210
+ "eval_loss": 0.03928952291607857,
211
+ "eval_runtime": 307.3123,
212
+ "eval_samples_per_second": 441.645,
213
+ "eval_steps_per_second": 1.728,
214
+ "eval_wer": 0.6740765765448399,
215
+ "step": 9636
216
  }
217
  ],
218
  "logging_steps": 500,
 
232
  "attributes": {}
233
  }
234
  },
235
+ "total_flos": 7.52077105281368e+17,
236
  "train_batch_size": 256,
237
  "trial_name": null,
238
  "trial_params": null