Basma2423 committed on
Commit
bf57795
·
verified ·
1 Parent(s): 5933078

Training in progress, step 10420

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:63eea8c40b61bba355a0097c91aec36f1d47d21024da7a0b696a224d7f332070
3
  size 1470068592
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b624a6ea8d6d1418579f888925098269918a7ce6b105f6ab042eec442ec455b8
3
  size 1470068592
runs/Jul16_10-37-58_ip-10-192-10-108/events.out.tfevents.1752662280.ip-10-192-10-108.2114.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:905d5d8111debb3d686d2323d92f6a85d8d86a7b195825485f295465b1c839b7
3
+ size 6794
trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 7815,
3
- "best_metric": 0.047643108039959726,
4
- "best_model_checkpoint": "checkpoints/checkpoint-7815",
5
- "epoch": 0.5998388149057835,
6
  "eval_steps": 2605,
7
- "global_step": 7815,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -137,6 +137,53 @@
137
  "eval_steps_per_second": 0.377,
138
  "eval_wer": 0.07081328706403231,
139
  "step": 7815
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
140
  }
141
  ],
142
  "logging_steps": 500,
@@ -156,7 +203,7 @@
156
  "attributes": {}
157
  }
158
  },
159
- "total_flos": 5.432807843168256e+17,
160
  "train_batch_size": 80,
161
  "trial_name": null,
162
  "trial_params": null
 
1
  {
2
+ "best_global_step": 10420,
3
+ "best_metric": 0.046850736209360914,
4
+ "best_model_checkpoint": "checkpoints/checkpoint-10420",
5
+ "epoch": 0.7997850865410446,
6
  "eval_steps": 2605,
7
+ "global_step": 10420,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
137
  "eval_steps_per_second": 0.377,
138
  "eval_wer": 0.07081328706403231,
139
  "step": 7815
140
+ },
141
+ {
142
+ "epoch": 0.6140384541581917,
143
+ "grad_norm": 0.10269790142774582,
144
+ "learning_rate": 4.905050311075738e-05,
145
+ "loss": 0.139,
146
+ "step": 8000
147
+ },
148
+ {
149
+ "epoch": 0.6524158575430786,
150
+ "grad_norm": 0.08717872947454453,
151
+ "learning_rate": 4.8756902702886506e-05,
152
+ "loss": 0.1374,
153
+ "step": 8500
154
+ },
155
+ {
156
+ "epoch": 0.6907932609279657,
157
+ "grad_norm": 0.09375835955142975,
158
+ "learning_rate": 4.842493983528561e-05,
159
+ "loss": 0.1381,
160
+ "step": 9000
161
+ },
162
+ {
163
+ "epoch": 0.7291706643128526,
164
+ "grad_norm": 0.09731540083885193,
165
+ "learning_rate": 4.805515055898372e-05,
166
+ "loss": 0.1365,
167
+ "step": 9500
168
+ },
169
+ {
170
+ "epoch": 0.7675480676977395,
171
+ "grad_norm": 0.13318291306495667,
172
+ "learning_rate": 4.764813200679724e-05,
173
+ "loss": 0.1367,
174
+ "step": 10000
175
+ },
176
+ {
177
+ "epoch": 0.7997850865410446,
178
+ "eval_avg": 0.046850736209360914,
179
+ "eval_cer": 0.030717447084398133,
180
+ "eval_der": 0.040079204095426355,
181
+ "eval_loss": 0.12388349324464798,
182
+ "eval_runtime": 1688.4755,
183
+ "eval_samples_per_second": 30.658,
184
+ "eval_steps_per_second": 0.384,
185
+ "eval_wer": 0.06975555744825825,
186
+ "step": 10420
187
  }
188
  ],
189
  "logging_steps": 500,
 
203
  "attributes": {}
204
  }
205
  },
206
+ "total_flos": 7.243743790891008e+17,
207
  "train_batch_size": 80,
208
  "trial_name": null,
209
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cc9ecd76b0bc819c93ee275a6f1cdc22d588a2c3cac72c302c4668fed5df65f6
3
  size 5905
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61bada019f1b6e6889591c3c2feece3654269f05a9a603962c9ef4b6d6acb215
3
  size 5905