Myat-Oo-Swe committed on
Commit
02e5c91
·
verified ·
1 Parent(s): dcce8c9

Training in progress, step 2000, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:239e6ee34c627288f07da635c7607c26cb1658248cb4216138582c969c562c53
3
  size 62969640
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1faae7c834d1bb6209cce5a3f0eba37603cd97968d5ae1b6bf60ee5532f4c25f
3
  size 62969640
last-checkpoint/adapter_model/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:239e6ee34c627288f07da635c7607c26cb1658248cb4216138582c969c562c53
3
  size 62969640
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1faae7c834d1bb6209cce5a3f0eba37603cd97968d5ae1b6bf60ee5532f4c25f
3
  size 62969640
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b57dc2a75271934b9272c6e364dbf8843d89c17ee905195eb7b2c5eaf32f6c3c
3
  size 84101370
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f26b7ff9e117acaaf45b07eccb6cd0baa36728fc0f969371979374cc5be60035
3
  size 84101370
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:018d3489ed13a5f5303fe87bc05ee3bd7e42fab42cae25b01d59fef9cd4802ee
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1cdd3cf64f5c3a203d2cecf3121f10fda7f7fc667ea30f96acfb98121b8c3035
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c2a4b6e0ef05ca249f2d6b7f9f3ad1dff81e55842a962df795bb9740c17c8e92
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c50a9cebe5d66d453d25b140738bff479749ac03e0a43597d8776bc22f6ed0c
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:416c83758baa78b1c3e5334d8425b4107684ccd443376b2af239f14f10f93e92
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:382782d862255d071016cff9c6a4b56eed27c6324967e51b062457330841da4d
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 1500,
3
- "best_metric": 0.6280742287635803,
4
- "best_model_checkpoint": "./whisper-large-v3-lt1/checkpoint-1500",
5
- "epoch": 0.75,
6
  "eval_steps": 500,
7
- "global_step": 1500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -137,6 +137,49 @@
137
  "eval_samples_per_second": 2.509,
138
  "eval_steps_per_second": 0.314,
139
  "step": 1500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
140
  }
141
  ],
142
  "logging_steps": 100,
@@ -151,12 +194,12 @@
151
  "should_evaluate": false,
152
  "should_log": false,
153
  "should_save": true,
154
- "should_training_stop": false
155
  },
156
  "attributes": {}
157
  }
158
  },
159
- "total_flos": 8.240969023488e+19,
160
  "train_batch_size": 16,
161
  "trial_name": null,
162
  "trial_params": null
 
1
  {
2
+ "best_global_step": 2000,
3
+ "best_metric": 0.6051455140113831,
4
+ "best_model_checkpoint": "./whisper-large-v3-lt1/checkpoint-2000",
5
+ "epoch": 1.179,
6
  "eval_steps": 500,
7
+ "global_step": 2000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
137
  "eval_samples_per_second": 2.509,
138
  "eval_steps_per_second": 0.314,
139
  "step": 1500
140
+ },
141
+ {
142
+ "epoch": 0.8,
143
+ "grad_norm": 1.4991073608398438,
144
+ "learning_rate": 2.110526315789474e-06,
145
+ "loss": 0.6425,
146
+ "step": 1600
147
+ },
148
+ {
149
+ "epoch": 1.029,
150
+ "grad_norm": 1.7371805906295776,
151
+ "learning_rate": 1.5842105263157894e-06,
152
+ "loss": 0.6223,
153
+ "step": 1700
154
+ },
155
+ {
156
+ "epoch": 1.079,
157
+ "grad_norm": 3.491868495941162,
158
+ "learning_rate": 1.0578947368421054e-06,
159
+ "loss": 0.6013,
160
+ "step": 1800
161
+ },
162
+ {
163
+ "epoch": 1.129,
164
+ "grad_norm": 2.1243815422058105,
165
+ "learning_rate": 5.315789473684211e-07,
166
+ "loss": 0.5967,
167
+ "step": 1900
168
+ },
169
+ {
170
+ "epoch": 1.179,
171
+ "grad_norm": 2.0289883613586426,
172
+ "learning_rate": 5.263157894736842e-09,
173
+ "loss": 0.5986,
174
+ "step": 2000
175
+ },
176
+ {
177
+ "epoch": 1.179,
178
+ "eval_loss": 0.6051455140113831,
179
+ "eval_runtime": 1166.0635,
180
+ "eval_samples_per_second": 2.504,
181
+ "eval_steps_per_second": 0.313,
182
+ "step": 2000
183
  }
184
  ],
185
  "logging_steps": 100,
 
194
  "should_evaluate": false,
195
  "should_log": false,
196
  "should_save": true,
197
+ "should_training_stop": true
198
  },
199
  "attributes": {}
200
  }
201
  },
202
+ "total_flos": 1.0985211708309504e+20,
203
  "train_batch_size": 16,
204
  "trial_name": null,
205
  "trial_params": null