Arnold145 committed on
Commit
f52238c
·
verified ·
1 Parent(s): 27ec731

Training in progress, step 450, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2e13aeadadcb18ccca3990a5ea046ad853d02f3507e924d3e926423422b9724f
3
  size 731354744
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3eadd3d4eaf8e8cca40ccfcdf2e7e8c317298579e4396633a91d3ee0c34bdd05
3
  size 731354744
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b2f9470edf00755a751f98de8c88e303ee2727803762be95e73a952d310cb559
3
  size 63408995
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f394d21ae96d51c3003b350f67f08fd6b890f4a5aed87fa1ad54d05089da21e9
3
  size 63408995
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:55ea6e86605f5bdbd3d2670e361e09f3a420c9ea42b3ec5fedc3dc6fe8a71f9f
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb704cb6af3d7d6343b8a939e6a99a7d5bc9718dc6aef63d92b013125b539e8a
3
  size 14645
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2b8c59142c671cf2cf56a62db55635521ca84aea1b7e2c066062e1f4726a4090
3
  size 1383
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75d188a721aa835b9489f9988a78c4834dfa093c6501e89534b2b37f1089e3c2
3
  size 1383
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8eb257dcc0502678a900ea37d077b117e01470f20d05ddfe2d784926affdb6db
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a7a8730b38600022e9cc851fea0cc8fd28f0a9a328859865df47989c36fd5de
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 150,
3
  "best_metric": 1.0783365570599612,
4
  "best_model_checkpoint": "./whisper-transcription-test-2\\checkpoint-150",
5
- "epoch": 1.0101010101010102,
6
  "eval_steps": 150,
7
- "global_step": 300,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -112,6 +112,58 @@
112
  "eval_steps_per_second": 0.015,
113
  "eval_wer": 1.2195357833655707,
114
  "step": 300
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
115
  }
116
  ],
117
  "logging_steps": 25,
@@ -131,7 +183,7 @@
131
  "attributes": {}
132
  }
133
  },
134
- "total_flos": 3.2905894035456e+19,
135
  "train_batch_size": 8,
136
  "trial_name": null,
137
  "trial_params": null
 
2
  "best_global_step": 150,
3
  "best_metric": 1.0783365570599612,
4
  "best_model_checkpoint": "./whisper-transcription-test-2\\checkpoint-150",
5
+ "epoch": 1.5151515151515151,
6
  "eval_steps": 150,
7
+ "global_step": 450,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
112
  "eval_steps_per_second": 0.015,
113
  "eval_wer": 1.2195357833655707,
114
  "step": 300
115
+ },
116
+ {
117
+ "epoch": 1.0942760942760943,
118
+ "grad_norm": 1.3164455890655518,
119
+ "learning_rate": 9.997482711915926e-06,
120
+ "loss": 7.9224,
121
+ "step": 325
122
+ },
123
+ {
124
+ "epoch": 1.1784511784511784,
125
+ "grad_norm": 2.3813953399658203,
126
+ "learning_rate": 9.990665021116475e-06,
127
+ "loss": 7.8599,
128
+ "step": 350
129
+ },
130
+ {
131
+ "epoch": 1.2626262626262625,
132
+ "grad_norm": 1.4914205074310303,
133
+ "learning_rate": 9.979538999730047e-06,
134
+ "loss": 7.7867,
135
+ "step": 375
136
+ },
137
+ {
138
+ "epoch": 1.3468013468013469,
139
+ "grad_norm": 0.9378845691680908,
140
+ "learning_rate": 9.964114252604508e-06,
141
+ "loss": 7.7853,
142
+ "step": 400
143
+ },
144
+ {
145
+ "epoch": 1.430976430976431,
146
+ "grad_norm": 1.8846515417099,
147
+ "learning_rate": 9.944404095582444e-06,
148
+ "loss": 7.7433,
149
+ "step": 425
150
+ },
151
+ {
152
+ "epoch": 1.5151515151515151,
153
+ "grad_norm": 1.9767364263534546,
154
+ "learning_rate": 9.920425544005902e-06,
155
+ "loss": 7.7287,
156
+ "step": 450
157
+ },
158
+ {
159
+ "epoch": 1.5151515151515151,
160
+ "eval_cer": 1.0391868512110727,
161
+ "eval_loss": 7.759721755981445,
162
+ "eval_runtime": 4160.7601,
163
+ "eval_samples_per_second": 0.048,
164
+ "eval_steps_per_second": 0.012,
165
+ "eval_wer": 1.4598646034816247,
166
+ "step": 450
167
  }
168
  ],
169
  "logging_steps": 25,
 
183
  "attributes": {}
184
  }
185
  },
186
+ "total_flos": 4.9358841053184e+19,
187
  "train_batch_size": 8,
188
  "trial_name": null,
189
  "trial_params": null