dq158 committed on
Commit
2ebdd0d
·
1 Parent(s): 407276e

Training in progress, epoch 5, checkpoint

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2e182cf7af55a4587a0ca3ba6416b1aa45eafc79633351a41e5d59811f7a451c
3
  size 1980860410
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edbf65f6f6b2d902ca192fe35b3efd93add0d803274b4def7bd26dee546982fe
3
  size 1980860410
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cec0c19e5d8676c555d959ec2b293902f093b7ead0acaa05a8a02126e66971d0
3
  size 990409330
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:459187e110db4e0fb7a78cfb68b5e2e416fc7bc717e4748019446f5cdf973209
3
  size 990409330
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:729abbd3ef67de81491d0ba432cad08d03530a09134bacfb682480f442a1aec0
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9519ad1f203ec112bc005ea3f5aacffca3d057ed940f03bc40440539df41b908
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e79d3f19a5bd9c30d954331796aa7283483a96c6d7e33353c55c9ee00b681646
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4166a33b5520e0dfb0734abb46fce8eedf9514c1a2270d14609538201a3fae48
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 1.4407896995544434,
3
- "best_model_checkpoint": "dq158/morbius/checkpoint-5900",
4
- "epoch": 4.0,
5
  "eval_steps": 500,
6
- "global_step": 5900,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -149,13 +149,50 @@
149
  "eval_steps_per_second": 0.562,
150
  "eval_translation_length": 36007,
151
  "step": 5900
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
152
  }
153
  ],
154
  "logging_steps": 500,
155
  "max_steps": 7375,
156
  "num_train_epochs": 5,
157
  "save_steps": 500,
158
- "total_flos": 4.846438637685965e+16,
159
  "trial_name": null,
160
  "trial_params": null
161
  }
 
1
  {
2
+ "best_metric": 1.4382692575454712,
3
+ "best_model_checkpoint": "dq158/morbius/checkpoint-7375",
4
+ "epoch": 5.0,
5
  "eval_steps": 500,
6
+ "global_step": 7375,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
149
  "eval_steps_per_second": 0.562,
150
  "eval_translation_length": 36007,
151
  "step": 5900
152
+ },
153
+ {
154
+ "epoch": 4.07,
155
+ "learning_rate": 9.322033898305085e-06,
156
+ "loss": 1.6139,
157
+ "step": 6000
158
+ },
159
+ {
160
+ "epoch": 4.41,
161
+ "learning_rate": 5.932203389830509e-06,
162
+ "loss": 1.5939,
163
+ "step": 6500
164
+ },
165
+ {
166
+ "epoch": 4.75,
167
+ "learning_rate": 2.5423728813559323e-06,
168
+ "loss": 1.5956,
169
+ "step": 7000
170
+ },
171
+ {
172
+ "epoch": 5.0,
173
+ "eval_bleu": 1.0,
174
+ "eval_brevity_penalty": 1.0,
175
+ "eval_length_ratio": 1.0,
176
+ "eval_loss": 1.4382692575454712,
177
+ "eval_precisions": [
178
+ 1.0,
179
+ 1.0,
180
+ 1.0,
181
+ 1.0
182
+ ],
183
+ "eval_reference_length": 36000,
184
+ "eval_runtime": 292.0466,
185
+ "eval_samples_per_second": 6.732,
186
+ "eval_steps_per_second": 0.562,
187
+ "eval_translation_length": 36000,
188
+ "step": 7375
189
  }
190
  ],
191
  "logging_steps": 500,
192
  "max_steps": 7375,
193
  "num_train_epochs": 5,
194
  "save_steps": 500,
195
+ "total_flos": 6.058048297107456e+16,
196
  "trial_name": null,
197
  "trial_params": null
198
  }