dq158 committed on
Commit
16fa8f0
·
1 Parent(s): 9d88160

Training in progress, epoch 3, checkpoint

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2c4363d06929aee26c9e927701774792fb7453e840d38a5ad5a3f1d36b1be96b
3
  size 1980860410
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33cd6ceaf3e5c0a15820c9055970f910107122ac5f2692ee038a552928978e93
3
  size 1980860410
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:96e4c9ef9cd2909c6491e22429888102a5089a17edf046aff201c9c1677a0ddc
3
  size 990409330
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b2efc889d52b2d6c0784b72b631f0fe873c965bb89fe3a1d443214cc2dcc088
3
  size 990409330
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:240c04ca9a3cb29b976a770fef919a933d604a3470e1df27947f582528033848
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3af69a82a1b91d6e5092406535f43bc1f304899b494dcf1053de5c4be7029152
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d9ba60403de9780e4b1c2244a6784efea5c6643ffcd4f768f2fe7e0521babfed
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d45ce75f87aaa5b92cdc5c7abdc86c8b62d1ae1a014d3240669d9630def6c5a
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 2.3292136192321777,
3
- "best_model_checkpoint": "dq158/morbius/checkpoint-6326",
4
- "epoch": 2.0,
5
  "eval_steps": 500,
6
- "global_step": 6326,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -117,13 +117,68 @@
117
  "eval_steps_per_second": 0.626,
118
  "eval_translation_length": 53147,
119
  "step": 6326
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
120
  }
121
  ],
122
  "logging_steps": 500,
123
  "max_steps": 63260,
124
  "num_train_epochs": 20,
125
  "save_steps": 500,
126
- "total_flos": 3.465283057798349e+16,
127
  "trial_name": null,
128
  "trial_params": null
129
  }
 
1
  {
2
+ "best_metric": 2.3189847469329834,
3
+ "best_model_checkpoint": "dq158/morbius/checkpoint-9489",
4
+ "epoch": 3.0,
5
  "eval_steps": 500,
6
+ "global_step": 9489,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
117
  "eval_steps_per_second": 0.626,
118
  "eval_translation_length": 53147,
119
  "step": 6326
120
+ },
121
+ {
122
+ "epoch": 2.06,
123
+ "learning_rate": 6.8433222607963194e-06,
124
+ "loss": 2.4242,
125
+ "step": 6500
126
+ },
127
+ {
128
+ "epoch": 2.21,
129
+ "learning_rate": 6.816361474374877e-06,
130
+ "loss": 2.4037,
131
+ "step": 7000
132
+ },
133
+ {
134
+ "epoch": 2.37,
135
+ "learning_rate": 6.787323321691012e-06,
136
+ "loss": 2.3952,
137
+ "step": 7500
138
+ },
139
+ {
140
+ "epoch": 2.53,
141
+ "learning_rate": 6.7562259922211045e-06,
142
+ "loss": 2.4106,
143
+ "step": 8000
144
+ },
145
+ {
146
+ "epoch": 2.69,
147
+ "learning_rate": 6.723088965308281e-06,
148
+ "loss": 2.4145,
149
+ "step": 8500
150
+ },
151
+ {
152
+ "epoch": 2.85,
153
+ "learning_rate": 6.68793299796057e-06,
154
+ "loss": 2.356,
155
+ "step": 9000
156
+ },
157
+ {
158
+ "epoch": 3.0,
159
+ "eval_bleu": 1.0,
160
+ "eval_brevity_penalty": 1.0,
161
+ "eval_length_ratio": 1.0,
162
+ "eval_loss": 2.3189847469329834,
163
+ "eval_precisions": [
164
+ 1.0,
165
+ 1.0,
166
+ 1.0,
167
+ 1.0
168
+ ],
169
+ "eval_reference_length": 53040,
170
+ "eval_runtime": 561.5646,
171
+ "eval_samples_per_second": 5.007,
172
+ "eval_steps_per_second": 0.627,
173
+ "eval_translation_length": 53040,
174
+ "step": 9489
175
  }
176
  ],
177
  "logging_steps": 500,
178
  "max_steps": 63260,
179
  "num_train_epochs": 20,
180
  "save_steps": 500,
181
+ "total_flos": 5.197924586697523e+16,
182
  "trial_name": null,
183
  "trial_params": null
184
  }