Reggie commited on
Commit
97d9451
·
verified ·
1 Parent(s): 6fa2dd6

Training in progress, step 1200, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:34f7c9f58b8006385995ced81e6445accf31a9b8a633aacfb0c70b92fc518b3e
3
  size 69782384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73a10ff5eb3169db4be2445ff7800df6ca56baf41d13df8beabc8dbd49758ae1
3
  size 69782384
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bf98b9dd13314e20beaff9f79e1eebccaea346aa82a3bf932061a8f81b389e7b
3
  size 139790651
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2eae897c01400a9b8db73e8dccb20a5cf751422c61f8a0f8ea7fa2d6cb6a973b
3
  size 139790651
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:48f8f6135c7853ebe442ee7acd4ef9a904245becd61941f4c9ec59b6ead1f855
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e0747b8c0f8a4ac9c7c69f279af311715abe07e1d91c1c29f20fdd8f88956b7
3
  size 14645
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e818f6fe93c49323bdb08dd60b51f7d49082edfe5fc12b2bfe83ab714f779a95
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e82b50b2ea56f39b6747507c52624e7d162a635e82738b894c21d143ffb08c1
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 1000,
3
- "best_metric": 2.22625994682312,
4
- "best_model_checkpoint": "./outputs/checkpoint-1000",
5
- "epoch": 1.0857763300760044,
6
  "eval_steps": 200,
7
- "global_step": 1000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -188,6 +188,42 @@
188
  "eval_samples_per_second": 81.558,
189
  "eval_steps_per_second": 2.574,
190
  "step": 1000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
191
  }
192
  ],
193
  "logging_steps": 50,
@@ -216,7 +252,7 @@
216
  "attributes": {}
217
  }
218
  },
219
- "total_flos": 2.8005692620367462e+17,
220
  "train_batch_size": 32,
221
  "trial_name": null,
222
  "trial_params": null
 
1
  {
2
+ "best_global_step": 1200,
3
+ "best_metric": 2.21370530128479,
4
+ "best_model_checkpoint": "./outputs/checkpoint-1200",
5
+ "epoch": 1.3029315960912053,
6
  "eval_steps": 200,
7
+ "global_step": 1200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
188
  "eval_samples_per_second": 81.558,
189
  "eval_steps_per_second": 2.574,
190
  "step": 1000
191
+ },
192
+ {
193
+ "epoch": 1.1400651465798046,
194
+ "grad_norm": 0.788972795009613,
195
+ "learning_rate": 0.00014022534788594312,
196
+ "loss": 2.2099,
197
+ "step": 1050
198
+ },
199
+ {
200
+ "epoch": 1.1943539630836049,
201
+ "grad_norm": 0.7912983894348145,
202
+ "learning_rate": 0.00013486009898582889,
203
+ "loss": 2.1799,
204
+ "step": 1100
205
+ },
206
+ {
207
+ "epoch": 1.248642779587405,
208
+ "grad_norm": 0.766243040561676,
209
+ "learning_rate": 0.00012937802194741994,
210
+ "loss": 2.2058,
211
+ "step": 1150
212
+ },
213
+ {
214
+ "epoch": 1.3029315960912053,
215
+ "grad_norm": 0.8190643191337585,
216
+ "learning_rate": 0.00012379748908958562,
217
+ "loss": 2.2021,
218
+ "step": 1200
219
+ },
220
+ {
221
+ "epoch": 1.3029315960912053,
222
+ "eval_loss": 2.21370530128479,
223
+ "eval_runtime": 7.3565,
224
+ "eval_samples_per_second": 81.833,
225
+ "eval_steps_per_second": 2.583,
226
+ "step": 1200
227
  }
228
  ],
229
  "logging_steps": 50,
 
252
  "attributes": {}
253
  }
254
  },
255
+ "total_flos": 3.361352657491722e+17,
256
  "train_batch_size": 32,
257
  "trial_name": null,
258
  "trial_params": null