Reggie commited on
Commit
6dff460
·
verified ·
1 Parent(s): 6b42a6e

Training in progress, step 1000, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aac60fa61b1371f0628e4cdce110bd39a12e57e9c460d701427e8c58e754e7e9
3
  size 69782384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34f7c9f58b8006385995ced81e6445accf31a9b8a633aacfb0c70b92fc518b3e
3
  size 69782384
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a63b11235c95638e0ee559b2345b5d8f7a103f5995eca48cb715fe2ba2cac47e
3
  size 139790651
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf98b9dd13314e20beaff9f79e1eebccaea346aa82a3bf932061a8f81b389e7b
3
  size 139790651
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bb0516b0656c487c351bad1057295186b5e3e00c79529207cd235ce5be6a5d40
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48f8f6135c7853ebe442ee7acd4ef9a904245becd61941f4c9ec59b6ead1f855
3
  size 14645
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e4f1426694c38acbbdcb00f1a570a9712c4816b9dc6fb937a5303ba759aa3ab7
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e818f6fe93c49323bdb08dd60b51f7d49082edfe5fc12b2bfe83ab714f779a95
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 800,
3
- "best_metric": 2.2396719455718994,
4
- "best_model_checkpoint": "./outputs/checkpoint-800",
5
- "epoch": 0.8686210640608035,
6
  "eval_steps": 200,
7
- "global_step": 800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -152,6 +152,42 @@
152
  "eval_samples_per_second": 81.898,
153
  "eval_steps_per_second": 2.585,
154
  "step": 800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
155
  }
156
  ],
157
  "logging_steps": 50,
@@ -180,7 +216,7 @@
180
  "attributes": {}
181
  }
182
  },
183
- "total_flos": 2.2399365411628646e+17,
184
  "train_batch_size": 32,
185
  "trial_name": null,
186
  "trial_params": null
 
1
  {
2
+ "best_global_step": 1000,
3
+ "best_metric": 2.22625994682312,
4
+ "best_model_checkpoint": "./outputs/checkpoint-1000",
5
+ "epoch": 1.0857763300760044,
6
  "eval_steps": 200,
7
+ "global_step": 1000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
152
  "eval_samples_per_second": 81.898,
153
  "eval_steps_per_second": 2.585,
154
  "step": 800
155
+ },
156
+ {
157
+ "epoch": 0.9229098805646037,
158
+ "grad_norm": 0.6467435359954834,
159
+ "learning_rate": 0.0001601655739753613,
160
+ "loss": 2.2523,
161
+ "step": 850
162
+ },
163
+ {
164
+ "epoch": 0.9771986970684039,
165
+ "grad_norm": 0.6962546706199646,
166
+ "learning_rate": 0.0001554426355793363,
167
+ "loss": 2.2509,
168
+ "step": 900
169
+ },
170
+ {
171
+ "epoch": 1.0314875135722041,
172
+ "grad_norm": 0.6648530960083008,
173
+ "learning_rate": 0.0001505338899112344,
174
+ "loss": 2.2103,
175
+ "step": 950
176
+ },
177
+ {
178
+ "epoch": 1.0857763300760044,
179
+ "grad_norm": 0.9022650122642517,
180
+ "learning_rate": 0.00014545578786002178,
181
+ "loss": 2.1862,
182
+ "step": 1000
183
+ },
184
+ {
185
+ "epoch": 1.0857763300760044,
186
+ "eval_loss": 2.22625994682312,
187
+ "eval_runtime": 7.3813,
188
+ "eval_samples_per_second": 81.558,
189
+ "eval_steps_per_second": 2.574,
190
+ "step": 1000
191
  }
192
  ],
193
  "logging_steps": 50,
 
216
  "attributes": {}
217
  }
218
  },
219
+ "total_flos": 2.8005692620367462e+17,
220
  "train_batch_size": 32,
221
  "trial_name": null,
222
  "trial_params": null