emdemor committed on
Commit
af972b3
·
verified ·
1 Parent(s): d5910a1

Training in progress, step 330

Browse files
Files changed (2) hide show
  1. adapter_model.safetensors +1 -1
  2. state.json +18 -3
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:164cd75ce7d75783388fda00bd1983d8add8c0d60e1682807773d77977bbb275
3
  size 35668592
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:673aa39bdc5c2f0ebc47b58e552386c125809c5f0bc1ce481fb92273af7b8e68
3
  size 35668592
state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.512,
5
  "eval_steps": 20,
6
- "global_step": 320,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -232,6 +232,21 @@
232
  "eval_samples_per_second": 3.396,
233
  "eval_steps_per_second": 0.425,
234
  "step": 300
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
235
  }
236
  ],
237
  "logging_steps": 20,
@@ -251,7 +266,7 @@
251
  "attributes": {}
252
  }
253
  },
254
- "total_flos": 2.490887225745408e+16,
255
  "train_batch_size": 8,
256
  "trial_name": null,
257
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.528,
5
  "eval_steps": 20,
6
+ "global_step": 330,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
232
  "eval_samples_per_second": 3.396,
233
  "eval_steps_per_second": 0.425,
234
  "step": 300
235
+ },
236
+ {
237
+ "epoch": 0.512,
238
+ "grad_norm": 0.03938526660203934,
239
+ "learning_rate": 0.00046117368109069355,
240
+ "loss": 1.4996,
241
+ "step": 320
242
+ },
243
+ {
244
+ "epoch": 0.512,
245
+ "eval_loss": 1.4825308322906494,
246
+ "eval_runtime": 1500.8065,
247
+ "eval_samples_per_second": 3.332,
248
+ "eval_steps_per_second": 0.416,
249
+ "step": 320
250
  }
251
  ],
252
  "logging_steps": 20,
 
266
  "attributes": {}
267
  }
268
  },
269
+ "total_flos": 2.572185984761856e+16,
270
  "train_batch_size": 8,
271
  "trial_name": null,
272
  "trial_params": null