emdemor committed on
Commit
8019ed8
·
verified ·
1 Parent(s): bf319f5

Training in progress, step 350

Browse files
Files changed (2) hide show
  1. adapter_model.safetensors +1 -1
  2. state.json +18 -3
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:52e5b21efcff07a93f2b659f7c57e6cacbb0c9bfdf26d9b4fabe959421c4d76f
3
  size 35668592
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26ead50c513c37732efea9076d192b04a31af3830534624ffcda5bac2a4f7997
3
  size 35668592
state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.544,
5
  "eval_steps": 20,
6
- "global_step": 340,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -247,6 +247,21 @@
247
  "eval_samples_per_second": 3.332,
248
  "eval_steps_per_second": 0.416,
249
  "step": 320
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
250
  }
251
  ],
252
  "logging_steps": 20,
@@ -266,7 +281,7 @@
266
  "attributes": {}
267
  }
268
  },
269
- "total_flos": 2.650851803136e+16,
270
  "train_batch_size": 8,
271
  "trial_name": null,
272
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.56,
5
  "eval_steps": 20,
6
+ "global_step": 350,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
247
  "eval_samples_per_second": 3.332,
248
  "eval_steps_per_second": 0.416,
249
  "step": 320
250
+ },
251
+ {
252
+ "epoch": 0.544,
253
+ "grad_norm": 0.041331056505441666,
254
+ "learning_rate": 0.00045524599881446355,
255
+ "loss": 1.4742,
256
+ "step": 340
257
+ },
258
+ {
259
+ "epoch": 0.544,
260
+ "eval_loss": 1.4830516576766968,
261
+ "eval_runtime": 1501.5622,
262
+ "eval_samples_per_second": 3.33,
263
+ "eval_steps_per_second": 0.416,
264
+ "step": 340
265
  }
266
  ],
267
  "logging_steps": 20,
 
281
  "attributes": {}
282
  }
283
  },
284
+ "total_flos": 2.729553443831808e+16,
285
  "train_batch_size": 8,
286
  "trial_name": null,
287
  "trial_params": null