DaniilOr committed on
Commit
87390a9
·
verified ·
1 Parent(s): c4f4ccd

Upload 12 files

Browse files
Files changed (5) hide show
  1. model.safetensors +1 -1
  2. optimizer.pt +1 -1
  3. rng_state.pth +1 -1
  4. scheduler.pt +1 -1
  5. trainer_state.json +31 -3
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5f04940d191d5116d1cdb84fb958d626c7cb6fe3561cc4e4a2aa5ef8b7c7b6ea
3
  size 1115283588
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef88acd7b940c0a42e85cb82aad1441811e9cad6a2a30dbe70b1e6dfd39899d4
3
  size 1115283588
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:685362a4e376c51d038de9536e01e7b5d486c3f469024975b5800d12f1d7d16a
3
  size 2230686277
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e95ab3a0e177ebef1a730ea6c25411246adf47a11f94abb1102b76fae92c729a
3
  size 2230686277
rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:42cd100366657e056c44ccf9126d34c08c902f596b2532bee723c91bd3220fa0
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de71cb290b64bc136ac49050f7bce13d74391577dd275bda3c8142bd03f8bfb1
3
  size 14575
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d157d941cae3d6318e2b951c2b5e3f17b9c66893c4c246690a1e90c216a8558f
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b6716fb4bc72b67621113830aa02a129248ffd9a4100203fff469ffeaeccbf5
3
  size 627
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 1.9327729940414429,
3
  "best_model_checkpoint": "./results/checkpoint-322",
4
- "epoch": 14.0,
5
  "eval_steps": 500,
6
- "global_step": 4508,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -215,6 +215,34 @@
215
  "eval_samples_per_second": 91.676,
216
  "eval_steps_per_second": 0.464,
217
  "step": 4508
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
218
  }
219
  ],
220
  "logging_steps": 500,
@@ -222,7 +250,7 @@
222
  "num_input_tokens_seen": 0,
223
  "num_train_epochs": 50,
224
  "save_steps": 500,
225
- "total_flos": 2.3718794212945306e+17,
226
  "train_batch_size": 200,
227
  "trial_name": null,
228
  "trial_params": null
 
1
  {
2
  "best_metric": 1.9327729940414429,
3
  "best_model_checkpoint": "./results/checkpoint-322",
4
+ "epoch": 16.0,
5
  "eval_steps": 500,
6
+ "global_step": 5152,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
215
  "eval_samples_per_second": 91.676,
216
  "eval_steps_per_second": 0.464,
217
  "step": 4508
218
+ },
219
+ {
220
+ "epoch": 15.0,
221
+ "eval_accuracy": 0.33707370737073705,
222
+ "eval_loss": 5.8459153175354,
223
+ "eval_precision": 0.3366756679639873,
224
+ "eval_recall": 0.33707370737073705,
225
+ "eval_runtime": 100.8652,
226
+ "eval_samples_per_second": 90.12,
227
+ "eval_steps_per_second": 0.456,
228
+ "step": 4830
229
+ },
230
+ {
231
+ "epoch": 15.53,
232
+ "learning_rate": 6.894409937888199e-05,
233
+ "loss": 0.0243,
234
+ "step": 5000
235
+ },
236
+ {
237
+ "epoch": 16.0,
238
+ "eval_accuracy": 0.35401540154015404,
239
+ "eval_loss": 5.645482540130615,
240
+ "eval_precision": 0.3631233149571772,
241
+ "eval_recall": 0.35401540154015404,
242
+ "eval_runtime": 99.6631,
243
+ "eval_samples_per_second": 91.207,
244
+ "eval_steps_per_second": 0.462,
245
+ "step": 5152
246
  }
247
  ],
248
  "logging_steps": 500,
 
250
  "num_input_tokens_seen": 0,
251
  "num_train_epochs": 50,
252
  "save_steps": 500,
253
+ "total_flos": 2.7107193386223206e+17,
254
  "train_batch_size": 200,
255
  "trial_name": null,
256
  "trial_params": null