HiAmNear committed on
Commit
60de2a7
·
verified ·
1 Parent(s): c3677f7

Training in progress, epoch 2, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d93af6b070094148dfc3c2004e4aec24e25586fe06b45e8796b998d8cc7e2a2a
3
  size 2239647372
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24d5dff093a432a5eb5282bfdd86ae2416dc3aca3ae2dcf7c7b93bb828742254
3
  size 2239647372
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8df875358177620549416ae8cd21a4bf769c228af9cbdb8dcc84dbbfe4d45452
3
  size 4479530129
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1bb2d041b144809f2caa73323e0b7cc022dc2d5ebdcfd1b8e7590657d984df7e
3
  size 4479530129
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:474ed59e44a96690485aa267e28741f930f12c408ee6a6090faf325b2090550e
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a105e433a7700673c26b9c7278261e31311e890567b4f9e7e49a5b2f356e0cf
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:da70d674c7df75d777418290e3779cdd654b083cf22d636cc438f1a0580aa29d
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e6a8b78b43d8a7789266e20d2a66bd79cbd8d65e3b2aaa76564d25b3082924d
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.4931787175989086,
3
- "best_model_checkpoint": "../../modelParams/TrainingArguments_output\\checkpoint-182",
4
- "epoch": 1.9911262798634812,
5
  "eval_steps": 500,
6
- "global_step": 182,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -25,6 +25,15 @@
25
  "eval_samples_per_second": 4.95,
26
  "eval_steps_per_second": 1.239,
27
  "step": 182
 
 
 
 
 
 
 
 
 
28
  }
29
  ],
30
  "logging_steps": 500,
@@ -44,7 +53,7 @@
44
  "attributes": {}
45
  }
46
  },
47
- "total_flos": 1.088521576955904e+16,
48
  "train_batch_size": 4,
49
  "trial_name": null,
50
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.5068212824010914,
3
+ "best_model_checkpoint": "../../modelParams/TrainingArguments_output\\checkpoint-273",
4
+ "epoch": 2.98839590443686,
5
  "eval_steps": 500,
6
+ "global_step": 273,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
25
  "eval_samples_per_second": 4.95,
26
  "eval_steps_per_second": 1.239,
27
  "step": 182
28
+ },
29
+ {
30
+ "epoch": 2.98839590443686,
31
+ "eval_accuracy": 0.5068212824010914,
32
+ "eval_loss": 1.3609565496444702,
33
+ "eval_runtime": 297.4155,
34
+ "eval_samples_per_second": 4.929,
35
+ "eval_steps_per_second": 1.234,
36
+ "step": 273
37
  }
38
  ],
39
  "logging_steps": 500,
 
53
  "attributes": {}
54
  }
55
  },
56
+ "total_flos": 1.632782365433856e+16,
57
  "train_batch_size": 4,
58
  "trial_name": null,
59
  "trial_params": null