johannes-garstenauer commited on
Commit
6dab8bb
·
1 Parent(s): 890a9fc

Training in progress, step 12, checkpoint

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e5a2921d652e04475b2582b874f40efe10202f7e752cf8e6bf772c80fa36293c
3
  size 532568837
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bccd47a596f0e43bb0c809a1c3febda05c119b173b251dc10b0aabd3dc10e31d
3
  size 532568837
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:627ab678b05d1d840ef3d0714b93cb9c171cb0a2d785cdcc0516f7df3a027a3b
3
  size 266276525
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c5e72d3cd80888d9fc94cb7b08c79ce79570b417e9058372ff428c729b744ed
3
  size 266276525
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e06a947d6fc15c8a25160dd61856cbc1c96ea1dea26f5686402c76b0bea68e06
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ec42316ae917e112d26281400ad1e9ce2c3fa0e3a8ca2b12b69194231d70a41
3
  size 14575
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:00ee2dafdbb84ea87e7c1219a1c24c93068f181ae377a958d250f16672213757
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa0b72c7e600fbfa81cd2eb092188fa9ace6d764140d4fb121c3e9a7ee4ebee0
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,47 +1,18 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.732142857142857,
5
  "eval_steps": 500,
6
- "global_step": 612,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
- "log_history": [
11
- {
12
- "epoch": 1.0,
13
- "eval_accuracy": {
14
- "accuracy": 0.9920424403183024
15
- },
16
- "eval_loss": 0.03427809104323387,
17
- "eval_runtime": 4.2982,
18
- "eval_samples_per_second": 175.424,
19
- "eval_steps_per_second": 2.792,
20
- "step": 224
21
- },
22
- {
23
- "epoch": 2.0,
24
- "eval_accuracy": {
25
- "accuracy": 0.993368700265252
26
- },
27
- "eval_loss": 0.034899961203336716,
28
- "eval_runtime": 4.4313,
29
- "eval_samples_per_second": 170.152,
30
- "eval_steps_per_second": 2.708,
31
- "step": 448
32
- },
33
- {
34
- "epoch": 2.23,
35
- "learning_rate": 1.2797619047619047e-05,
36
- "loss": 0.0858,
37
- "step": 500
38
- }
39
- ],
40
  "logging_steps": 500,
41
- "max_steps": 672,
42
- "num_train_epochs": 3,
43
- "save_steps": 34,
44
- "total_flos": 5184786423674880.0,
45
  "trial_name": null,
46
  "trial_params": null
47
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.05357142857142857,
5
  "eval_steps": 500,
6
+ "global_step": 12,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
+ "log_history": [],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
11
  "logging_steps": 500,
12
+ "max_steps": 224,
13
+ "num_train_epochs": 1,
14
+ "save_steps": 12,
15
+ "total_flos": 101740405063680.0,
16
  "trial_name": null,
17
  "trial_params": null
18
  }
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:27bd36ee6c5a9e7bb0ca2b91a86693810b4c7de03801bdf0efc717497e63e1e8
3
  size 4155
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd7496b3d888ccc8e86cf6dd63842a0e206390f90d78af2e46aafaebdb45a7cb
3
  size 4155