msinghy committed on
Commit
384de55
·
verified ·
1 Parent(s): 91a9fcf

Training in progress, epoch 3, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8ba2f487423f3ee403b2b9cdb4410a466f0cfdb517e419c5c9a80cb48c89a3db
3
  size 6403448
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a618ef5cf269b6c1e073eb60bd9bcb6e6baaf9d63bac08e567e248237330824
3
  size 6403448
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:15eae082e01864f410ba2f95b77b0ebd570f80467f63f7660dd0f19a4ab71015
3
  size 12867066
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a99a17d26069ea1b2300ddb31f582c86c1ffc96ba7d40a5bd87b7b9157de3d5
3
  size 12867066
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0cf172885e90853de4ff46d2054e9b24daa1c6a6ad504c5b28bcf6f9d1bef903
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:010dca2978871dd22e51ccf13e041ea95312e9e51a2d6bc8498d3840cd5050e5
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c2fd4b24a386a8e80db11b364387d0eebec81beeabc63133ccb6bc22dfcfddf0
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:718198051aa9e8e989e25ac52095d0ce7b7daa6408cffd37d0553cc200763431
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 26,
3
- "best_metric": 5.1018967628479,
4
- "best_model_checkpoint": "My-Nietzsche-Model/checkpoint-26",
5
- "epoch": 2.0,
6
  "eval_steps": 500,
7
- "global_step": 26,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -24,6 +24,14 @@
24
  "eval_samples_per_second": 3.211,
25
  "eval_steps_per_second": 0.803,
26
  "step": 26
 
 
 
 
 
 
 
 
27
  }
28
  ],
29
  "logging_steps": 500,
@@ -43,7 +51,7 @@
43
  "attributes": {}
44
  }
45
  },
46
- "total_flos": 1247276595916800.0,
47
  "train_batch_size": 4,
48
  "trial_name": null,
49
  "trial_params": null
 
1
  {
2
+ "best_global_step": 39,
3
+ "best_metric": 5.06503438949585,
4
+ "best_model_checkpoint": "My-Nietzsche-Model/checkpoint-39",
5
+ "epoch": 3.0,
6
  "eval_steps": 500,
7
+ "global_step": 39,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
24
  "eval_samples_per_second": 3.211,
25
  "eval_steps_per_second": 0.803,
26
  "step": 26
27
+ },
28
+ {
29
+ "epoch": 3.0,
30
+ "eval_loss": 5.06503438949585,
31
+ "eval_runtime": 6.173,
32
+ "eval_samples_per_second": 3.24,
33
+ "eval_steps_per_second": 0.81,
34
+ "step": 39
35
  }
36
  ],
37
  "logging_steps": 500,
 
51
  "attributes": {}
52
  }
53
  },
54
+ "total_flos": 1870914893875200.0,
55
  "train_batch_size": 4,
56
  "trial_name": null,
57
  "trial_params": null