msinghy committed on
Commit
f6b5eb1
·
verified ·
1 Parent(s): 7165271

Training in progress, epoch 4, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8a618ef5cf269b6c1e073eb60bd9bcb6e6baaf9d63bac08e567e248237330824
3
  size 6403448
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf7f1711371cdf22625cfd71373d0e13667f9262db729700ebba8bff281e302f
3
  size 6403448
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6a99a17d26069ea1b2300ddb31f582c86c1ffc96ba7d40a5bd87b7b9157de3d5
3
  size 12867066
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa22af2fc608eb3be5b6d7756926317b864996be333d25aedbb9e48d2d5bd10f
3
  size 12867066
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:010dca2978871dd22e51ccf13e041ea95312e9e51a2d6bc8498d3840cd5050e5
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a0a24216fd4977ce1d76fe035f83db58fced950e69f3285260aec3babc9a654
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:718198051aa9e8e989e25ac52095d0ce7b7daa6408cffd37d0553cc200763431
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:492f28b6539849c91c4a713593f718b0248ba49625b6a14592a3de84ad5d56c7
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 39,
3
- "best_metric": 5.06503438949585,
4
- "best_model_checkpoint": "My-Nietzsche-Model/checkpoint-39",
5
- "epoch": 3.0,
6
  "eval_steps": 500,
7
- "global_step": 39,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -32,6 +32,14 @@
32
  "eval_samples_per_second": 3.24,
33
  "eval_steps_per_second": 0.81,
34
  "step": 39
 
 
 
 
 
 
 
 
35
  }
36
  ],
37
  "logging_steps": 500,
@@ -51,7 +59,7 @@
51
  "attributes": {}
52
  }
53
  },
54
- "total_flos": 1870914893875200.0,
55
  "train_batch_size": 4,
56
  "trial_name": null,
57
  "trial_params": null
 
1
  {
2
+ "best_global_step": 52,
3
+ "best_metric": 5.0411696434021,
4
+ "best_model_checkpoint": "My-Nietzsche-Model/checkpoint-52",
5
+ "epoch": 4.0,
6
  "eval_steps": 500,
7
+ "global_step": 52,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
32
  "eval_samples_per_second": 3.24,
33
  "eval_steps_per_second": 0.81,
34
  "step": 39
35
+ },
36
+ {
37
+ "epoch": 4.0,
38
+ "eval_loss": 5.0411696434021,
39
+ "eval_runtime": 6.2271,
40
+ "eval_samples_per_second": 3.212,
41
+ "eval_steps_per_second": 0.803,
42
+ "step": 52
43
  }
44
  ],
45
  "logging_steps": 500,
 
59
  "attributes": {}
60
  }
61
  },
62
+ "total_flos": 2494553191833600.0,
63
  "train_batch_size": 4,
64
  "trial_name": null,
65
  "trial_params": null