Training in progress, epoch 3, checkpoint
Browse files
last-checkpoint/adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 6403448
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8a618ef5cf269b6c1e073eb60bd9bcb6e6baaf9d63bac08e567e248237330824
|
| 3 |
size 6403448
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 12867066
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6a99a17d26069ea1b2300ddb31f582c86c1ffc96ba7d40a5bd87b7b9157de3d5
|
| 3 |
size 12867066
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:010dca2978871dd22e51ccf13e041ea95312e9e51a2d6bc8498d3840cd5050e5
|
| 3 |
size 14244
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:718198051aa9e8e989e25ac52095d0ce7b7daa6408cffd37d0553cc200763431
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -1,10 +1,10 @@
|
|
| 1 |
{
|
| 2 |
-
"best_global_step":
|
| 3 |
-
"best_metric": 5.
|
| 4 |
-
"best_model_checkpoint": "My-Nietzsche-Model/checkpoint-
|
| 5 |
-
"epoch":
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -24,6 +24,14 @@
|
|
| 24 |
"eval_samples_per_second": 3.211,
|
| 25 |
"eval_steps_per_second": 0.803,
|
| 26 |
"step": 26
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 27 |
}
|
| 28 |
],
|
| 29 |
"logging_steps": 500,
|
|
@@ -43,7 +51,7 @@
|
|
| 43 |
"attributes": {}
|
| 44 |
}
|
| 45 |
},
|
| 46 |
-
"total_flos":
|
| 47 |
"train_batch_size": 4,
|
| 48 |
"trial_name": null,
|
| 49 |
"trial_params": null
|
|
|
|
| 1 |
{
|
| 2 |
+
"best_global_step": 39,
|
| 3 |
+
"best_metric": 5.06503438949585,
|
| 4 |
+
"best_model_checkpoint": "My-Nietzsche-Model/checkpoint-39",
|
| 5 |
+
"epoch": 3.0,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 39,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 24 |
"eval_samples_per_second": 3.211,
|
| 25 |
"eval_steps_per_second": 0.803,
|
| 26 |
"step": 26
|
| 27 |
+
},
|
| 28 |
+
{
|
| 29 |
+
"epoch": 3.0,
|
| 30 |
+
"eval_loss": 5.06503438949585,
|
| 31 |
+
"eval_runtime": 6.173,
|
| 32 |
+
"eval_samples_per_second": 3.24,
|
| 33 |
+
"eval_steps_per_second": 0.81,
|
| 34 |
+
"step": 39
|
| 35 |
}
|
| 36 |
],
|
| 37 |
"logging_steps": 500,
|
|
|
|
| 51 |
"attributes": {}
|
| 52 |
}
|
| 53 |
},
|
| 54 |
+
"total_flos": 1870914893875200.0,
|
| 55 |
"train_batch_size": 4,
|
| 56 |
"trial_name": null,
|
| 57 |
"trial_params": null
|