Training in progress, step 13
Browse files- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/pytorch_model.bin +1 -1
- last-checkpoint/rng_state.pth +1 -1
- last-checkpoint/scaler.pt +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +27 -3
- pytorch_model.bin +1 -1
- runs/Jul19_18-03-38_47ad500bc002/events.out.tfevents.1689789837.47ad500bc002.2216.8 +2 -2
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1044539653
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5c7a59da2efa72379bcc54eca155c61485a34016dc472390837f7e6667e1f381
|
| 3 |
size 1044539653
|
last-checkpoint/pytorch_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 5018531153
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3c1829e1d9fe90b41ecbfccc04d70f06a21fb290a57b54fa1d7cdb906bac3a50
|
| 3 |
size 5018531153
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14575
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:512f018b467c169e2aa0e142ea191b73786d79604dace238e3d4834d1df266e8
|
| 3 |
size 14575
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 557
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5ecb4b4bc15e0509048b47d006eba35fc56dec209d6d90c42b552a5ead63d9d9
|
| 3 |
size 557
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 627
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:89ce2185c6877d072e8ca86c937358d8e8317963d32ce90379cdc35bd6460cdf
|
| 3 |
size 627
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -1,8 +1,8 @@
|
|
| 1 |
{
|
| 2 |
"best_metric": null,
|
| 3 |
"best_model_checkpoint": null,
|
| 4 |
-
"epoch":
|
| 5 |
-
"global_step":
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
|
@@ -60,11 +60,35 @@
|
|
| 60 |
"learning_rate": 0.0002,
|
| 61 |
"loss": 1.1174,
|
| 62 |
"step": 9
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 63 |
}
|
| 64 |
],
|
| 65 |
"max_steps": 500,
|
| 66 |
"num_train_epochs": 125,
|
| 67 |
-
"total_flos":
|
| 68 |
"trial_name": null,
|
| 69 |
"trial_params": null
|
| 70 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"best_metric": null,
|
| 3 |
"best_model_checkpoint": null,
|
| 4 |
+
"epoch": 3.25,
|
| 5 |
+
"global_step": 13,
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
|
|
|
| 60 |
"learning_rate": 0.0002,
|
| 61 |
"loss": 1.1174,
|
| 62 |
"step": 9
|
| 63 |
+
},
|
| 64 |
+
{
|
| 65 |
+
"epoch": 2.5,
|
| 66 |
+
"learning_rate": 0.0002,
|
| 67 |
+
"loss": 0.9802,
|
| 68 |
+
"step": 10
|
| 69 |
+
},
|
| 70 |
+
{
|
| 71 |
+
"epoch": 2.75,
|
| 72 |
+
"learning_rate": 0.0002,
|
| 73 |
+
"loss": 0.8965,
|
| 74 |
+
"step": 11
|
| 75 |
+
},
|
| 76 |
+
{
|
| 77 |
+
"epoch": 3.0,
|
| 78 |
+
"learning_rate": 0.0002,
|
| 79 |
+
"loss": 0.7951,
|
| 80 |
+
"step": 12
|
| 81 |
+
},
|
| 82 |
+
{
|
| 83 |
+
"epoch": 3.25,
|
| 84 |
+
"learning_rate": 0.0002,
|
| 85 |
+
"loss": 0.6422,
|
| 86 |
+
"step": 13
|
| 87 |
}
|
| 88 |
],
|
| 89 |
"max_steps": 500,
|
| 90 |
"num_train_epochs": 125,
|
| 91 |
+
"total_flos": 2168782279802880.0,
|
| 92 |
"trial_name": null,
|
| 93 |
"trial_params": null
|
| 94 |
}
|
pytorch_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 5018531153
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3c1829e1d9fe90b41ecbfccc04d70f06a21fb290a57b54fa1d7cdb906bac3a50
|
| 3 |
size 5018531153
|
runs/Jul19_18-03-38_47ad500bc002/events.out.tfevents.1689789837.47ad500bc002.2216.8
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:20ae9a3f24920171c22cccb9e05be58bfecabaa437ec9df242a7dd0a1a1bd2bf
|
| 3 |
+
size 6522
|