Training in progress, step 45000
Browse files- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/pytorch_model.bin +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +63 -3
- pytorch_model.bin +1 -1
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 202193937
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:246faa74bee80665f358d5669008a0887cddb7b18e016fafe9dd7ea6316dd50e
|
| 3 |
size 202193937
|
last-checkpoint/pytorch_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 102501541
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:84e97a922c2788b9920a24141a5e48a7999f9bc8c2eff341a1e699714ef37106
|
| 3 |
size 102501541
|
last-checkpoint/rng_state_0.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14503
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:46dd8d4a8076e5a459a085df9fe23a5e0b6a3ba2a8db83be1492ad01e7ed9159
|
| 3 |
size 14503
|
last-checkpoint/rng_state_1.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14503
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:46dd8d4a8076e5a459a085df9fe23a5e0b6a3ba2a8db83be1492ad01e7ed9159
|
| 3 |
size 14503
|
last-checkpoint/rng_state_2.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14503
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:46dd8d4a8076e5a459a085df9fe23a5e0b6a3ba2a8db83be1492ad01e7ed9159
|
| 3 |
size 14503
|
last-checkpoint/rng_state_3.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14503
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:46dd8d4a8076e5a459a085df9fe23a5e0b6a3ba2a8db83be1492ad01e7ed9159
|
| 3 |
size 14503
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 623
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3b42368e9f62da349b2760579f9deddc87fbe7062743f1048a9d6bf6e1d86f64
|
| 3 |
size 623
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -1,8 +1,8 @@
|
|
| 1 |
{
|
| 2 |
"best_metric": null,
|
| 3 |
"best_model_checkpoint": null,
|
| 4 |
-
"epoch": 0.
|
| 5 |
-
"global_step":
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
|
@@ -486,11 +486,71 @@
|
|
| 486 |
"learning_rate": 1.4975414512725056e-05,
|
| 487 |
"loss": 0.0519,
|
| 488 |
"step": 40000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 489 |
}
|
| 490 |
],
|
| 491 |
"max_steps": 500000,
|
| 492 |
"num_train_epochs": 8,
|
| 493 |
-
"total_flos":
|
| 494 |
"trial_name": null,
|
| 495 |
"trial_params": null
|
| 496 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"best_metric": null,
|
| 3 |
"best_model_checkpoint": null,
|
| 4 |
+
"epoch": 0.689364635594194,
|
| 5 |
+
"global_step": 45000,
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
|
|
|
| 486 |
"learning_rate": 1.4975414512725056e-05,
|
| 487 |
"loss": 0.0519,
|
| 488 |
"step": 40000
|
| 489 |
+
},
|
| 490 |
+
{
|
| 491 |
+
"epoch": 0.62,
|
| 492 |
+
"learning_rate": 1.4973749622593532e-05,
|
| 493 |
+
"loss": 0.0518,
|
| 494 |
+
"step": 40500
|
| 495 |
+
},
|
| 496 |
+
{
|
| 497 |
+
"epoch": 0.63,
|
| 498 |
+
"learning_rate": 1.4972030340333e-05,
|
| 499 |
+
"loss": 0.0517,
|
| 500 |
+
"step": 41000
|
| 501 |
+
},
|
| 502 |
+
{
|
| 503 |
+
"epoch": 0.64,
|
| 504 |
+
"learning_rate": 1.4970256684745257e-05,
|
| 505 |
+
"loss": 0.0516,
|
| 506 |
+
"step": 41500
|
| 507 |
+
},
|
| 508 |
+
{
|
| 509 |
+
"epoch": 0.64,
|
| 510 |
+
"learning_rate": 1.4968428675226714e-05,
|
| 511 |
+
"loss": 0.0516,
|
| 512 |
+
"step": 42000
|
| 513 |
+
},
|
| 514 |
+
{
|
| 515 |
+
"epoch": 0.65,
|
| 516 |
+
"learning_rate": 1.4966546331768191e-05,
|
| 517 |
+
"loss": 0.0515,
|
| 518 |
+
"step": 42500
|
| 519 |
+
},
|
| 520 |
+
{
|
| 521 |
+
"epoch": 0.66,
|
| 522 |
+
"learning_rate": 1.4964609674954694e-05,
|
| 523 |
+
"loss": 0.0514,
|
| 524 |
+
"step": 43000
|
| 525 |
+
},
|
| 526 |
+
{
|
| 527 |
+
"epoch": 0.67,
|
| 528 |
+
"learning_rate": 1.4962618725965194e-05,
|
| 529 |
+
"loss": 0.0512,
|
| 530 |
+
"step": 43500
|
| 531 |
+
},
|
| 532 |
+
{
|
| 533 |
+
"epoch": 0.67,
|
| 534 |
+
"learning_rate": 1.496057350657239e-05,
|
| 535 |
+
"loss": 0.051,
|
| 536 |
+
"step": 44000
|
| 537 |
+
},
|
| 538 |
+
{
|
| 539 |
+
"epoch": 0.68,
|
| 540 |
+
"learning_rate": 1.4958474039142468e-05,
|
| 541 |
+
"loss": 0.0509,
|
| 542 |
+
"step": 44500
|
| 543 |
+
},
|
| 544 |
+
{
|
| 545 |
+
"epoch": 0.69,
|
| 546 |
+
"learning_rate": 1.4956320346634877e-05,
|
| 547 |
+
"loss": 0.0507,
|
| 548 |
+
"step": 45000
|
| 549 |
}
|
| 550 |
],
|
| 551 |
"max_steps": 500000,
|
| 552 |
"num_train_epochs": 8,
|
| 553 |
+
"total_flos": 7.18846062242625e+20,
|
| 554 |
"trial_name": null,
|
| 555 |
"trial_params": null
|
| 556 |
}
|
pytorch_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 102501541
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:84e97a922c2788b9920a24141a5e48a7999f9bc8c2eff341a1e699714ef37106
|
| 3 |
size 102501541
|