Training in progress, epoch 0, checkpoint
Browse files- last-checkpoint/adapter_model.safetensors +1 -1
- last-checkpoint/global_step200/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step200/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step200/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step200/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step200/mp_rank_00_model_states.pt +3 -0
- last-checkpoint/latest +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +169 -3
last-checkpoint/adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 431331112
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aee538636744e0acbe2239a943ad435e5614264522618ad93fab75142dd2ec13
|
| 3 |
size 431331112
|
last-checkpoint/global_step200/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6ccc451fc82781f109bb7c16f02dbb15a7f815a88c9ae16090b0e4a6948306fd
|
| 3 |
+
size 325177765
|
last-checkpoint/global_step200/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7fa03c7035ce362f4a36232a00d556316b0470c05122c1ef9070f16cca2e710b
|
| 3 |
+
size 325177765
|
last-checkpoint/global_step200/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e65a63a4b0dc1db26d7f33c1e837810aa366c61c33a053879e3e05dd1a80b741
|
| 3 |
+
size 325177765
|
last-checkpoint/global_step200/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:266655c35b3c6c6d27d4702e03e32041a3c2dc2265eec4453ab2bdd297c3b732
|
| 3 |
+
size 325177765
|
last-checkpoint/global_step200/mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:26588628f6cd900302e44e8309320238d062e557c38863d5c4517ee078bbd7e0
|
| 3 |
+
size 431463321
|
last-checkpoint/latest
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
|
|
|
|
| 1 |
+
global_step200
|
last-checkpoint/rng_state_0.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15429
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:81d5f83aeb4b3f559bd28377336d47659b320e7f6ef2e5a723d284716278a151
|
| 3 |
size 15429
|
last-checkpoint/rng_state_1.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15429
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2626437dcb133ffcf003ac89603f8cce07459b93a98d760cd9419e0d6a994067
|
| 3 |
size 15429
|
last-checkpoint/rng_state_2.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15429
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ae777e24d50cb7159634e1245f0697ba0fc64d5b26d535f2c80e411371a90b1c
|
| 3 |
size 15429
|
last-checkpoint/rng_state_3.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15429
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:afc5a67564eebcfc961e8f1406a7418cc73497c2935a39af0232ef59f8153a6a
|
| 3 |
size 15429
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1401
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:61cf7a6562a1b537ed732fd397b8f4fbad25c227aed55701c0cfe78f176c42d9
|
| 3 |
size 1401
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -1,10 +1,10 @@
|
|
| 1 |
{
|
| 2 |
"best_global_step": null,
|
| 3 |
-
"best_metric": 0.
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 50,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -506,6 +506,172 @@
|
|
| 506 |
"eval_samples_per_second": 44.338,
|
| 507 |
"eval_steps_per_second": 0.353,
|
| 508 |
"step": 150
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 509 |
}
|
| 510 |
],
|
| 511 |
"logging_steps": 5,
|
|
|
|
| 1 |
{
|
| 2 |
"best_global_step": null,
|
| 3 |
+
"best_metric": 0.05630422756075859,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.12987012987012986,
|
| 6 |
"eval_steps": 50,
|
| 7 |
+
"global_step": 200,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 506 |
"eval_samples_per_second": 44.338,
|
| 507 |
"eval_steps_per_second": 0.353,
|
| 508 |
"step": 150
|
| 509 |
+
},
|
| 510 |
+
{
|
| 511 |
+
"epoch": 0.10064935064935066,
|
| 512 |
+
"grad_norm": 0.891044557094574,
|
| 513 |
+
"learning_rate": 0.00011565544706162286,
|
| 514 |
+
"logits/chosen": 6.451029300689697,
|
| 515 |
+
"logits/rejected": 7.018620491027832,
|
| 516 |
+
"logps/chosen": -318.9430236816406,
|
| 517 |
+
"logps/rejected": -354.2622985839844,
|
| 518 |
+
"loss": 0.077,
|
| 519 |
+
"rewards/accuracies": 0.96875,
|
| 520 |
+
"rewards/chosen": -2.790806293487549,
|
| 521 |
+
"rewards/margins": 10.650590896606445,
|
| 522 |
+
"rewards/rejected": -13.441396713256836,
|
| 523 |
+
"step": 155
|
| 524 |
+
},
|
| 525 |
+
{
|
| 526 |
+
"epoch": 0.1038961038961039,
|
| 527 |
+
"grad_norm": 1.011932134628296,
|
| 528 |
+
"learning_rate": 0.00011565380196097788,
|
| 529 |
+
"logits/chosen": 6.38694953918457,
|
| 530 |
+
"logits/rejected": 6.985430717468262,
|
| 531 |
+
"logps/chosen": -305.1867370605469,
|
| 532 |
+
"logps/rejected": -316.77239990234375,
|
| 533 |
+
"loss": 0.0743,
|
| 534 |
+
"rewards/accuracies": 0.96875,
|
| 535 |
+
"rewards/chosen": -1.8528194427490234,
|
| 536 |
+
"rewards/margins": 8.657999038696289,
|
| 537 |
+
"rewards/rejected": -10.510818481445312,
|
| 538 |
+
"step": 160
|
| 539 |
+
},
|
| 540 |
+
{
|
| 541 |
+
"epoch": 0.10714285714285714,
|
| 542 |
+
"grad_norm": 1.1229149103164673,
|
| 543 |
+
"learning_rate": 0.00011565201129393704,
|
| 544 |
+
"logits/chosen": 6.276331424713135,
|
| 545 |
+
"logits/rejected": 6.919455051422119,
|
| 546 |
+
"logps/chosen": -323.6394348144531,
|
| 547 |
+
"logps/rejected": -360.06695556640625,
|
| 548 |
+
"loss": 0.0711,
|
| 549 |
+
"rewards/accuracies": 0.9703124761581421,
|
| 550 |
+
"rewards/chosen": -3.3554577827453613,
|
| 551 |
+
"rewards/margins": 9.554231643676758,
|
| 552 |
+
"rewards/rejected": -12.909688949584961,
|
| 553 |
+
"step": 165
|
| 554 |
+
},
|
| 555 |
+
{
|
| 556 |
+
"epoch": 0.11038961038961038,
|
| 557 |
+
"grad_norm": 0.8342244029045105,
|
| 558 |
+
"learning_rate": 0.00011565007506500828,
|
| 559 |
+
"logits/chosen": 5.989048957824707,
|
| 560 |
+
"logits/rejected": 6.676814079284668,
|
| 561 |
+
"logps/chosen": -304.5875549316406,
|
| 562 |
+
"logps/rejected": -326.0283203125,
|
| 563 |
+
"loss": 0.0981,
|
| 564 |
+
"rewards/accuracies": 0.9703124761581421,
|
| 565 |
+
"rewards/chosen": -1.7597744464874268,
|
| 566 |
+
"rewards/margins": 8.476037979125977,
|
| 567 |
+
"rewards/rejected": -10.235812187194824,
|
| 568 |
+
"step": 170
|
| 569 |
+
},
|
| 570 |
+
{
|
| 571 |
+
"epoch": 0.11363636363636363,
|
| 572 |
+
"grad_norm": 0.7202894687652588,
|
| 573 |
+
"learning_rate": 0.0001156479932790661,
|
| 574 |
+
"logits/chosen": 6.15761661529541,
|
| 575 |
+
"logits/rejected": 6.778907775878906,
|
| 576 |
+
"logps/chosen": -302.4050598144531,
|
| 577 |
+
"logps/rejected": -324.09765625,
|
| 578 |
+
"loss": 0.0923,
|
| 579 |
+
"rewards/accuracies": 0.9703124761581421,
|
| 580 |
+
"rewards/chosen": -0.7549916505813599,
|
| 581 |
+
"rewards/margins": 8.769140243530273,
|
| 582 |
+
"rewards/rejected": -9.524131774902344,
|
| 583 |
+
"step": 175
|
| 584 |
+
},
|
| 585 |
+
{
|
| 586 |
+
"epoch": 0.11688311688311688,
|
| 587 |
+
"grad_norm": 0.753760576248169,
|
| 588 |
+
"learning_rate": 0.00011564576594135137,
|
| 589 |
+
"logits/chosen": 6.395578384399414,
|
| 590 |
+
"logits/rejected": 7.083353519439697,
|
| 591 |
+
"logps/chosen": -313.22186279296875,
|
| 592 |
+
"logps/rejected": -348.41339111328125,
|
| 593 |
+
"loss": 0.0507,
|
| 594 |
+
"rewards/accuracies": 0.9828125238418579,
|
| 595 |
+
"rewards/chosen": -3.535522937774658,
|
| 596 |
+
"rewards/margins": 8.79172420501709,
|
| 597 |
+
"rewards/rejected": -12.327247619628906,
|
| 598 |
+
"step": 180
|
| 599 |
+
},
|
| 600 |
+
{
|
| 601 |
+
"epoch": 0.12012987012987013,
|
| 602 |
+
"grad_norm": 0.6927999258041382,
|
| 603 |
+
"learning_rate": 0.00011564339305747142,
|
| 604 |
+
"logits/chosen": 6.240847587585449,
|
| 605 |
+
"logits/rejected": 6.926623344421387,
|
| 606 |
+
"logps/chosen": -318.8568420410156,
|
| 607 |
+
"logps/rejected": -346.41680908203125,
|
| 608 |
+
"loss": 0.053,
|
| 609 |
+
"rewards/accuracies": 0.981249988079071,
|
| 610 |
+
"rewards/chosen": -3.0302348136901855,
|
| 611 |
+
"rewards/margins": 10.297189712524414,
|
| 612 |
+
"rewards/rejected": -13.327425003051758,
|
| 613 |
+
"step": 185
|
| 614 |
+
},
|
| 615 |
+
{
|
| 616 |
+
"epoch": 0.12337662337662338,
|
| 617 |
+
"grad_norm": 0.2692127227783203,
|
| 618 |
+
"learning_rate": 0.00011564087463339999,
|
| 619 |
+
"logits/chosen": 5.879881858825684,
|
| 620 |
+
"logits/rejected": 6.644034385681152,
|
| 621 |
+
"logps/chosen": -300.416259765625,
|
| 622 |
+
"logps/rejected": -339.57037353515625,
|
| 623 |
+
"loss": 0.0423,
|
| 624 |
+
"rewards/accuracies": 0.981249988079071,
|
| 625 |
+
"rewards/chosen": -1.8148984909057617,
|
| 626 |
+
"rewards/margins": 9.979120254516602,
|
| 627 |
+
"rewards/rejected": -11.794018745422363,
|
| 628 |
+
"step": 190
|
| 629 |
+
},
|
| 630 |
+
{
|
| 631 |
+
"epoch": 0.1266233766233766,
|
| 632 |
+
"grad_norm": 0.7986512184143066,
|
| 633 |
+
"learning_rate": 0.0001156382106754772,
|
| 634 |
+
"logits/chosen": 5.803470611572266,
|
| 635 |
+
"logits/rejected": 6.645857334136963,
|
| 636 |
+
"logps/chosen": -310.81170654296875,
|
| 637 |
+
"logps/rejected": -348.056396484375,
|
| 638 |
+
"loss": 0.0403,
|
| 639 |
+
"rewards/accuracies": 0.989062488079071,
|
| 640 |
+
"rewards/chosen": -2.6157710552215576,
|
| 641 |
+
"rewards/margins": 10.561070442199707,
|
| 642 |
+
"rewards/rejected": -13.176841735839844,
|
| 643 |
+
"step": 195
|
| 644 |
+
},
|
| 645 |
+
{
|
| 646 |
+
"epoch": 0.12987012987012986,
|
| 647 |
+
"grad_norm": 0.7699182629585266,
|
| 648 |
+
"learning_rate": 0.00011563540119040956,
|
| 649 |
+
"logits/chosen": 6.0391011238098145,
|
| 650 |
+
"logits/rejected": 6.851220607757568,
|
| 651 |
+
"logps/chosen": -306.738525390625,
|
| 652 |
+
"logps/rejected": -371.85369873046875,
|
| 653 |
+
"loss": 0.0557,
|
| 654 |
+
"rewards/accuracies": 0.9828125238418579,
|
| 655 |
+
"rewards/chosen": -1.9803781509399414,
|
| 656 |
+
"rewards/margins": 12.751678466796875,
|
| 657 |
+
"rewards/rejected": -14.732057571411133,
|
| 658 |
+
"step": 200
|
| 659 |
+
},
|
| 660 |
+
{
|
| 661 |
+
"epoch": 0.12987012987012986,
|
| 662 |
+
"eval_logits/chosen": 6.243391513824463,
|
| 663 |
+
"eval_logits/rejected": 6.946824073791504,
|
| 664 |
+
"eval_logps/chosen": -326.7683410644531,
|
| 665 |
+
"eval_logps/rejected": -375.8028259277344,
|
| 666 |
+
"eval_loss": 0.05630422756075859,
|
| 667 |
+
"eval_rewards/accuracies": 0.9780886769294739,
|
| 668 |
+
"eval_rewards/chosen": -4.148531913757324,
|
| 669 |
+
"eval_rewards/margins": 11.36646842956543,
|
| 670 |
+
"eval_rewards/rejected": -15.515000343322754,
|
| 671 |
+
"eval_runtime": 133.2954,
|
| 672 |
+
"eval_samples_per_second": 44.338,
|
| 673 |
+
"eval_steps_per_second": 0.353,
|
| 674 |
+
"step": 200
|
| 675 |
}
|
| 676 |
],
|
| 677 |
"logging_steps": 5,
|