Training in progress, epoch 0, checkpoint
Browse files- last-checkpoint/adapter_model.safetensors +1 -1
- last-checkpoint/global_step200/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step200/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step200/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step200/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step200/mp_rank_00_model_states.pt +3 -0
- last-checkpoint/latest +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +169 -3
last-checkpoint/adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1172343536
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5c7d696805c33619b84f2fedbcdd5a68607d7306abf5dbf4533f634e4982f5c8
|
| 3 |
size 1172343536
|
last-checkpoint/global_step200/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cf16ed368a600d277fefa127eb7bd51d4425d02c1295916f8e6dabd62576a579
|
| 3 |
+
size 883824229
|
last-checkpoint/global_step200/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e7b683aadce016b516f68c28a00f6dec6a4b48f3461e2b15e7485cdc143b6ad6
|
| 3 |
+
size 883824293
|
last-checkpoint/global_step200/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4bc266731f510a3524e59f5c44e8e4f88929d533de5658ef8f53f3dc06c2228e
|
| 3 |
+
size 883824293
|
last-checkpoint/global_step200/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a9611a34df5478b6c4f3853f043ba4c2f69d27ef6010e32a7a94a8fcdd0d346f
|
| 3 |
+
size 883824293
|
last-checkpoint/global_step200/mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8529c0392fe7f20dafe3c781e6ef68c62b7fbc32a4c2150c61a180b83c64c208
|
| 3 |
+
size 1172522073
|
last-checkpoint/latest
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
|
|
|
|
| 1 |
+
global_step200
|
last-checkpoint/rng_state_0.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15429
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:81d5f83aeb4b3f559bd28377336d47659b320e7f6ef2e5a723d284716278a151
|
| 3 |
size 15429
|
last-checkpoint/rng_state_1.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15429
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2626437dcb133ffcf003ac89603f8cce07459b93a98d760cd9419e0d6a994067
|
| 3 |
size 15429
|
last-checkpoint/rng_state_2.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15429
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ae777e24d50cb7159634e1245f0697ba0fc64d5b26d535f2c80e411371a90b1c
|
| 3 |
size 15429
|
last-checkpoint/rng_state_3.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15429
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:afc5a67564eebcfc961e8f1406a7418cc73497c2935a39af0232ef59f8153a6a
|
| 3 |
size 15429
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1401
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:331d42834d40f6ab9fe0c79a5f67902cd952ec456fbe0c511bb4b4fc0a7cf69b
|
| 3 |
size 1401
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -1,10 +1,10 @@
|
|
| 1 |
{
|
| 2 |
"best_global_step": null,
|
| 3 |
-
"best_metric": 0.
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 50,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -506,6 +506,172 @@
|
|
| 506 |
"eval_samples_per_second": 45.285,
|
| 507 |
"eval_steps_per_second": 2.838,
|
| 508 |
"step": 150
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 509 |
}
|
| 510 |
],
|
| 511 |
"logging_steps": 5,
|
|
|
|
| 1 |
{
|
| 2 |
"best_global_step": null,
|
| 3 |
+
"best_metric": 0.06463618576526642,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.1737242128121607,
|
| 6 |
"eval_steps": 50,
|
| 7 |
+
"global_step": 200,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 506 |
"eval_samples_per_second": 45.285,
|
| 507 |
"eval_steps_per_second": 2.838,
|
| 508 |
"step": 150
|
| 509 |
+
},
|
| 510 |
+
{
|
| 511 |
+
"epoch": 0.13463626492942454,
|
| 512 |
+
"grad_norm": 0.9481019973754883,
|
| 513 |
+
"learning_rate": 2.5988917234452568e-05,
|
| 514 |
+
"logits/chosen": -0.7090820074081421,
|
| 515 |
+
"logits/rejected": -1.00244140625,
|
| 516 |
+
"logps/chosen": -95.23750305175781,
|
| 517 |
+
"logps/rejected": -174.4250030517578,
|
| 518 |
+
"loss": 0.0439,
|
| 519 |
+
"rewards/accuracies": 0.9859374761581421,
|
| 520 |
+
"rewards/chosen": -1.6262695789337158,
|
| 521 |
+
"rewards/margins": 9.666406631469727,
|
| 522 |
+
"rewards/rejected": -11.287500381469727,
|
| 523 |
+
"step": 155
|
| 524 |
+
},
|
| 525 |
+
{
|
| 526 |
+
"epoch": 0.13897937024972856,
|
| 527 |
+
"grad_norm": 3.119917392730713,
|
| 528 |
+
"learning_rate": 2.598854756414658e-05,
|
| 529 |
+
"logits/chosen": -0.706250011920929,
|
| 530 |
+
"logits/rejected": -1.006445288658142,
|
| 531 |
+
"logps/chosen": -100.73750305175781,
|
| 532 |
+
"logps/rejected": -195.52499389648438,
|
| 533 |
+
"loss": 0.0753,
|
| 534 |
+
"rewards/accuracies": 0.973437488079071,
|
| 535 |
+
"rewards/chosen": -2.6958985328674316,
|
| 536 |
+
"rewards/margins": 12.09375,
|
| 537 |
+
"rewards/rejected": -14.793749809265137,
|
| 538 |
+
"step": 160
|
| 539 |
+
},
|
| 540 |
+
{
|
| 541 |
+
"epoch": 0.14332247557003258,
|
| 542 |
+
"grad_norm": 2.0484530925750732,
|
| 543 |
+
"learning_rate": 2.5988145183638775e-05,
|
| 544 |
+
"logits/chosen": -0.687695324420929,
|
| 545 |
+
"logits/rejected": -0.9659179449081421,
|
| 546 |
+
"logps/chosen": -99.67500305175781,
|
| 547 |
+
"logps/rejected": -186.60000610351562,
|
| 548 |
+
"loss": 0.08,
|
| 549 |
+
"rewards/accuracies": 0.973437488079071,
|
| 550 |
+
"rewards/chosen": -2.467578172683716,
|
| 551 |
+
"rewards/margins": 11.5,
|
| 552 |
+
"rewards/rejected": -13.967187881469727,
|
| 553 |
+
"step": 165
|
| 554 |
+
},
|
| 555 |
+
{
|
| 556 |
+
"epoch": 0.1476655808903366,
|
| 557 |
+
"grad_norm": 1.163669228553772,
|
| 558 |
+
"learning_rate": 2.598771009394214e-05,
|
| 559 |
+
"logits/chosen": -0.692333996295929,
|
| 560 |
+
"logits/rejected": -1.009374976158142,
|
| 561 |
+
"logps/chosen": -92.625,
|
| 562 |
+
"logps/rejected": -175.4875030517578,
|
| 563 |
+
"loss": 0.0796,
|
| 564 |
+
"rewards/accuracies": 0.9765625,
|
| 565 |
+
"rewards/chosen": -1.3732726573944092,
|
| 566 |
+
"rewards/margins": 10.21484375,
|
| 567 |
+
"rewards/rejected": -11.586718559265137,
|
| 568 |
+
"step": 170
|
| 569 |
+
},
|
| 570 |
+
{
|
| 571 |
+
"epoch": 0.15200868621064062,
|
| 572 |
+
"grad_norm": 1.496293067932129,
|
| 573 |
+
"learning_rate": 2.5987242296152015e-05,
|
| 574 |
+
"logits/chosen": -0.6812499761581421,
|
| 575 |
+
"logits/rejected": -1.025781273841858,
|
| 576 |
+
"logps/chosen": -89.7874984741211,
|
| 577 |
+
"logps/rejected": -173.60000610351562,
|
| 578 |
+
"loss": 0.0515,
|
| 579 |
+
"rewards/accuracies": 0.979687511920929,
|
| 580 |
+
"rewards/chosen": -0.5631958246231079,
|
| 581 |
+
"rewards/margins": 10.517969131469727,
|
| 582 |
+
"rewards/rejected": -11.086718559265137,
|
| 583 |
+
"step": 175
|
| 584 |
+
},
|
| 585 |
+
{
|
| 586 |
+
"epoch": 0.1563517915309446,
|
| 587 |
+
"grad_norm": 0.6427134871482849,
|
| 588 |
+
"learning_rate": 2.598674179144608e-05,
|
| 589 |
+
"logits/chosen": -0.731152355670929,
|
| 590 |
+
"logits/rejected": -1.055761694908142,
|
| 591 |
+
"logps/chosen": -101.48750305175781,
|
| 592 |
+
"logps/rejected": -194.52499389648438,
|
| 593 |
+
"loss": 0.0468,
|
| 594 |
+
"rewards/accuracies": 0.984375,
|
| 595 |
+
"rewards/chosen": -2.1346678733825684,
|
| 596 |
+
"rewards/margins": 11.561718940734863,
|
| 597 |
+
"rewards/rejected": -13.701562881469727,
|
| 598 |
+
"step": 180
|
| 599 |
+
},
|
| 600 |
+
{
|
| 601 |
+
"epoch": 0.16069489685124863,
|
| 602 |
+
"grad_norm": 3.4019172191619873,
|
| 603 |
+
"learning_rate": 2.598620858108436e-05,
|
| 604 |
+
"logits/chosen": -0.7110351324081421,
|
| 605 |
+
"logits/rejected": -1.060156226158142,
|
| 606 |
+
"logps/chosen": -105.51249694824219,
|
| 607 |
+
"logps/rejected": -198.5,
|
| 608 |
+
"loss": 0.072,
|
| 609 |
+
"rewards/accuracies": 0.9750000238418579,
|
| 610 |
+
"rewards/chosen": -3.612109422683716,
|
| 611 |
+
"rewards/margins": 12.0703125,
|
| 612 |
+
"rewards/rejected": -15.689062118530273,
|
| 613 |
+
"step": 185
|
| 614 |
+
},
|
| 615 |
+
{
|
| 616 |
+
"epoch": 0.16503800217155265,
|
| 617 |
+
"grad_norm": 2.8528225421905518,
|
| 618 |
+
"learning_rate": 2.5985642666409204e-05,
|
| 619 |
+
"logits/chosen": -0.6353515386581421,
|
| 620 |
+
"logits/rejected": -0.9964843988418579,
|
| 621 |
+
"logps/chosen": -105.625,
|
| 622 |
+
"logps/rejected": -196.8000030517578,
|
| 623 |
+
"loss": 0.0611,
|
| 624 |
+
"rewards/accuracies": 0.9781249761581421,
|
| 625 |
+
"rewards/chosen": -3.4736328125,
|
| 626 |
+
"rewards/margins": 11.747655868530273,
|
| 627 |
+
"rewards/rejected": -15.225000381469727,
|
| 628 |
+
"step": 190
|
| 629 |
+
},
|
| 630 |
+
{
|
| 631 |
+
"epoch": 0.16938110749185667,
|
| 632 |
+
"grad_norm": 2.388313055038452,
|
| 633 |
+
"learning_rate": 2.5985044048845307e-05,
|
| 634 |
+
"logits/chosen": -0.529296875,
|
| 635 |
+
"logits/rejected": -0.940234363079071,
|
| 636 |
+
"logps/chosen": -105.25,
|
| 637 |
+
"logps/rejected": -194.1999969482422,
|
| 638 |
+
"loss": 0.0618,
|
| 639 |
+
"rewards/accuracies": 0.9781249761581421,
|
| 640 |
+
"rewards/chosen": -3.1537108421325684,
|
| 641 |
+
"rewards/margins": 11.405468940734863,
|
| 642 |
+
"rewards/rejected": -14.560937881469727,
|
| 643 |
+
"step": 195
|
| 644 |
+
},
|
| 645 |
+
{
|
| 646 |
+
"epoch": 0.1737242128121607,
|
| 647 |
+
"grad_norm": 1.6818196773529053,
|
| 648 |
+
"learning_rate": 2.5984412729899686e-05,
|
| 649 |
+
"logits/chosen": -0.42333984375,
|
| 650 |
+
"logits/rejected": -0.798632800579071,
|
| 651 |
+
"logps/chosen": -102.2125015258789,
|
| 652 |
+
"logps/rejected": -185.64999389648438,
|
| 653 |
+
"loss": 0.0601,
|
| 654 |
+
"rewards/accuracies": 0.9765625,
|
| 655 |
+
"rewards/chosen": -2.742382764816284,
|
| 656 |
+
"rewards/margins": 10.553906440734863,
|
| 657 |
+
"rewards/rejected": -13.293749809265137,
|
| 658 |
+
"step": 200
|
| 659 |
+
},
|
| 660 |
+
{
|
| 661 |
+
"epoch": 0.1737242128121607,
|
| 662 |
+
"eval_logits/chosen": -0.41209879517555237,
|
| 663 |
+
"eval_logits/rejected": -0.7723516225814819,
|
| 664 |
+
"eval_logps/chosen": -102.44945526123047,
|
| 665 |
+
"eval_logps/rejected": -186.8014373779297,
|
| 666 |
+
"eval_loss": 0.06463618576526642,
|
| 667 |
+
"eval_rewards/accuracies": 0.9745036363601685,
|
| 668 |
+
"eval_rewards/chosen": -2.8919081687927246,
|
| 669 |
+
"eval_rewards/margins": 10.732288360595703,
|
| 670 |
+
"eval_rewards/rejected": -13.622066497802734,
|
| 671 |
+
"eval_runtime": 97.6846,
|
| 672 |
+
"eval_samples_per_second": 45.248,
|
| 673 |
+
"eval_steps_per_second": 2.836,
|
| 674 |
+
"step": 200
|
| 675 |
}
|
| 676 |
],
|
| 677 |
"logging_steps": 5,
|