FormlessAI commited on
Commit
1691705
·
verified ·
1 Parent(s): 079cee3

Training in progress, epoch 0, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:59ecd18eec1f27b2434d729c993e97a6c950934b3fc7d170d06203a4b22faf33
3
  size 431331112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aee538636744e0acbe2239a943ad435e5614264522618ad93fab75142dd2ec13
3
  size 431331112
last-checkpoint/global_step200/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ccc451fc82781f109bb7c16f02dbb15a7f815a88c9ae16090b0e4a6948306fd
3
+ size 325177765
last-checkpoint/global_step200/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7fa03c7035ce362f4a36232a00d556316b0470c05122c1ef9070f16cca2e710b
3
+ size 325177765
last-checkpoint/global_step200/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e65a63a4b0dc1db26d7f33c1e837810aa366c61c33a053879e3e05dd1a80b741
3
+ size 325177765
last-checkpoint/global_step200/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:266655c35b3c6c6d27d4702e03e32041a3c2dc2265eec4453ab2bdd297c3b732
3
+ size 325177765
last-checkpoint/global_step200/mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26588628f6cd900302e44e8309320238d062e557c38863d5c4517ee078bbd7e0
3
+ size 431463321
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step150
 
1
+ global_step200
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6dc21751f56a807ad2a7d09eea3bbe867a0c8e0f3d829004cfe097808a8a849d
3
  size 15429
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81d5f83aeb4b3f559bd28377336d47659b320e7f6ef2e5a723d284716278a151
3
  size 15429
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:69adbd9997461473344beb9c44d2e496e24fbc4d6fe69245ab0bd127882efd96
3
  size 15429
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2626437dcb133ffcf003ac89603f8cce07459b93a98d760cd9419e0d6a994067
3
  size 15429
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:baaf7026d9e588ca2ba5b4de8768a379982b7530f39e0b88fa44af9bef8e8bc9
3
  size 15429
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae777e24d50cb7159634e1245f0697ba0fc64d5b26d535f2c80e411371a90b1c
3
  size 15429
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1ec81cbdf599c90b49fb13998f6e46e2492b55345216231b6ce078f88cf04eae
3
  size 15429
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afc5a67564eebcfc961e8f1406a7418cc73497c2935a39af0232ef59f8153a6a
3
  size 15429
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6f335e4879fd62188324ceea55afd3458a938867b1a141c427526220c3441539
3
  size 1401
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61cf7a6562a1b537ed732fd397b8f4fbad25c227aed55701c0cfe78f176c42d9
3
  size 1401
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
  "best_global_step": null,
3
- "best_metric": 0.07377000898122787,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.09740259740259741,
6
  "eval_steps": 50,
7
- "global_step": 150,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -506,6 +506,172 @@
506
  "eval_samples_per_second": 44.338,
507
  "eval_steps_per_second": 0.353,
508
  "step": 150
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
509
  }
510
  ],
511
  "logging_steps": 5,
 
1
  {
2
  "best_global_step": null,
3
+ "best_metric": 0.05630422756075859,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.12987012987012986,
6
  "eval_steps": 50,
7
+ "global_step": 200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
506
  "eval_samples_per_second": 44.338,
507
  "eval_steps_per_second": 0.353,
508
  "step": 150
509
+ },
510
+ {
511
+ "epoch": 0.10064935064935066,
512
+ "grad_norm": 0.891044557094574,
513
+ "learning_rate": 0.00011565544706162286,
514
+ "logits/chosen": 6.451029300689697,
515
+ "logits/rejected": 7.018620491027832,
516
+ "logps/chosen": -318.9430236816406,
517
+ "logps/rejected": -354.2622985839844,
518
+ "loss": 0.077,
519
+ "rewards/accuracies": 0.96875,
520
+ "rewards/chosen": -2.790806293487549,
521
+ "rewards/margins": 10.650590896606445,
522
+ "rewards/rejected": -13.441396713256836,
523
+ "step": 155
524
+ },
525
+ {
526
+ "epoch": 0.1038961038961039,
527
+ "grad_norm": 1.011932134628296,
528
+ "learning_rate": 0.00011565380196097788,
529
+ "logits/chosen": 6.38694953918457,
530
+ "logits/rejected": 6.985430717468262,
531
+ "logps/chosen": -305.1867370605469,
532
+ "logps/rejected": -316.77239990234375,
533
+ "loss": 0.0743,
534
+ "rewards/accuracies": 0.96875,
535
+ "rewards/chosen": -1.8528194427490234,
536
+ "rewards/margins": 8.657999038696289,
537
+ "rewards/rejected": -10.510818481445312,
538
+ "step": 160
539
+ },
540
+ {
541
+ "epoch": 0.10714285714285714,
542
+ "grad_norm": 1.1229149103164673,
543
+ "learning_rate": 0.00011565201129393704,
544
+ "logits/chosen": 6.276331424713135,
545
+ "logits/rejected": 6.919455051422119,
546
+ "logps/chosen": -323.6394348144531,
547
+ "logps/rejected": -360.06695556640625,
548
+ "loss": 0.0711,
549
+ "rewards/accuracies": 0.9703124761581421,
550
+ "rewards/chosen": -3.3554577827453613,
551
+ "rewards/margins": 9.554231643676758,
552
+ "rewards/rejected": -12.909688949584961,
553
+ "step": 165
554
+ },
555
+ {
556
+ "epoch": 0.11038961038961038,
557
+ "grad_norm": 0.8342244029045105,
558
+ "learning_rate": 0.00011565007506500828,
559
+ "logits/chosen": 5.989048957824707,
560
+ "logits/rejected": 6.676814079284668,
561
+ "logps/chosen": -304.5875549316406,
562
+ "logps/rejected": -326.0283203125,
563
+ "loss": 0.0981,
564
+ "rewards/accuracies": 0.9703124761581421,
565
+ "rewards/chosen": -1.7597744464874268,
566
+ "rewards/margins": 8.476037979125977,
567
+ "rewards/rejected": -10.235812187194824,
568
+ "step": 170
569
+ },
570
+ {
571
+ "epoch": 0.11363636363636363,
572
+ "grad_norm": 0.7202894687652588,
573
+ "learning_rate": 0.0001156479932790661,
574
+ "logits/chosen": 6.15761661529541,
575
+ "logits/rejected": 6.778907775878906,
576
+ "logps/chosen": -302.4050598144531,
577
+ "logps/rejected": -324.09765625,
578
+ "loss": 0.0923,
579
+ "rewards/accuracies": 0.9703124761581421,
580
+ "rewards/chosen": -0.7549916505813599,
581
+ "rewards/margins": 8.769140243530273,
582
+ "rewards/rejected": -9.524131774902344,
583
+ "step": 175
584
+ },
585
+ {
586
+ "epoch": 0.11688311688311688,
587
+ "grad_norm": 0.753760576248169,
588
+ "learning_rate": 0.00011564576594135137,
589
+ "logits/chosen": 6.395578384399414,
590
+ "logits/rejected": 7.083353519439697,
591
+ "logps/chosen": -313.22186279296875,
592
+ "logps/rejected": -348.41339111328125,
593
+ "loss": 0.0507,
594
+ "rewards/accuracies": 0.9828125238418579,
595
+ "rewards/chosen": -3.535522937774658,
596
+ "rewards/margins": 8.79172420501709,
597
+ "rewards/rejected": -12.327247619628906,
598
+ "step": 180
599
+ },
600
+ {
601
+ "epoch": 0.12012987012987013,
602
+ "grad_norm": 0.6927999258041382,
603
+ "learning_rate": 0.00011564339305747142,
604
+ "logits/chosen": 6.240847587585449,
605
+ "logits/rejected": 6.926623344421387,
606
+ "logps/chosen": -318.8568420410156,
607
+ "logps/rejected": -346.41680908203125,
608
+ "loss": 0.053,
609
+ "rewards/accuracies": 0.981249988079071,
610
+ "rewards/chosen": -3.0302348136901855,
611
+ "rewards/margins": 10.297189712524414,
612
+ "rewards/rejected": -13.327425003051758,
613
+ "step": 185
614
+ },
615
+ {
616
+ "epoch": 0.12337662337662338,
617
+ "grad_norm": 0.2692127227783203,
618
+ "learning_rate": 0.00011564087463339999,
619
+ "logits/chosen": 5.879881858825684,
620
+ "logits/rejected": 6.644034385681152,
621
+ "logps/chosen": -300.416259765625,
622
+ "logps/rejected": -339.57037353515625,
623
+ "loss": 0.0423,
624
+ "rewards/accuracies": 0.981249988079071,
625
+ "rewards/chosen": -1.8148984909057617,
626
+ "rewards/margins": 9.979120254516602,
627
+ "rewards/rejected": -11.794018745422363,
628
+ "step": 190
629
+ },
630
+ {
631
+ "epoch": 0.1266233766233766,
632
+ "grad_norm": 0.7986512184143066,
633
+ "learning_rate": 0.0001156382106754772,
634
+ "logits/chosen": 5.803470611572266,
635
+ "logits/rejected": 6.645857334136963,
636
+ "logps/chosen": -310.81170654296875,
637
+ "logps/rejected": -348.056396484375,
638
+ "loss": 0.0403,
639
+ "rewards/accuracies": 0.989062488079071,
640
+ "rewards/chosen": -2.6157710552215576,
641
+ "rewards/margins": 10.561070442199707,
642
+ "rewards/rejected": -13.176841735839844,
643
+ "step": 195
644
+ },
645
+ {
646
+ "epoch": 0.12987012987012986,
647
+ "grad_norm": 0.7699182629585266,
648
+ "learning_rate": 0.00011563540119040956,
649
+ "logits/chosen": 6.0391011238098145,
650
+ "logits/rejected": 6.851220607757568,
651
+ "logps/chosen": -306.738525390625,
652
+ "logps/rejected": -371.85369873046875,
653
+ "loss": 0.0557,
654
+ "rewards/accuracies": 0.9828125238418579,
655
+ "rewards/chosen": -1.9803781509399414,
656
+ "rewards/margins": 12.751678466796875,
657
+ "rewards/rejected": -14.732057571411133,
658
+ "step": 200
659
+ },
660
+ {
661
+ "epoch": 0.12987012987012986,
662
+ "eval_logits/chosen": 6.243391513824463,
663
+ "eval_logits/rejected": 6.946824073791504,
664
+ "eval_logps/chosen": -326.7683410644531,
665
+ "eval_logps/rejected": -375.8028259277344,
666
+ "eval_loss": 0.05630422756075859,
667
+ "eval_rewards/accuracies": 0.9780886769294739,
668
+ "eval_rewards/chosen": -4.148531913757324,
669
+ "eval_rewards/margins": 11.36646842956543,
670
+ "eval_rewards/rejected": -15.515000343322754,
671
+ "eval_runtime": 133.2954,
672
+ "eval_samples_per_second": 44.338,
673
+ "eval_steps_per_second": 0.353,
674
+ "step": 200
675
  }
676
  ],
677
  "logging_steps": 5,