FormlessAI committed on
Commit
a2cf0a4
·
verified ·
1 Parent(s): 07a4b97

Training in progress, epoch 0, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5c7d696805c33619b84f2fedbcdd5a68607d7306abf5dbf4533f634e4982f5c8
3
  size 1172343536
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a9c3e8764ac0e745f6f2f52febb7d10692a33c3745620483b24136f9b8a908e
3
  size 1172343536
last-checkpoint/global_step250/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8179a1613896aa79455e50e4aa8d77bd60a506db72324d864e9cdca54cc60626
3
+ size 883824229
last-checkpoint/global_step250/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9fc5a87dbe8a7cce6e57a9b3ace28fd4f4f5928893f68f6debd75d62a4729109
3
+ size 883824293
last-checkpoint/global_step250/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f48a186df598e4b9071facf76f95274858f30d911693188fcb82ef9ed3e9ecf
3
+ size 883824293
last-checkpoint/global_step250/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0cb4a60e6514af9a7d74cbcd436350c03f46da29e427d75838e9697d64139ec
3
+ size 883824293
last-checkpoint/global_step250/mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4dc344d017fe7374aa6e0dcc3680a9c16ccf9c24de138199ee5b5bb69d19fdd9
3
+ size 1172522073
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step200
 
1
+ global_step250
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:81d5f83aeb4b3f559bd28377336d47659b320e7f6ef2e5a723d284716278a151
3
  size 15429
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9892a41432d4e48929c5376b8225d5373bb9afe9f14665fbcb3934dc45cb330a
3
  size 15429
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2626437dcb133ffcf003ac89603f8cce07459b93a98d760cd9419e0d6a994067
3
  size 15429
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6f3949e2b25ad05905da16bc2d58aeadc9a9f1db0b0e97a04ceb63467acff1d
3
  size 15429
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae777e24d50cb7159634e1245f0697ba0fc64d5b26d535f2c80e411371a90b1c
3
  size 15429
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c3812c5e7f13c9d32f97d83cd625428061b1c9486e869caffd453d83ac07ceb
3
  size 15429
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:afc5a67564eebcfc961e8f1406a7418cc73497c2935a39af0232ef59f8153a6a
3
  size 15429
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6eda756b33768639c1e1932ae00c5d43269de5705c09162bc09acdf71d3533c0
3
  size 15429
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:331d42834d40f6ab9fe0c79a5f67902cd952ec456fbe0c511bb4b4fc0a7cf69b
3
  size 1401
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:610f32c595d4257f7e544a8d61dbdf0e85b19520c0d69daf98d6e00fbe896bb3
3
  size 1401
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
  "best_global_step": null,
3
- "best_metric": 0.06463618576526642,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.1737242128121607,
6
  "eval_steps": 50,
7
- "global_step": 200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -672,6 +672,172 @@
672
  "eval_samples_per_second": 45.248,
673
  "eval_steps_per_second": 2.836,
674
  "step": 200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
675
  }
676
  ],
677
  "logging_steps": 5,
 
1
  {
2
  "best_global_step": null,
3
+ "best_metric": 0.05831117928028107,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.21715526601520088,
6
  "eval_steps": 50,
7
+ "global_step": 250,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
672
  "eval_samples_per_second": 45.248,
673
  "eval_steps_per_second": 2.836,
674
  "step": 200
675
+ },
676
+ {
677
+ "epoch": 0.1780673181324647,
678
+ "grad_norm": 2.3196284770965576,
679
+ "learning_rate": 2.5983748711161684e-05,
680
+ "logits/chosen": -0.4415039122104645,
681
+ "logits/rejected": -0.7743164300918579,
682
+ "logps/chosen": -104.36250305175781,
683
+ "logps/rejected": -187.5,
684
+ "loss": 0.0463,
685
+ "rewards/accuracies": 0.981249988079071,
686
+ "rewards/chosen": -3.2431640625,
687
+ "rewards/margins": 11.009374618530273,
688
+ "rewards/rejected": -14.260937690734863,
689
+ "step": 205
690
+ },
691
+ {
692
+ "epoch": 0.18241042345276873,
693
+ "grad_norm": 1.842193365097046,
694
+ "learning_rate": 2.598305199430297e-05,
695
+ "logits/chosen": -0.49321287870407104,
696
+ "logits/rejected": -0.8467773199081421,
697
+ "logps/chosen": -104.80000305175781,
698
+ "logps/rejected": -197.0,
699
+ "loss": 0.0531,
700
+ "rewards/accuracies": 0.981249988079071,
701
+ "rewards/chosen": -3.1109375953674316,
702
+ "rewards/margins": 12.276562690734863,
703
+ "rewards/rejected": -15.381250381469727,
704
+ "step": 210
705
+ },
706
+ {
707
+ "epoch": 0.18675352877307275,
708
+ "grad_norm": 1.857373595237732,
709
+ "learning_rate": 2.5982322581077525e-05,
710
+ "logits/chosen": -0.534863293170929,
711
+ "logits/rejected": -0.8707031011581421,
712
+ "logps/chosen": -104.2249984741211,
713
+ "logps/rejected": -199.3249969482422,
714
+ "loss": 0.0556,
715
+ "rewards/accuracies": 0.971875011920929,
716
+ "rewards/chosen": -3.1683592796325684,
717
+ "rewards/margins": 12.2265625,
718
+ "rewards/rejected": -15.395312309265137,
719
+ "step": 215
720
+ },
721
+ {
722
+ "epoch": 0.19109663409337677,
723
+ "grad_norm": 1.5108240842819214,
724
+ "learning_rate": 2.598156047332165e-05,
725
+ "logits/chosen": -0.49296873807907104,
726
+ "logits/rejected": -0.8592773675918579,
727
+ "logps/chosen": -99.38749694824219,
728
+ "logps/rejected": -190.1750030517578,
729
+ "loss": 0.0509,
730
+ "rewards/accuracies": 0.979687511920929,
731
+ "rewards/chosen": -2.543261766433716,
732
+ "rewards/margins": 11.925000190734863,
733
+ "rewards/rejected": -14.473437309265137,
734
+ "step": 220
735
+ },
736
+ {
737
+ "epoch": 0.19543973941368079,
738
+ "grad_norm": 2.208911418914795,
739
+ "learning_rate": 2.5980765672953946e-05,
740
+ "logits/chosen": -0.48857420682907104,
741
+ "logits/rejected": -0.869824230670929,
742
+ "logps/chosen": -99.2249984741211,
743
+ "logps/rejected": -189.39999389648438,
744
+ "loss": 0.0698,
745
+ "rewards/accuracies": 0.9750000238418579,
746
+ "rewards/chosen": -2.405956983566284,
747
+ "rewards/margins": 12.265625,
748
+ "rewards/rejected": -14.670312881469727,
749
+ "step": 225
750
+ },
751
+ {
752
+ "epoch": 0.1997828447339848,
753
+ "grad_norm": 1.6780784130096436,
754
+ "learning_rate": 2.5979938181975324e-05,
755
+ "logits/chosen": -0.537060558795929,
756
+ "logits/rejected": -0.892773449420929,
757
+ "logps/chosen": -100.7125015258789,
758
+ "logps/rejected": -199.625,
759
+ "loss": 0.0294,
760
+ "rewards/accuracies": 0.9828125238418579,
761
+ "rewards/chosen": -2.6998047828674316,
762
+ "rewards/margins": 13.115625381469727,
763
+ "rewards/rejected": -15.807812690734863,
764
+ "step": 230
765
+ },
766
+ {
767
+ "epoch": 0.20412595005428882,
768
+ "grad_norm": 1.3097057342529297,
769
+ "learning_rate": 2.5979078002468992e-05,
770
+ "logits/chosen": -0.5240722894668579,
771
+ "logits/rejected": -0.8931640386581421,
772
+ "logps/chosen": -102.375,
773
+ "logps/rejected": -197.4250030517578,
774
+ "loss": 0.0603,
775
+ "rewards/accuracies": 0.979687511920929,
776
+ "rewards/chosen": -2.710986375808716,
777
+ "rewards/margins": 12.909375190734863,
778
+ "rewards/rejected": -15.634374618530273,
779
+ "step": 235
780
+ },
781
+ {
782
+ "epoch": 0.20846905537459284,
783
+ "grad_norm": 2.499241828918457,
784
+ "learning_rate": 2.597818513660045e-05,
785
+ "logits/chosen": -0.4613281190395355,
786
+ "logits/rejected": -0.834277331829071,
787
+ "logps/chosen": -98.8499984741211,
788
+ "logps/rejected": -185.8249969482422,
789
+ "loss": 0.0777,
790
+ "rewards/accuracies": 0.9750000238418579,
791
+ "rewards/chosen": -2.1981444358825684,
792
+ "rewards/margins": 11.0859375,
793
+ "rewards/rejected": -13.290624618530273,
794
+ "step": 240
795
+ },
796
+ {
797
+ "epoch": 0.21281216069489686,
798
+ "grad_norm": 1.4439401626586914,
799
+ "learning_rate": 2.5977259586617493e-05,
800
+ "logits/chosen": -0.35028076171875,
801
+ "logits/rejected": -0.7183593511581421,
802
+ "logps/chosen": -95.6500015258789,
803
+ "logps/rejected": -176.0,
804
+ "loss": 0.0725,
805
+ "rewards/accuracies": 0.971875011920929,
806
+ "rewards/chosen": -2.0106444358825684,
807
+ "rewards/margins": 9.563281059265137,
808
+ "rewards/rejected": -11.579687118530273,
809
+ "step": 245
810
+ },
811
+ {
812
+ "epoch": 0.21715526601520088,
813
+ "grad_norm": 0.8243131041526794,
814
+ "learning_rate": 2.5976301354850176e-05,
815
+ "logits/chosen": -0.345947265625,
816
+ "logits/rejected": -0.679638683795929,
817
+ "logps/chosen": -98.36250305175781,
818
+ "logps/rejected": -182.125,
819
+ "loss": 0.0622,
820
+ "rewards/accuracies": 0.981249988079071,
821
+ "rewards/chosen": -2.5238280296325684,
822
+ "rewards/margins": 10.37109375,
823
+ "rewards/rejected": -12.893750190734863,
824
+ "step": 250
825
+ },
826
+ {
827
+ "epoch": 0.21715526601520088,
828
+ "eval_logits/chosen": -0.42717909812927246,
829
+ "eval_logits/rejected": -0.7368005514144897,
830
+ "eval_logps/chosen": -103.40794372558594,
831
+ "eval_logps/rejected": -193.13717651367188,
832
+ "eval_loss": 0.05831117928028107,
833
+ "eval_rewards/accuracies": 0.9769855737686157,
834
+ "eval_rewards/chosen": -3.0707638263702393,
835
+ "eval_rewards/margins": 11.707694053649902,
836
+ "eval_rewards/rejected": -14.779783248901367,
837
+ "eval_runtime": 97.7681,
838
+ "eval_samples_per_second": 45.209,
839
+ "eval_steps_per_second": 2.833,
840
+ "step": 250
841
  }
842
  ],
843
  "logging_steps": 5,