FormlessAI commited on
Commit
00162b4
·
verified ·
1 Parent(s): e03ce2f

Training in progress, epoch 0, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:da013167ea1fa3cf2c2603b4a7d46a3cd74f4b5970643aa9d1d7f0613ecbef66
3
  size 1172343536
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c7d696805c33619b84f2fedbcdd5a68607d7306abf5dbf4533f634e4982f5c8
3
  size 1172343536
last-checkpoint/global_step200/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf16ed368a600d277fefa127eb7bd51d4425d02c1295916f8e6dabd62576a579
3
+ size 883824229
last-checkpoint/global_step200/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7b683aadce016b516f68c28a00f6dec6a4b48f3461e2b15e7485cdc143b6ad6
3
+ size 883824293
last-checkpoint/global_step200/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4bc266731f510a3524e59f5c44e8e4f88929d533de5658ef8f53f3dc06c2228e
3
+ size 883824293
last-checkpoint/global_step200/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9611a34df5478b6c4f3853f043ba4c2f69d27ef6010e32a7a94a8fcdd0d346f
3
+ size 883824293
last-checkpoint/global_step200/mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8529c0392fe7f20dafe3c781e6ef68c62b7fbc32a4c2150c61a180b83c64c208
3
+ size 1172522073
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step150
 
1
+ global_step200
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6dc21751f56a807ad2a7d09eea3bbe867a0c8e0f3d829004cfe097808a8a849d
3
  size 15429
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81d5f83aeb4b3f559bd28377336d47659b320e7f6ef2e5a723d284716278a151
3
  size 15429
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:69adbd9997461473344beb9c44d2e496e24fbc4d6fe69245ab0bd127882efd96
3
  size 15429
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2626437dcb133ffcf003ac89603f8cce07459b93a98d760cd9419e0d6a994067
3
  size 15429
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:baaf7026d9e588ca2ba5b4de8768a379982b7530f39e0b88fa44af9bef8e8bc9
3
  size 15429
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae777e24d50cb7159634e1245f0697ba0fc64d5b26d535f2c80e411371a90b1c
3
  size 15429
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1ec81cbdf599c90b49fb13998f6e46e2492b55345216231b6ce078f88cf04eae
3
  size 15429
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afc5a67564eebcfc961e8f1406a7418cc73497c2935a39af0232ef59f8153a6a
3
  size 15429
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1364855766bf8839ae8db6186dd25d586d587683d30170f8eb04a09add2c6cb7
3
  size 1401
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:331d42834d40f6ab9fe0c79a5f67902cd952ec456fbe0c511bb4b4fc0a7cf69b
3
  size 1401
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
  "best_global_step": null,
3
- "best_metric": 0.07959119230508804,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.13029315960912052,
6
  "eval_steps": 50,
7
- "global_step": 150,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -506,6 +506,172 @@
506
  "eval_samples_per_second": 45.285,
507
  "eval_steps_per_second": 2.838,
508
  "step": 150
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
509
  }
510
  ],
511
  "logging_steps": 5,
 
1
  {
2
  "best_global_step": null,
3
+ "best_metric": 0.06463618576526642,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.1737242128121607,
6
  "eval_steps": 50,
7
+ "global_step": 200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
506
  "eval_samples_per_second": 45.285,
507
  "eval_steps_per_second": 2.838,
508
  "step": 150
509
+ },
510
+ {
511
+ "epoch": 0.13463626492942454,
512
+ "grad_norm": 0.9481019973754883,
513
+ "learning_rate": 2.5988917234452568e-05,
514
+ "logits/chosen": -0.7090820074081421,
515
+ "logits/rejected": -1.00244140625,
516
+ "logps/chosen": -95.23750305175781,
517
+ "logps/rejected": -174.4250030517578,
518
+ "loss": 0.0439,
519
+ "rewards/accuracies": 0.9859374761581421,
520
+ "rewards/chosen": -1.6262695789337158,
521
+ "rewards/margins": 9.666406631469727,
522
+ "rewards/rejected": -11.287500381469727,
523
+ "step": 155
524
+ },
525
+ {
526
+ "epoch": 0.13897937024972856,
527
+ "grad_norm": 3.119917392730713,
528
+ "learning_rate": 2.598854756414658e-05,
529
+ "logits/chosen": -0.706250011920929,
530
+ "logits/rejected": -1.006445288658142,
531
+ "logps/chosen": -100.73750305175781,
532
+ "logps/rejected": -195.52499389648438,
533
+ "loss": 0.0753,
534
+ "rewards/accuracies": 0.973437488079071,
535
+ "rewards/chosen": -2.6958985328674316,
536
+ "rewards/margins": 12.09375,
537
+ "rewards/rejected": -14.793749809265137,
538
+ "step": 160
539
+ },
540
+ {
541
+ "epoch": 0.14332247557003258,
542
+ "grad_norm": 2.0484530925750732,
543
+ "learning_rate": 2.5988145183638775e-05,
544
+ "logits/chosen": -0.687695324420929,
545
+ "logits/rejected": -0.9659179449081421,
546
+ "logps/chosen": -99.67500305175781,
547
+ "logps/rejected": -186.60000610351562,
548
+ "loss": 0.08,
549
+ "rewards/accuracies": 0.973437488079071,
550
+ "rewards/chosen": -2.467578172683716,
551
+ "rewards/margins": 11.5,
552
+ "rewards/rejected": -13.967187881469727,
553
+ "step": 165
554
+ },
555
+ {
556
+ "epoch": 0.1476655808903366,
557
+ "grad_norm": 1.163669228553772,
558
+ "learning_rate": 2.598771009394214e-05,
559
+ "logits/chosen": -0.692333996295929,
560
+ "logits/rejected": -1.009374976158142,
561
+ "logps/chosen": -92.625,
562
+ "logps/rejected": -175.4875030517578,
563
+ "loss": 0.0796,
564
+ "rewards/accuracies": 0.9765625,
565
+ "rewards/chosen": -1.3732726573944092,
566
+ "rewards/margins": 10.21484375,
567
+ "rewards/rejected": -11.586718559265137,
568
+ "step": 170
569
+ },
570
+ {
571
+ "epoch": 0.15200868621064062,
572
+ "grad_norm": 1.496293067932129,
573
+ "learning_rate": 2.5987242296152015e-05,
574
+ "logits/chosen": -0.6812499761581421,
575
+ "logits/rejected": -1.025781273841858,
576
+ "logps/chosen": -89.7874984741211,
577
+ "logps/rejected": -173.60000610351562,
578
+ "loss": 0.0515,
579
+ "rewards/accuracies": 0.979687511920929,
580
+ "rewards/chosen": -0.5631958246231079,
581
+ "rewards/margins": 10.517969131469727,
582
+ "rewards/rejected": -11.086718559265137,
583
+ "step": 175
584
+ },
585
+ {
586
+ "epoch": 0.1563517915309446,
587
+ "grad_norm": 0.6427134871482849,
588
+ "learning_rate": 2.598674179144608e-05,
589
+ "logits/chosen": -0.731152355670929,
590
+ "logits/rejected": -1.055761694908142,
591
+ "logps/chosen": -101.48750305175781,
592
+ "logps/rejected": -194.52499389648438,
593
+ "loss": 0.0468,
594
+ "rewards/accuracies": 0.984375,
595
+ "rewards/chosen": -2.1346678733825684,
596
+ "rewards/margins": 11.561718940734863,
597
+ "rewards/rejected": -13.701562881469727,
598
+ "step": 180
599
+ },
600
+ {
601
+ "epoch": 0.16069489685124863,
602
+ "grad_norm": 3.4019172191619873,
603
+ "learning_rate": 2.598620858108436e-05,
604
+ "logits/chosen": -0.7110351324081421,
605
+ "logits/rejected": -1.060156226158142,
606
+ "logps/chosen": -105.51249694824219,
607
+ "logps/rejected": -198.5,
608
+ "loss": 0.072,
609
+ "rewards/accuracies": 0.9750000238418579,
610
+ "rewards/chosen": -3.612109422683716,
611
+ "rewards/margins": 12.0703125,
612
+ "rewards/rejected": -15.689062118530273,
613
+ "step": 185
614
+ },
615
+ {
616
+ "epoch": 0.16503800217155265,
617
+ "grad_norm": 2.8528225421905518,
618
+ "learning_rate": 2.5985642666409204e-05,
619
+ "logits/chosen": -0.6353515386581421,
620
+ "logits/rejected": -0.9964843988418579,
621
+ "logps/chosen": -105.625,
622
+ "logps/rejected": -196.8000030517578,
623
+ "loss": 0.0611,
624
+ "rewards/accuracies": 0.9781249761581421,
625
+ "rewards/chosen": -3.4736328125,
626
+ "rewards/margins": 11.747655868530273,
627
+ "rewards/rejected": -15.225000381469727,
628
+ "step": 190
629
+ },
630
+ {
631
+ "epoch": 0.16938110749185667,
632
+ "grad_norm": 2.388313055038452,
633
+ "learning_rate": 2.5985044048845307e-05,
634
+ "logits/chosen": -0.529296875,
635
+ "logits/rejected": -0.940234363079071,
636
+ "logps/chosen": -105.25,
637
+ "logps/rejected": -194.1999969482422,
638
+ "loss": 0.0618,
639
+ "rewards/accuracies": 0.9781249761581421,
640
+ "rewards/chosen": -3.1537108421325684,
641
+ "rewards/margins": 11.405468940734863,
642
+ "rewards/rejected": -14.560937881469727,
643
+ "step": 195
644
+ },
645
+ {
646
+ "epoch": 0.1737242128121607,
647
+ "grad_norm": 1.6818196773529053,
648
+ "learning_rate": 2.5984412729899686e-05,
649
+ "logits/chosen": -0.42333984375,
650
+ "logits/rejected": -0.798632800579071,
651
+ "logps/chosen": -102.2125015258789,
652
+ "logps/rejected": -185.64999389648438,
653
+ "loss": 0.0601,
654
+ "rewards/accuracies": 0.9765625,
655
+ "rewards/chosen": -2.742382764816284,
656
+ "rewards/margins": 10.553906440734863,
657
+ "rewards/rejected": -13.293749809265137,
658
+ "step": 200
659
+ },
660
+ {
661
+ "epoch": 0.1737242128121607,
662
+ "eval_logits/chosen": -0.41209879517555237,
663
+ "eval_logits/rejected": -0.7723516225814819,
664
+ "eval_logps/chosen": -102.44945526123047,
665
+ "eval_logps/rejected": -186.8014373779297,
666
+ "eval_loss": 0.06463618576526642,
667
+ "eval_rewards/accuracies": 0.9745036363601685,
668
+ "eval_rewards/chosen": -2.8919081687927246,
669
+ "eval_rewards/margins": 10.732288360595703,
670
+ "eval_rewards/rejected": -13.622066497802734,
671
+ "eval_runtime": 97.6846,
672
+ "eval_samples_per_second": 45.248,
673
+ "eval_steps_per_second": 2.836,
674
+ "step": 200
675
  }
676
  ],
677
  "logging_steps": 5,