FormlessAI commited on
Commit
0db980f
·
verified ·
1 Parent(s): 1835e2b

Training in progress, epoch 0, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:af02c1ae6226dcd7868f657f4c2e9b234b3ae7e678ff50611b3ba00a96877360
3
  size 1172343536
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72c4bc97664d0aa7a098b0c228a22ae32034b0dbf4ab4da13857ed465b5a65d4
3
  size 1172343536
last-checkpoint/global_step350/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37fc7a2e36c47456cdb57ad2157f0526df8cde031240d041adb3010b39a804f1
3
+ size 883824229
last-checkpoint/global_step350/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86c9ff85c1b1c7169e42d8df4c4e10f2a3f7d5418ec829e94c3119f66f6815f7
3
+ size 883824293
last-checkpoint/global_step350/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b11063637dd7cf3b648c62228fa956b16f97369d414fb88bd40a11359e11e8b
3
+ size 883824293
last-checkpoint/global_step350/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8b8b6efa843601f79dcaf36a924657370373e44e9326714e06e422f7d193d97
3
+ size 883824293
last-checkpoint/global_step350/mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:faf64cec01f85857d3e5cd780821bab6f037b6129c2a7b4035770b88675fe4f2
3
+ size 1172522073
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step300
 
1
+ global_step350
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6684d046afb526c2e665e56c5dea82ebbd5f4bafebc51ba7bbd0abe0af887457
3
  size 15429
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c372628cf0f11a7814089f880131f006d1271095beb5e7152f3c14aa8985e326
3
  size 15429
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:80dc672c36be6d6e761464a269748f88cc1a2b275525f62e4c41e0a2b8e14c66
3
  size 15429
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8627b9687b17d3eb42763f7499513d01033a545f5fdc3224442fa88df7b07c1
3
  size 15429
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1b2bed19a0bf05b4a5a72a170ec35982f5322d3d8cddeea244b9caffd018c4f9
3
  size 15429
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2861b0db544103a2392f7009e235760e91d4f2dcf2605bc9fda62bad0578110
3
  size 15429
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8118881a2505438583b140279acb7bbe63652187d96439b98542be3623d2f6d3
3
  size 15429
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5661cf15d465afc34868de007aed00c0a576292f6e776fe25a04f040a9501399
3
  size 15429
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b512ac5de3057194dcd5b6fda8c85adef1b4c088a663414c6401d151e8a4a926
3
  size 1401
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a14f05b7034e739d561e3e8c467aa7c3cfde2b5a09c502a2513b18be6676f89e
3
  size 1401
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
  "best_global_step": null,
3
- "best_metric": 0.05415169149637222,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.26058631921824105,
6
  "eval_steps": 50,
7
- "global_step": 300,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -1004,6 +1004,172 @@
1004
  "eval_samples_per_second": 45.212,
1005
  "eval_steps_per_second": 2.833,
1006
  "step": 300
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1007
  }
1008
  ],
1009
  "logging_steps": 5,
 
1
  {
2
  "best_global_step": null,
3
+ "best_metric": 0.04868408665060997,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.30401737242128124,
6
  "eval_steps": 50,
7
+ "global_step": 350,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
1004
  "eval_samples_per_second": 45.212,
1005
  "eval_steps_per_second": 2.833,
1006
  "step": 300
1007
+ },
1008
+ {
1009
+ "epoch": 0.26492942453854507,
1010
+ "grad_norm": 1.8991755247116089,
1011
+ "learning_rate": 2.5963604556388822e-05,
1012
+ "logits/chosen": -0.21623535454273224,
1013
+ "logits/rejected": -0.652539074420929,
1014
+ "logps/chosen": -91.5,
1015
+ "logps/rejected": -175.3000030517578,
1016
+ "loss": 0.0584,
1017
+ "rewards/accuracies": 0.9765625,
1018
+ "rewards/chosen": -0.941723644733429,
1019
+ "rewards/margins": 11.140625,
1020
+ "rewards/rejected": -12.076562881469727,
1021
+ "step": 305
1022
+ },
1023
+ {
1024
+ "epoch": 0.2692725298588491,
1025
+ "grad_norm": 0.6933239698410034,
1026
+ "learning_rate": 2.5962254354896943e-05,
1027
+ "logits/chosen": -0.21835938096046448,
1028
+ "logits/rejected": -0.629345715045929,
1029
+ "logps/chosen": -96.7750015258789,
1030
+ "logps/rejected": -179.75,
1031
+ "loss": 0.0424,
1032
+ "rewards/accuracies": 0.989062488079071,
1033
+ "rewards/chosen": -1.7537109851837158,
1034
+ "rewards/margins": 10.282031059265137,
1035
+ "rewards/rejected": -12.037500381469727,
1036
+ "step": 310
1037
+ },
1038
+ {
1039
+ "epoch": 0.2736156351791531,
1040
+ "grad_norm": 1.1337815523147583,
1041
+ "learning_rate": 2.5960871509396373e-05,
1042
+ "logits/chosen": -0.22700805962085724,
1043
+ "logits/rejected": -0.621630847454071,
1044
+ "logps/chosen": -98.25,
1045
+ "logps/rejected": -182.9250030517578,
1046
+ "loss": 0.0599,
1047
+ "rewards/accuracies": 0.981249988079071,
1048
+ "rewards/chosen": -2.5380859375,
1049
+ "rewards/margins": 10.541406631469727,
1050
+ "rewards/rejected": -13.079687118530273,
1051
+ "step": 315
1052
+ },
1053
+ {
1054
+ "epoch": 0.2779587404994571,
1055
+ "grad_norm": 1.0313189029693604,
1056
+ "learning_rate": 2.595945602336842e-05,
1057
+ "logits/chosen": -0.2883544862270355,
1058
+ "logits/rejected": -0.70068359375,
1059
+ "logps/chosen": -100.48750305175781,
1060
+ "logps/rejected": -190.14999389648438,
1061
+ "loss": 0.0483,
1062
+ "rewards/accuracies": 0.979687511920929,
1063
+ "rewards/chosen": -2.769335985183716,
1064
+ "rewards/margins": 12.239062309265137,
1065
+ "rewards/rejected": -15.001562118530273,
1066
+ "step": 320
1067
+ },
1068
+ {
1069
+ "epoch": 0.28230184581976114,
1070
+ "grad_norm": 2.236783027648926,
1071
+ "learning_rate": 2.5958007900376565e-05,
1072
+ "logits/chosen": -0.3595947325229645,
1073
+ "logits/rejected": -0.758496105670929,
1074
+ "logps/chosen": -97.19999694824219,
1075
+ "logps/rejected": -192.10000610351562,
1076
+ "loss": 0.0814,
1077
+ "rewards/accuracies": 0.971875011920929,
1078
+ "rewards/chosen": -2.0233397483825684,
1079
+ "rewards/margins": 12.854687690734863,
1080
+ "rewards/rejected": -14.878125190734863,
1081
+ "step": 325
1082
+ },
1083
+ {
1084
+ "epoch": 0.28664495114006516,
1085
+ "grad_norm": 0.2666296660900116,
1086
+ "learning_rate": 2.5956527144066455e-05,
1087
+ "logits/chosen": -0.3157714903354645,
1088
+ "logits/rejected": -0.805468738079071,
1089
+ "logps/chosen": -91.5625,
1090
+ "logps/rejected": -182.4499969482422,
1091
+ "loss": 0.0333,
1092
+ "rewards/accuracies": 0.9859374761581421,
1093
+ "rewards/chosen": -0.836718738079071,
1094
+ "rewards/margins": 11.439844131469727,
1095
+ "rewards/rejected": -12.278124809265137,
1096
+ "step": 330
1097
+ },
1098
+ {
1099
+ "epoch": 0.2909880564603692,
1100
+ "grad_norm": 1.1598833799362183,
1101
+ "learning_rate": 2.5955013758165896e-05,
1102
+ "logits/chosen": -0.3671875,
1103
+ "logits/rejected": -0.854785144329071,
1104
+ "logps/chosen": -92.11250305175781,
1105
+ "logps/rejected": -181.0500030517578,
1106
+ "loss": 0.0383,
1107
+ "rewards/accuracies": 0.987500011920929,
1108
+ "rewards/chosen": -1.1418945789337158,
1109
+ "rewards/margins": 11.553125381469727,
1110
+ "rewards/rejected": -12.699999809265137,
1111
+ "step": 335
1112
+ },
1113
+ {
1114
+ "epoch": 0.2953311617806732,
1115
+ "grad_norm": 2.1906487941741943,
1116
+ "learning_rate": 2.595346774648484e-05,
1117
+ "logits/chosen": -0.49267578125,
1118
+ "logits/rejected": -0.973925769329071,
1119
+ "logps/chosen": -97.875,
1120
+ "logps/rejected": -200.5500030517578,
1121
+ "loss": 0.0494,
1122
+ "rewards/accuracies": 0.989062488079071,
1123
+ "rewards/chosen": -2.0439453125,
1124
+ "rewards/margins": 13.603124618530273,
1125
+ "rewards/rejected": -15.6484375,
1126
+ "step": 340
1127
+ },
1128
+ {
1129
+ "epoch": 0.2996742671009772,
1130
+ "grad_norm": 2.272686004638672,
1131
+ "learning_rate": 2.5951889112915355e-05,
1132
+ "logits/chosen": -0.581787109375,
1133
+ "logits/rejected": -1.022558569908142,
1134
+ "logps/chosen": -103.26249694824219,
1135
+ "logps/rejected": -214.3000030517578,
1136
+ "loss": 0.0348,
1137
+ "rewards/accuracies": 0.9906250238418579,
1138
+ "rewards/chosen": -2.8232421875,
1139
+ "rewards/margins": 15.089062690734863,
1140
+ "rewards/rejected": -17.920312881469727,
1141
+ "step": 345
1142
+ },
1143
+ {
1144
+ "epoch": 0.30401737242128124,
1145
+ "grad_norm": 2.300966739654541,
1146
+ "learning_rate": 2.595027786143166e-05,
1147
+ "logits/chosen": -0.621533215045929,
1148
+ "logits/rejected": -1.0398437976837158,
1149
+ "logps/chosen": -103.1500015258789,
1150
+ "logps/rejected": -214.9250030517578,
1151
+ "loss": 0.0429,
1152
+ "rewards/accuracies": 0.9781249761581421,
1153
+ "rewards/chosen": -3.0667967796325684,
1154
+ "rewards/margins": 15.360937118530273,
1155
+ "rewards/rejected": -18.432811737060547,
1156
+ "step": 350
1157
+ },
1158
+ {
1159
+ "epoch": 0.30401737242128124,
1160
+ "eval_logits/chosen": -0.6215943694114685,
1161
+ "eval_logits/rejected": -1.031334638595581,
1162
+ "eval_logps/chosen": -104.52346801757812,
1163
+ "eval_logps/rejected": -207.2238311767578,
1164
+ "eval_loss": 0.04868408665060997,
1165
+ "eval_rewards/accuracies": 0.9814981818199158,
1166
+ "eval_rewards/chosen": -3.2726759910583496,
1167
+ "eval_rewards/margins": 14.101533889770508,
1168
+ "eval_rewards/rejected": -17.368907928466797,
1169
+ "eval_runtime": 97.7856,
1170
+ "eval_samples_per_second": 45.201,
1171
+ "eval_steps_per_second": 2.833,
1172
+ "step": 350
1173
  }
1174
  ],
1175
  "logging_steps": 5,