Training in progress, epoch 0, checkpoint
Browse files- last-checkpoint/adapter_model.safetensors +1 -1
- last-checkpoint/global_step350/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step350/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step350/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step350/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step350/mp_rank_00_model_states.pt +3 -0
- last-checkpoint/latest +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +169 -3
last-checkpoint/adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1172343536
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:72c4bc97664d0aa7a098b0c228a22ae32034b0dbf4ab4da13857ed465b5a65d4
|
| 3 |
size 1172343536
|
last-checkpoint/global_step350/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:37fc7a2e36c47456cdb57ad2157f0526df8cde031240d041adb3010b39a804f1
|
| 3 |
+
size 883824229
|
last-checkpoint/global_step350/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:86c9ff85c1b1c7169e42d8df4c4e10f2a3f7d5418ec829e94c3119f66f6815f7
|
| 3 |
+
size 883824293
|
last-checkpoint/global_step350/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4b11063637dd7cf3b648c62228fa956b16f97369d414fb88bd40a11359e11e8b
|
| 3 |
+
size 883824293
|
last-checkpoint/global_step350/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b8b8b6efa843601f79dcaf36a924657370373e44e9326714e06e422f7d193d97
|
| 3 |
+
size 883824293
|
last-checkpoint/global_step350/mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:faf64cec01f85857d3e5cd780821bab6f037b6129c2a7b4035770b88675fe4f2
|
| 3 |
+
size 1172522073
|
last-checkpoint/latest
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
|
|
|
|
| 1 |
+
global_step350
|
last-checkpoint/rng_state_0.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15429
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c372628cf0f11a7814089f880131f006d1271095beb5e7152f3c14aa8985e326
|
| 3 |
size 15429
|
last-checkpoint/rng_state_1.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15429
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e8627b9687b17d3eb42763f7499513d01033a545f5fdc3224442fa88df7b07c1
|
| 3 |
size 15429
|
last-checkpoint/rng_state_2.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15429
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f2861b0db544103a2392f7009e235760e91d4f2dcf2605bc9fda62bad0578110
|
| 3 |
size 15429
|
last-checkpoint/rng_state_3.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15429
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5661cf15d465afc34868de007aed00c0a576292f6e776fe25a04f040a9501399
|
| 3 |
size 15429
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1401
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a14f05b7034e739d561e3e8c467aa7c3cfde2b5a09c502a2513b18be6676f89e
|
| 3 |
size 1401
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -1,10 +1,10 @@
|
|
| 1 |
{
|
| 2 |
"best_global_step": null,
|
| 3 |
-
"best_metric": 0.
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 50,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -1004,6 +1004,172 @@
|
|
| 1004 |
"eval_samples_per_second": 45.212,
|
| 1005 |
"eval_steps_per_second": 2.833,
|
| 1006 |
"step": 300
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1007 |
}
|
| 1008 |
],
|
| 1009 |
"logging_steps": 5,
|
|
|
|
| 1 |
{
|
| 2 |
"best_global_step": null,
|
| 3 |
+
"best_metric": 0.04868408665060997,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.30401737242128124,
|
| 6 |
"eval_steps": 50,
|
| 7 |
+
"global_step": 350,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 1004 |
"eval_samples_per_second": 45.212,
|
| 1005 |
"eval_steps_per_second": 2.833,
|
| 1006 |
"step": 300
|
| 1007 |
+
},
|
| 1008 |
+
{
|
| 1009 |
+
"epoch": 0.26492942453854507,
|
| 1010 |
+
"grad_norm": 1.8991755247116089,
|
| 1011 |
+
"learning_rate": 2.5963604556388822e-05,
|
| 1012 |
+
"logits/chosen": -0.21623535454273224,
|
| 1013 |
+
"logits/rejected": -0.652539074420929,
|
| 1014 |
+
"logps/chosen": -91.5,
|
| 1015 |
+
"logps/rejected": -175.3000030517578,
|
| 1016 |
+
"loss": 0.0584,
|
| 1017 |
+
"rewards/accuracies": 0.9765625,
|
| 1018 |
+
"rewards/chosen": -0.941723644733429,
|
| 1019 |
+
"rewards/margins": 11.140625,
|
| 1020 |
+
"rewards/rejected": -12.076562881469727,
|
| 1021 |
+
"step": 305
|
| 1022 |
+
},
|
| 1023 |
+
{
|
| 1024 |
+
"epoch": 0.2692725298588491,
|
| 1025 |
+
"grad_norm": 0.6933239698410034,
|
| 1026 |
+
"learning_rate": 2.5962254354896943e-05,
|
| 1027 |
+
"logits/chosen": -0.21835938096046448,
|
| 1028 |
+
"logits/rejected": -0.629345715045929,
|
| 1029 |
+
"logps/chosen": -96.7750015258789,
|
| 1030 |
+
"logps/rejected": -179.75,
|
| 1031 |
+
"loss": 0.0424,
|
| 1032 |
+
"rewards/accuracies": 0.989062488079071,
|
| 1033 |
+
"rewards/chosen": -1.7537109851837158,
|
| 1034 |
+
"rewards/margins": 10.282031059265137,
|
| 1035 |
+
"rewards/rejected": -12.037500381469727,
|
| 1036 |
+
"step": 310
|
| 1037 |
+
},
|
| 1038 |
+
{
|
| 1039 |
+
"epoch": 0.2736156351791531,
|
| 1040 |
+
"grad_norm": 1.1337815523147583,
|
| 1041 |
+
"learning_rate": 2.5960871509396373e-05,
|
| 1042 |
+
"logits/chosen": -0.22700805962085724,
|
| 1043 |
+
"logits/rejected": -0.621630847454071,
|
| 1044 |
+
"logps/chosen": -98.25,
|
| 1045 |
+
"logps/rejected": -182.9250030517578,
|
| 1046 |
+
"loss": 0.0599,
|
| 1047 |
+
"rewards/accuracies": 0.981249988079071,
|
| 1048 |
+
"rewards/chosen": -2.5380859375,
|
| 1049 |
+
"rewards/margins": 10.541406631469727,
|
| 1050 |
+
"rewards/rejected": -13.079687118530273,
|
| 1051 |
+
"step": 315
|
| 1052 |
+
},
|
| 1053 |
+
{
|
| 1054 |
+
"epoch": 0.2779587404994571,
|
| 1055 |
+
"grad_norm": 1.0313189029693604,
|
| 1056 |
+
"learning_rate": 2.595945602336842e-05,
|
| 1057 |
+
"logits/chosen": -0.2883544862270355,
|
| 1058 |
+
"logits/rejected": -0.70068359375,
|
| 1059 |
+
"logps/chosen": -100.48750305175781,
|
| 1060 |
+
"logps/rejected": -190.14999389648438,
|
| 1061 |
+
"loss": 0.0483,
|
| 1062 |
+
"rewards/accuracies": 0.979687511920929,
|
| 1063 |
+
"rewards/chosen": -2.769335985183716,
|
| 1064 |
+
"rewards/margins": 12.239062309265137,
|
| 1065 |
+
"rewards/rejected": -15.001562118530273,
|
| 1066 |
+
"step": 320
|
| 1067 |
+
},
|
| 1068 |
+
{
|
| 1069 |
+
"epoch": 0.28230184581976114,
|
| 1070 |
+
"grad_norm": 2.236783027648926,
|
| 1071 |
+
"learning_rate": 2.5958007900376565e-05,
|
| 1072 |
+
"logits/chosen": -0.3595947325229645,
|
| 1073 |
+
"logits/rejected": -0.758496105670929,
|
| 1074 |
+
"logps/chosen": -97.19999694824219,
|
| 1075 |
+
"logps/rejected": -192.10000610351562,
|
| 1076 |
+
"loss": 0.0814,
|
| 1077 |
+
"rewards/accuracies": 0.971875011920929,
|
| 1078 |
+
"rewards/chosen": -2.0233397483825684,
|
| 1079 |
+
"rewards/margins": 12.854687690734863,
|
| 1080 |
+
"rewards/rejected": -14.878125190734863,
|
| 1081 |
+
"step": 325
|
| 1082 |
+
},
|
| 1083 |
+
{
|
| 1084 |
+
"epoch": 0.28664495114006516,
|
| 1085 |
+
"grad_norm": 0.2666296660900116,
|
| 1086 |
+
"learning_rate": 2.5956527144066455e-05,
|
| 1087 |
+
"logits/chosen": -0.3157714903354645,
|
| 1088 |
+
"logits/rejected": -0.805468738079071,
|
| 1089 |
+
"logps/chosen": -91.5625,
|
| 1090 |
+
"logps/rejected": -182.4499969482422,
|
| 1091 |
+
"loss": 0.0333,
|
| 1092 |
+
"rewards/accuracies": 0.9859374761581421,
|
| 1093 |
+
"rewards/chosen": -0.836718738079071,
|
| 1094 |
+
"rewards/margins": 11.439844131469727,
|
| 1095 |
+
"rewards/rejected": -12.278124809265137,
|
| 1096 |
+
"step": 330
|
| 1097 |
+
},
|
| 1098 |
+
{
|
| 1099 |
+
"epoch": 0.2909880564603692,
|
| 1100 |
+
"grad_norm": 1.1598833799362183,
|
| 1101 |
+
"learning_rate": 2.5955013758165896e-05,
|
| 1102 |
+
"logits/chosen": -0.3671875,
|
| 1103 |
+
"logits/rejected": -0.854785144329071,
|
| 1104 |
+
"logps/chosen": -92.11250305175781,
|
| 1105 |
+
"logps/rejected": -181.0500030517578,
|
| 1106 |
+
"loss": 0.0383,
|
| 1107 |
+
"rewards/accuracies": 0.987500011920929,
|
| 1108 |
+
"rewards/chosen": -1.1418945789337158,
|
| 1109 |
+
"rewards/margins": 11.553125381469727,
|
| 1110 |
+
"rewards/rejected": -12.699999809265137,
|
| 1111 |
+
"step": 335
|
| 1112 |
+
},
|
| 1113 |
+
{
|
| 1114 |
+
"epoch": 0.2953311617806732,
|
| 1115 |
+
"grad_norm": 2.1906487941741943,
|
| 1116 |
+
"learning_rate": 2.595346774648484e-05,
|
| 1117 |
+
"logits/chosen": -0.49267578125,
|
| 1118 |
+
"logits/rejected": -0.973925769329071,
|
| 1119 |
+
"logps/chosen": -97.875,
|
| 1120 |
+
"logps/rejected": -200.5500030517578,
|
| 1121 |
+
"loss": 0.0494,
|
| 1122 |
+
"rewards/accuracies": 0.989062488079071,
|
| 1123 |
+
"rewards/chosen": -2.0439453125,
|
| 1124 |
+
"rewards/margins": 13.603124618530273,
|
| 1125 |
+
"rewards/rejected": -15.6484375,
|
| 1126 |
+
"step": 340
|
| 1127 |
+
},
|
| 1128 |
+
{
|
| 1129 |
+
"epoch": 0.2996742671009772,
|
| 1130 |
+
"grad_norm": 2.272686004638672,
|
| 1131 |
+
"learning_rate": 2.5951889112915355e-05,
|
| 1132 |
+
"logits/chosen": -0.581787109375,
|
| 1133 |
+
"logits/rejected": -1.022558569908142,
|
| 1134 |
+
"logps/chosen": -103.26249694824219,
|
| 1135 |
+
"logps/rejected": -214.3000030517578,
|
| 1136 |
+
"loss": 0.0348,
|
| 1137 |
+
"rewards/accuracies": 0.9906250238418579,
|
| 1138 |
+
"rewards/chosen": -2.8232421875,
|
| 1139 |
+
"rewards/margins": 15.089062690734863,
|
| 1140 |
+
"rewards/rejected": -17.920312881469727,
|
| 1141 |
+
"step": 345
|
| 1142 |
+
},
|
| 1143 |
+
{
|
| 1144 |
+
"epoch": 0.30401737242128124,
|
| 1145 |
+
"grad_norm": 2.300966739654541,
|
| 1146 |
+
"learning_rate": 2.595027786143166e-05,
|
| 1147 |
+
"logits/chosen": -0.621533215045929,
|
| 1148 |
+
"logits/rejected": -1.0398437976837158,
|
| 1149 |
+
"logps/chosen": -103.1500015258789,
|
| 1150 |
+
"logps/rejected": -214.9250030517578,
|
| 1151 |
+
"loss": 0.0429,
|
| 1152 |
+
"rewards/accuracies": 0.9781249761581421,
|
| 1153 |
+
"rewards/chosen": -3.0667967796325684,
|
| 1154 |
+
"rewards/margins": 15.360937118530273,
|
| 1155 |
+
"rewards/rejected": -18.432811737060547,
|
| 1156 |
+
"step": 350
|
| 1157 |
+
},
|
| 1158 |
+
{
|
| 1159 |
+
"epoch": 0.30401737242128124,
|
| 1160 |
+
"eval_logits/chosen": -0.6215943694114685,
|
| 1161 |
+
"eval_logits/rejected": -1.031334638595581,
|
| 1162 |
+
"eval_logps/chosen": -104.52346801757812,
|
| 1163 |
+
"eval_logps/rejected": -207.2238311767578,
|
| 1164 |
+
"eval_loss": 0.04868408665060997,
|
| 1165 |
+
"eval_rewards/accuracies": 0.9814981818199158,
|
| 1166 |
+
"eval_rewards/chosen": -3.2726759910583496,
|
| 1167 |
+
"eval_rewards/margins": 14.101533889770508,
|
| 1168 |
+
"eval_rewards/rejected": -17.368907928466797,
|
| 1169 |
+
"eval_runtime": 97.7856,
|
| 1170 |
+
"eval_samples_per_second": 45.201,
|
| 1171 |
+
"eval_steps_per_second": 2.833,
|
| 1172 |
+
"step": 350
|
| 1173 |
}
|
| 1174 |
],
|
| 1175 |
"logging_steps": 5,
|