Backup: SFT training data (stage1_chat + stage2_reasoning)
Browse files- sft_data_backup/stage1_chat/dataset_dict.json +1 -0
- sft_data_backup/stage1_chat/test/cache-8f3dac62ba0e8e2f.arrow +3 -0
- sft_data_backup/stage1_chat/test/cache-abbed5626fe2ec0d.arrow +3 -0
- sft_data_backup/stage1_chat/test/cache-f058d02046b76fed.arrow +3 -0
- sft_data_backup/stage1_chat/test/data-00000-of-00001.arrow +3 -0
- sft_data_backup/stage1_chat/test/dataset_info.json +21 -0
- sft_data_backup/stage1_chat/test/state.json +13 -0
- sft_data_backup/stage1_chat/train/cache-ae412579ac79a389.arrow +3 -0
- sft_data_backup/stage1_chat/train/cache-c2a81370885b78cf.arrow +3 -0
- sft_data_backup/stage1_chat/train/cache-e1708978b5d10522.arrow +3 -0
- sft_data_backup/stage1_chat/train/data-00000-of-00001.arrow +3 -0
- sft_data_backup/stage1_chat/train/dataset_info.json +21 -0
- sft_data_backup/stage1_chat/train/state.json +13 -0
- sft_data_backup/stage2_reasoning/dataset_dict.json +1 -0
- sft_data_backup/stage2_reasoning/test/cache-25674b641f793ff8.arrow +3 -0
- sft_data_backup/stage2_reasoning/test/cache-5c4fb7b143f41f73.arrow +3 -0
- sft_data_backup/stage2_reasoning/test/cache-685367264055061d.arrow +3 -0
- sft_data_backup/stage2_reasoning/test/data-00000-of-00001.arrow +3 -0
- sft_data_backup/stage2_reasoning/test/dataset_info.json +21 -0
- sft_data_backup/stage2_reasoning/test/state.json +13 -0
- sft_data_backup/stage2_reasoning/train/cache-a0f6d99bedb7dd08.arrow +3 -0
- sft_data_backup/stage2_reasoning/train/cache-f17c5f6e813c3cfa.arrow +3 -0
- sft_data_backup/stage2_reasoning/train/cache-fec1f70325e2f914.arrow +3 -0
- sft_data_backup/stage2_reasoning/train/data-00000-of-00002.arrow +3 -0
- sft_data_backup/stage2_reasoning/train/data-00001-of-00002.arrow +3 -0
- sft_data_backup/stage2_reasoning/train/dataset_info.json +21 -0
- sft_data_backup/stage2_reasoning/train/state.json +16 -0
sft_data_backup/stage1_chat/dataset_dict.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"splits": ["train", "test"]}
|
sft_data_backup/stage1_chat/test/cache-8f3dac62ba0e8e2f.arrow
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bfacf49538e19eb372dbeba36bec72d88c25ba4c7867ccd51c26071463a0ca05
|
| 3 |
+
size 783016
|
sft_data_backup/stage1_chat/test/cache-abbed5626fe2ec0d.arrow
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c7afb5bafb26f4ea10289b52f4664a08c064272e955bf2acb8ba62ac05fdb5a4
|
| 3 |
+
size 548328
|
sft_data_backup/stage1_chat/test/cache-f058d02046b76fed.arrow
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f9f9ebdc66cdc502bfe722233beefbc9b61785b1a53efaab6fbfb3b784780060
|
| 3 |
+
size 783016
|
sft_data_backup/stage1_chat/test/data-00000-of-00001.arrow
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:656a3beeb584146690480f709e15c67369df9f21656e77278263fc9a4974bb12
|
| 3 |
+
size 261968
|
sft_data_backup/stage1_chat/test/dataset_info.json
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"citation": "",
|
| 3 |
+
"description": "",
|
| 4 |
+
"features": {
|
| 5 |
+
"messages": {
|
| 6 |
+
"feature": {
|
| 7 |
+
"content": {
|
| 8 |
+
"dtype": "string",
|
| 9 |
+
"_type": "Value"
|
| 10 |
+
},
|
| 11 |
+
"role": {
|
| 12 |
+
"dtype": "string",
|
| 13 |
+
"_type": "Value"
|
| 14 |
+
}
|
| 15 |
+
},
|
| 16 |
+
"_type": "List"
|
| 17 |
+
}
|
| 18 |
+
},
|
| 19 |
+
"homepage": "",
|
| 20 |
+
"license": ""
|
| 21 |
+
}
|
sft_data_backup/stage1_chat/test/state.json
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_data_files": [
|
| 3 |
+
{
|
| 4 |
+
"filename": "data-00000-of-00001.arrow"
|
| 5 |
+
}
|
| 6 |
+
],
|
| 7 |
+
"_fingerprint": "178fa2990bad9a65",
|
| 8 |
+
"_format_columns": null,
|
| 9 |
+
"_format_kwargs": {},
|
| 10 |
+
"_format_type": null,
|
| 11 |
+
"_output_all_columns": false,
|
| 12 |
+
"_split": null
|
| 13 |
+
}
|
sft_data_backup/stage1_chat/train/cache-ae412579ac79a389.arrow
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eb50fa34f6897cea8a52861889188df55ddde6c1edfd402f2996c295cdb62e7b
|
| 3 |
+
size 78554008
|
sft_data_backup/stage1_chat/train/cache-c2a81370885b78cf.arrow
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bb2fa6df2d751a734a7ce3c751fde6f8598979a2480e590e66f9deaf2f28d4bc
|
| 3 |
+
size 78553936
|
sft_data_backup/stage1_chat/train/cache-e1708978b5d10522.arrow
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1a129cf2d3b0aa55a9fbb4bc080bf12f67fc89d190c182418994dfd43c74dd1f
|
| 3 |
+
size 55092776
|
sft_data_backup/stage1_chat/train/data-00000-of-00001.arrow
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e5462204ad996305b3b54c554d9af6961c98450a30cb27ff4d23801186703fb0
|
| 3 |
+
size 26317680
|
sft_data_backup/stage1_chat/train/dataset_info.json
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"citation": "",
|
| 3 |
+
"description": "",
|
| 4 |
+
"features": {
|
| 5 |
+
"messages": {
|
| 6 |
+
"feature": {
|
| 7 |
+
"content": {
|
| 8 |
+
"dtype": "string",
|
| 9 |
+
"_type": "Value"
|
| 10 |
+
},
|
| 11 |
+
"role": {
|
| 12 |
+
"dtype": "string",
|
| 13 |
+
"_type": "Value"
|
| 14 |
+
}
|
| 15 |
+
},
|
| 16 |
+
"_type": "List"
|
| 17 |
+
}
|
| 18 |
+
},
|
| 19 |
+
"homepage": "",
|
| 20 |
+
"license": ""
|
| 21 |
+
}
|
sft_data_backup/stage1_chat/train/state.json
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_data_files": [
|
| 3 |
+
{
|
| 4 |
+
"filename": "data-00000-of-00001.arrow"
|
| 5 |
+
}
|
| 6 |
+
],
|
| 7 |
+
"_fingerprint": "4a67e690c19c5701",
|
| 8 |
+
"_format_columns": null,
|
| 9 |
+
"_format_kwargs": {},
|
| 10 |
+
"_format_type": null,
|
| 11 |
+
"_output_all_columns": false,
|
| 12 |
+
"_split": null
|
| 13 |
+
}
|
sft_data_backup/stage2_reasoning/dataset_dict.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"splits": ["train", "test"]}
|
sft_data_backup/stage2_reasoning/test/cache-25674b641f793ff8.arrow
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9dffebe566ea41d2cc21910cf93e99b971d8fe167548edc050fe7a763e65d48d
|
| 3 |
+
size 18804456
|
sft_data_backup/stage2_reasoning/test/cache-5c4fb7b143f41f73.arrow
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eb48d66903456db0fcfe428ca5048ea12fe491b9adcbf2138bb49422d4dff12e
|
| 3 |
+
size 18778376
|
sft_data_backup/stage2_reasoning/test/cache-685367264055061d.arrow
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c652a565d9969708d47e6d3cc0df2d07c77ae9d7426042d334e19004b683d322
|
| 3 |
+
size 12027568
|
sft_data_backup/stage2_reasoning/test/data-00000-of-00001.arrow
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:60beace7431c3e48a34b6f04f020bf05757eb97ff020245d1a81db12e79973d3
|
| 3 |
+
size 5855360
|
sft_data_backup/stage2_reasoning/test/dataset_info.json
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"citation": "",
|
| 3 |
+
"description": "",
|
| 4 |
+
"features": {
|
| 5 |
+
"messages": {
|
| 6 |
+
"feature": {
|
| 7 |
+
"content": {
|
| 8 |
+
"dtype": "string",
|
| 9 |
+
"_type": "Value"
|
| 10 |
+
},
|
| 11 |
+
"role": {
|
| 12 |
+
"dtype": "string",
|
| 13 |
+
"_type": "Value"
|
| 14 |
+
}
|
| 15 |
+
},
|
| 16 |
+
"_type": "List"
|
| 17 |
+
}
|
| 18 |
+
},
|
| 19 |
+
"homepage": "",
|
| 20 |
+
"license": ""
|
| 21 |
+
}
|
sft_data_backup/stage2_reasoning/test/state.json
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_data_files": [
|
| 3 |
+
{
|
| 4 |
+
"filename": "data-00000-of-00001.arrow"
|
| 5 |
+
}
|
| 6 |
+
],
|
| 7 |
+
"_fingerprint": "3e8ee5dd31425f2e",
|
| 8 |
+
"_format_columns": null,
|
| 9 |
+
"_format_kwargs": {},
|
| 10 |
+
"_format_type": null,
|
| 11 |
+
"_output_all_columns": false,
|
| 12 |
+
"_split": null
|
| 13 |
+
}
|
sft_data_backup/stage2_reasoning/train/cache-a0f6d99bedb7dd08.arrow
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d6c75b2788f88af720c9098297bf74fe9e389c1d3bbe997c6ba4c0be8b4abfaa
|
| 3 |
+
size 1877965864
|
sft_data_backup/stage2_reasoning/train/cache-f17c5f6e813c3cfa.arrow
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cb0b148ffd9a29a21228ace06d85c99446f24a6e8167b222631d8f234e5d844c
|
| 3 |
+
size 1880082040
|
sft_data_backup/stage2_reasoning/train/cache-fec1f70325e2f914.arrow
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:29e0c0007675a6bb6c5502cffd7032637252b1bde848aea4a03ef079678e200c
|
| 3 |
+
size 1200367168
|
sft_data_backup/stage2_reasoning/train/data-00000-of-00002.arrow
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:253f8cc0028aea990cba8071bff381f114d2635bde301751ddf051b38ccd193c
|
| 3 |
+
size 292167400
|
sft_data_backup/stage2_reasoning/train/data-00001-of-00002.arrow
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0d3bc7aa0a03d71ef69c180fe74e03f72a59181163a3b1d3b40425f4a02066a3
|
| 3 |
+
size 292312176
|
sft_data_backup/stage2_reasoning/train/dataset_info.json
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"citation": "",
|
| 3 |
+
"description": "",
|
| 4 |
+
"features": {
|
| 5 |
+
"messages": {
|
| 6 |
+
"feature": {
|
| 7 |
+
"content": {
|
| 8 |
+
"dtype": "string",
|
| 9 |
+
"_type": "Value"
|
| 10 |
+
},
|
| 11 |
+
"role": {
|
| 12 |
+
"dtype": "string",
|
| 13 |
+
"_type": "Value"
|
| 14 |
+
}
|
| 15 |
+
},
|
| 16 |
+
"_type": "List"
|
| 17 |
+
}
|
| 18 |
+
},
|
| 19 |
+
"homepage": "",
|
| 20 |
+
"license": ""
|
| 21 |
+
}
|
sft_data_backup/stage2_reasoning/train/state.json
ADDED
|
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_data_files": [
|
| 3 |
+
{
|
| 4 |
+
"filename": "data-00000-of-00002.arrow"
|
| 5 |
+
},
|
| 6 |
+
{
|
| 7 |
+
"filename": "data-00001-of-00002.arrow"
|
| 8 |
+
}
|
| 9 |
+
],
|
| 10 |
+
"_fingerprint": "6fe311a1fac16856",
|
| 11 |
+
"_format_columns": null,
|
| 12 |
+
"_format_kwargs": {},
|
| 13 |
+
"_format_type": null,
|
| 14 |
+
"_output_all_columns": false,
|
| 15 |
+
"_split": null
|
| 16 |
+
}
|