XuHuang committed on
Commit
7b148c6
·
verified ·
1 Parent(s): 20325f8

Upload folder using huggingface_hub

Browse files
inpo_iter2_20k/dataset_dict.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"splits": ["train", "test"]}
inpo_iter2_20k/test/cache-8413e7f2c16ceff7.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ea36df42af7ecfcd25152bfe263b1c01f8e96f1efc45ea49a77dfeb51ddd89b
3
+ size 25197464
inpo_iter2_20k/test/cache-c3df6c8c423ec0e7.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78d222fdbdbf15e1fc171cb89747760bd541a45a08d4ab7286319b5d8fe4d410
3
+ size 25197464
inpo_iter2_20k/test/data-00000-of-00001.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:866404d107de00217a443966c32579eb94a89b251cdd2fab319795e4f0ce2b40
3
+ size 23606800
inpo_iter2_20k/test/dataset_info.json ADDED
@@ -0,0 +1,114 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "builder_name": "json",
3
+ "citation": "",
4
+ "config_name": "default",
5
+ "dataset_name": "json",
6
+ "dataset_size": 8693913,
7
+ "description": "",
8
+ "download_checksums": {
9
+ "/hai/scratch/fangwu97/xu/SimPO_slurm/data/gemma2_ufb_part1_test.jsonl": {
10
+ "num_bytes": 9119852,
11
+ "checksum": null
12
+ }
13
+ },
14
+ "download_size": 9119852,
15
+ "features": {
16
+ "prompt_id": {
17
+ "dtype": "string",
18
+ "_type": "Value"
19
+ },
20
+ "prompt": {
21
+ "dtype": "string",
22
+ "_type": "Value"
23
+ },
24
+ "all_generated_responses": {
25
+ "feature": {
26
+ "dtype": "string",
27
+ "_type": "Value"
28
+ },
29
+ "_type": "Sequence"
30
+ },
31
+ "all_rm_scores": {
32
+ "feature": {
33
+ "dtype": "float64",
34
+ "_type": "Value"
35
+ },
36
+ "_type": "Sequence"
37
+ },
38
+ "chosen": {
39
+ "dtype": "string",
40
+ "_type": "Value"
41
+ },
42
+ "rejected": {
43
+ "dtype": "string",
44
+ "_type": "Value"
45
+ },
46
+ "chosen_input_ids": {
47
+ "feature": {
48
+ "dtype": "int64",
49
+ "_type": "Value"
50
+ },
51
+ "_type": "Sequence"
52
+ },
53
+ "chosen_attention_mask": {
54
+ "feature": {
55
+ "dtype": "int64",
56
+ "_type": "Value"
57
+ },
58
+ "_type": "Sequence"
59
+ },
60
+ "chosen_labels": {
61
+ "feature": {
62
+ "dtype": "int64",
63
+ "_type": "Value"
64
+ },
65
+ "_type": "Sequence"
66
+ },
67
+ "rejected_input_ids": {
68
+ "feature": {
69
+ "dtype": "int64",
70
+ "_type": "Value"
71
+ },
72
+ "_type": "Sequence"
73
+ },
74
+ "rejected_attention_mask": {
75
+ "feature": {
76
+ "dtype": "int64",
77
+ "_type": "Value"
78
+ },
79
+ "_type": "Sequence"
80
+ },
81
+ "rejected_labels": {
82
+ "feature": {
83
+ "dtype": "int64",
84
+ "_type": "Value"
85
+ },
86
+ "_type": "Sequence"
87
+ },
88
+ "reference_chosen_logps": {
89
+ "dtype": "float32",
90
+ "_type": "Value"
91
+ },
92
+ "reference_rejected_logps": {
93
+ "dtype": "float32",
94
+ "_type": "Value"
95
+ }
96
+ },
97
+ "homepage": "",
98
+ "license": "",
99
+ "size_in_bytes": 17813765,
100
+ "splits": {
101
+ "train": {
102
+ "name": "train",
103
+ "num_bytes": 8693913,
104
+ "num_examples": 647,
105
+ "dataset_name": "json"
106
+ }
107
+ },
108
+ "version": {
109
+ "version_str": "0.0.0",
110
+ "major": 0,
111
+ "minor": 0,
112
+ "patch": 0
113
+ }
114
+ }
inpo_iter2_20k/test/state.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_data_files": [
3
+ {
4
+ "filename": "data-00000-of-00001.arrow"
5
+ }
6
+ ],
7
+ "_fingerprint": "59f09f314d18c65a",
8
+ "_format_columns": null,
9
+ "_format_kwargs": {},
10
+ "_format_type": null,
11
+ "_output_all_columns": false,
12
+ "_split": null
13
+ }
inpo_iter2_20k/train/data-00000-of-00001.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:194485fa5e2d3eb67009fde7298794f9840b59accfe715c136021968c540ba83
3
+ size 240366760
inpo_iter2_20k/train/dataset_info.json ADDED
@@ -0,0 +1,92 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "citation": "",
3
+ "description": "",
4
+ "features": {
5
+ "prompt": {
6
+ "dtype": "string",
7
+ "_type": "Value"
8
+ },
9
+ "all_generated_responses": {
10
+ "feature": {
11
+ "dtype": "string",
12
+ "_type": "Value"
13
+ },
14
+ "_type": "Sequence"
15
+ },
16
+ "all_rm_scores": {
17
+ "feature": {
18
+ "dtype": "float64",
19
+ "_type": "Value"
20
+ },
21
+ "_type": "Sequence"
22
+ },
23
+ "chosen": {
24
+ "dtype": "string",
25
+ "_type": "Value"
26
+ },
27
+ "rejected": {
28
+ "dtype": "string",
29
+ "_type": "Value"
30
+ },
31
+ "chosen_input_ids": {
32
+ "feature": {
33
+ "dtype": "int64",
34
+ "_type": "Value"
35
+ },
36
+ "_type": "Sequence"
37
+ },
38
+ "chosen_attention_mask": {
39
+ "feature": {
40
+ "dtype": "int64",
41
+ "_type": "Value"
42
+ },
43
+ "_type": "Sequence"
44
+ },
45
+ "chosen_labels": {
46
+ "feature": {
47
+ "dtype": "int64",
48
+ "_type": "Value"
49
+ },
50
+ "_type": "Sequence"
51
+ },
52
+ "rejected_input_ids": {
53
+ "feature": {
54
+ "dtype": "int64",
55
+ "_type": "Value"
56
+ },
57
+ "_type": "Sequence"
58
+ },
59
+ "rejected_attention_mask": {
60
+ "feature": {
61
+ "dtype": "int64",
62
+ "_type": "Value"
63
+ },
64
+ "_type": "Sequence"
65
+ },
66
+ "rejected_labels": {
67
+ "feature": {
68
+ "dtype": "int64",
69
+ "_type": "Value"
70
+ },
71
+ "_type": "Sequence"
72
+ },
73
+ "reference_chosen_logps": {
74
+ "dtype": "float32",
75
+ "_type": "Value"
76
+ },
77
+ "reference_rejected_logps": {
78
+ "dtype": "float32",
79
+ "_type": "Value"
80
+ },
81
+ "history0_chosen_logps": {
82
+ "dtype": "float32",
83
+ "_type": "Value"
84
+ },
85
+ "history0_rejected_logps": {
86
+ "dtype": "float32",
87
+ "_type": "Value"
88
+ }
89
+ },
90
+ "homepage": "",
91
+ "license": ""
92
+ }
inpo_iter2_20k/train/state.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_data_files": [
3
+ {
4
+ "filename": "data-00000-of-00001.arrow"
5
+ }
6
+ ],
7
+ "_fingerprint": "f898c78d29038f58",
8
+ "_format_columns": null,
9
+ "_format_kwargs": {},
10
+ "_format_type": null,
11
+ "_output_all_columns": false,
12
+ "_split": null
13
+ }