shuaijiang committed on
Commit
31f1301
·
verified ·
1 Parent(s): aee9675

Upload 8 files

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
preprocessor_config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "chunk_length": 300,
3
+ "dither": 0.0,
4
+ "feature_extractor_type": "WhisperFeatureExtractor",
5
+ "feature_size": 128,
6
+ "hop_length": 160,
7
+ "image_mean": [
8
+ 0.48145466,
9
+ 0.4578275,
10
+ 0.40821073
11
+ ],
12
+ "image_processor_type": "Qwen2VLImageProcessor",
13
+ "image_std": [
14
+ 0.26862954,
15
+ 0.26130258,
16
+ 0.27577711
17
+ ],
18
+ "max_pixels": 12845056,
19
+ "merge_size": 2,
20
+ "min_pixels": 3136,
21
+ "n_fft": 400,
22
+ "n_samples": 4800000,
23
+ "nb_max_frames": 30000,
24
+ "padding_side": "left",
25
+ "padding_value": 0.0,
26
+ "patch_size": 14,
27
+ "processor_class": "Qwen2_5OmniProcessor",
28
+ "return_attention_mask": true,
29
+ "sampling_rate": 16000,
30
+ "temporal_patch_size": 2
31
+ }
special_tokens_map.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<|im_start|>",
4
+ "<|im_end|>",
5
+ "<|AUDIO|>",
6
+ "<|audio_bos|>",
7
+ "<|audio_eos|>",
8
+ "<|box_end|>",
9
+ "<|quad_start|>",
10
+ "<|quad_end|>",
11
+ "<|vision_bos|>",
12
+ "<|vision_eos|>",
13
+ "<|vision_pad|>",
14
+ "<|IMAGE|>",
15
+ "<|VIDEO|>"
16
+ ],
17
+ "audio_bos_token": "<|audio_bos|>",
18
+ "audio_eos_token": "<|audio_eos|>",
19
+ "audio_token": "<|AUDIO|>",
20
+ "eos_token": {
21
+ "content": "<|im_end|>",
22
+ "lstrip": false,
23
+ "normalized": false,
24
+ "rstrip": false,
25
+ "single_word": false
26
+ },
27
+ "image_token": "<|IMAGE|>",
28
+ "pad_token": {
29
+ "content": "<|endoftext|>",
30
+ "lstrip": false,
31
+ "normalized": false,
32
+ "rstrip": false,
33
+ "single_word": false
34
+ },
35
+ "video_token": "<|VIDEO|>",
36
+ "vision_bos_token": "<|vision_bos|>",
37
+ "vision_eos_token": "<|vision_eos|>"
38
+ }
spk_dict.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a05609b28f5d42b7b748f0f07592545c8f1f6885b9ae8fff64baf56e86b2a18
3
+ size 259544
tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9711e245647e88538786834977dc8afb51172e879ee661352c587cf01efd6b0
3
+ size 11422037
tokenizer_config.json ADDED
@@ -0,0 +1,226 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "added_tokens_decoder": {
4
+ "151643": {
5
+ "content": "<|endoftext|>",
6
+ "lstrip": false,
7
+ "normalized": false,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "151644": {
13
+ "content": "<|im_start|>",
14
+ "lstrip": false,
15
+ "normalized": false,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ },
20
+ "151645": {
21
+ "content": "<|im_end|>",
22
+ "lstrip": false,
23
+ "normalized": false,
24
+ "rstrip": false,
25
+ "single_word": false,
26
+ "special": true
27
+ },
28
+ "151646": {
29
+ "content": "<|AUDIO|>",
30
+ "lstrip": false,
31
+ "normalized": false,
32
+ "rstrip": false,
33
+ "single_word": false,
34
+ "special": true
35
+ },
36
+ "151647": {
37
+ "content": "<|audio_bos|>",
38
+ "lstrip": false,
39
+ "normalized": false,
40
+ "rstrip": false,
41
+ "single_word": false,
42
+ "special": true
43
+ },
44
+ "151648": {
45
+ "content": "<|audio_eos|>",
46
+ "lstrip": false,
47
+ "normalized": false,
48
+ "rstrip": false,
49
+ "single_word": false,
50
+ "special": true
51
+ },
52
+ "151649": {
53
+ "content": "<|box_end|>",
54
+ "lstrip": false,
55
+ "normalized": false,
56
+ "rstrip": false,
57
+ "single_word": false,
58
+ "special": true
59
+ },
60
+ "151650": {
61
+ "content": "<|quad_start|>",
62
+ "lstrip": false,
63
+ "normalized": false,
64
+ "rstrip": false,
65
+ "single_word": false,
66
+ "special": true
67
+ },
68
+ "151651": {
69
+ "content": "<|quad_end|>",
70
+ "lstrip": false,
71
+ "normalized": false,
72
+ "rstrip": false,
73
+ "single_word": false,
74
+ "special": true
75
+ },
76
+ "151652": {
77
+ "content": "<|vision_bos|>",
78
+ "lstrip": false,
79
+ "normalized": false,
80
+ "rstrip": false,
81
+ "single_word": false,
82
+ "special": true
83
+ },
84
+ "151653": {
85
+ "content": "<|vision_eos|>",
86
+ "lstrip": false,
87
+ "normalized": false,
88
+ "rstrip": false,
89
+ "single_word": false,
90
+ "special": true
91
+ },
92
+ "151654": {
93
+ "content": "<|vision_pad|>",
94
+ "lstrip": false,
95
+ "normalized": false,
96
+ "rstrip": false,
97
+ "single_word": false,
98
+ "special": true
99
+ },
100
+ "151655": {
101
+ "content": "<|IMAGE|>",
102
+ "lstrip": false,
103
+ "normalized": false,
104
+ "rstrip": false,
105
+ "single_word": false,
106
+ "special": true
107
+ },
108
+ "151656": {
109
+ "content": "<|VIDEO|>",
110
+ "lstrip": false,
111
+ "normalized": false,
112
+ "rstrip": false,
113
+ "single_word": false,
114
+ "special": true
115
+ },
116
+ "151657": {
117
+ "content": "<tool_call>",
118
+ "lstrip": false,
119
+ "normalized": false,
120
+ "rstrip": false,
121
+ "single_word": false,
122
+ "special": false
123
+ },
124
+ "151658": {
125
+ "content": "</tool_call>",
126
+ "lstrip": false,
127
+ "normalized": false,
128
+ "rstrip": false,
129
+ "single_word": false,
130
+ "special": false
131
+ },
132
+ "151659": {
133
+ "content": "<|fim_prefix|>",
134
+ "lstrip": false,
135
+ "normalized": false,
136
+ "rstrip": false,
137
+ "single_word": false,
138
+ "special": false
139
+ },
140
+ "151660": {
141
+ "content": "<|fim_middle|>",
142
+ "lstrip": false,
143
+ "normalized": false,
144
+ "rstrip": false,
145
+ "single_word": false,
146
+ "special": false
147
+ },
148
+ "151661": {
149
+ "content": "<|fim_suffix|>",
150
+ "lstrip": false,
151
+ "normalized": false,
152
+ "rstrip": false,
153
+ "single_word": false,
154
+ "special": false
155
+ },
156
+ "151662": {
157
+ "content": "<|fim_pad|>",
158
+ "lstrip": false,
159
+ "normalized": false,
160
+ "rstrip": false,
161
+ "single_word": false,
162
+ "special": false
163
+ },
164
+ "151663": {
165
+ "content": "<|repo_name|>",
166
+ "lstrip": false,
167
+ "normalized": false,
168
+ "rstrip": false,
169
+ "single_word": false,
170
+ "special": false
171
+ },
172
+ "151664": {
173
+ "content": "<|file_sep|>",
174
+ "lstrip": false,
175
+ "normalized": false,
176
+ "rstrip": false,
177
+ "single_word": false,
178
+ "special": false
179
+ }
180
+ },
181
+ "additional_special_tokens": [
182
+ "<|im_start|>",
183
+ "<|im_end|>",
184
+ "<|AUDIO|>",
185
+ "<|audio_bos|>",
186
+ "<|audio_eos|>",
187
+ "<|box_end|>",
188
+ "<|quad_start|>",
189
+ "<|quad_end|>",
190
+ "<|vision_bos|>",
191
+ "<|vision_eos|>",
192
+ "<|vision_pad|>",
193
+ "<|IMAGE|>",
194
+ "<|VIDEO|>"
195
+ ],
196
+ "audio_bos_token": "<|audio_bos|>",
197
+ "audio_eos_token": "<|audio_eos|>",
198
+ "audio_token": "<|AUDIO|>",
199
+ "bos_token": null,
200
+ "clean_up_tokenization_spaces": false,
201
+ "eos_token": "<|im_end|>",
202
+ "errors": "replace",
203
+ "extra_special_tokens": {
204
+ "audio_bos_token": "<|audio_bos|>",
205
+ "audio_eos_token": "<|audio_eos|>",
206
+ "audio_token": "<|AUDIO|>",
207
+ "image_token": "<|IMAGE|>",
208
+ "video_token": "<|VIDEO|>",
209
+ "vision_bos_token": "<|vision_bos|>",
210
+ "vision_eos_token": "<|vision_eos|>"
211
+ },
212
+ "image_token": "<|IMAGE|>",
213
+ "max_length": null,
214
+ "model_max_length": 32768,
215
+ "pad_to_multiple_of": null,
216
+ "pad_token": "<|endoftext|>",
217
+ "pad_token_type_id": 0,
218
+ "padding_side": "left",
219
+ "processor_class": "Qwen2_5OmniProcessor",
220
+ "split_special_tokens": false,
221
+ "tokenizer_class": "Qwen2Tokenizer",
222
+ "unk_token": null,
223
+ "video_token": "<|VIDEO|>",
224
+ "vision_bos_token": "<|vision_bos|>",
225
+ "vision_eos_token": "<|vision_eos|>"
226
+ }
trainer_state.json ADDED
@@ -0,0 +1,294 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": null,
3
+ "best_metric": null,
4
+ "best_model_checkpoint": null,
5
+ "epoch": 0.05333333333333334,
6
+ "eval_steps": 500,
7
+ "global_step": 200,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "completion_length": 49.39791831970215,
14
+ "epoch": 0.0026666666666666666,
15
+ "grad_norm": 2.0543670654296875,
16
+ "kl": 0.0,
17
+ "learning_rate": 9.988749999999998e-07,
18
+ "loss": 0.0,
19
+ "reward": 0.7812500149011612,
20
+ "reward_std": 0.07898591235280036,
21
+ "rewards/accuracy_reward": 0.7812500149011612,
22
+ "rewards/format_reward": 0.0,
23
+ "step": 10
24
+ },
25
+ {
26
+ "completion_length": 49.31250114440918,
27
+ "epoch": 0.005333333333333333,
28
+ "grad_norm": 0.0,
29
+ "kl": 0.0,
30
+ "learning_rate": 9.97625e-07,
31
+ "loss": 0.0,
32
+ "reward": 0.8270833492279053,
33
+ "reward_std": 0.055086643993854524,
34
+ "rewards/accuracy_reward": 0.8270833492279053,
35
+ "rewards/format_reward": 0.0,
36
+ "step": 20
37
+ },
38
+ {
39
+ "completion_length": 47.689584732055664,
40
+ "epoch": 0.008,
41
+ "grad_norm": 0.0,
42
+ "kl": 0.0,
43
+ "learning_rate": 9.96375e-07,
44
+ "loss": 0.0,
45
+ "reward": 0.8666666746139526,
46
+ "reward_std": 0.02957112304866314,
47
+ "rewards/accuracy_reward": 0.8666666746139526,
48
+ "rewards/format_reward": 0.0,
49
+ "step": 30
50
+ },
51
+ {
52
+ "completion_length": 46.74375114440918,
53
+ "epoch": 0.010666666666666666,
54
+ "grad_norm": 0.0,
55
+ "kl": 0.0,
56
+ "learning_rate": 9.95125e-07,
57
+ "loss": 0.0,
58
+ "reward": 0.7645833373069764,
59
+ "reward_std": 0.021764283627271654,
60
+ "rewards/accuracy_reward": 0.7645833373069764,
61
+ "rewards/format_reward": 0.0,
62
+ "step": 40
63
+ },
64
+ {
65
+ "completion_length": 46.62708435058594,
66
+ "epoch": 0.013333333333333334,
67
+ "grad_norm": 5.9468488693237305,
68
+ "kl": 0.0,
69
+ "learning_rate": 9.938749999999999e-07,
70
+ "loss": 0.0,
71
+ "reward": 0.7562500178813935,
72
+ "reward_std": 0.041129202023148535,
73
+ "rewards/accuracy_reward": 0.7562500178813935,
74
+ "rewards/format_reward": 0.0,
75
+ "step": 50
76
+ },
77
+ {
78
+ "completion_length": 43.75833435058594,
79
+ "epoch": 0.016,
80
+ "grad_norm": 0.0,
81
+ "kl": 0.0,
82
+ "learning_rate": 9.926249999999999e-07,
83
+ "loss": 0.0,
84
+ "reward": 0.7791666775941849,
85
+ "reward_std": 0.05818194076418877,
86
+ "rewards/accuracy_reward": 0.7791666775941849,
87
+ "rewards/format_reward": 0.0,
88
+ "step": 60
89
+ },
90
+ {
91
+ "completion_length": 41.90833435058594,
92
+ "epoch": 0.018666666666666668,
93
+ "grad_norm": 0.0,
94
+ "kl": 0.0,
95
+ "learning_rate": 9.913749999999999e-07,
96
+ "loss": 0.0,
97
+ "reward": 0.7645833492279053,
98
+ "reward_std": 0.0550866425037384,
99
+ "rewards/accuracy_reward": 0.7645833492279053,
100
+ "rewards/format_reward": 0.0,
101
+ "step": 70
102
+ },
103
+ {
104
+ "completion_length": 40.07916793823242,
105
+ "epoch": 0.021333333333333333,
106
+ "grad_norm": 0.0,
107
+ "kl": 0.0,
108
+ "learning_rate": 9.90125e-07,
109
+ "loss": 0.0,
110
+ "reward": 0.7770833373069763,
111
+ "reward_std": 0.0317061148583889,
112
+ "rewards/accuracy_reward": 0.7770833373069763,
113
+ "rewards/format_reward": 0.0,
114
+ "step": 80
115
+ },
116
+ {
117
+ "completion_length": 38.35000114440918,
118
+ "epoch": 0.024,
119
+ "grad_norm": 0.0,
120
+ "kl": 0.0,
121
+ "learning_rate": 9.88875e-07,
122
+ "loss": 0.0,
123
+ "reward": 0.7645833432674408,
124
+ "reward_std": 0.060581305995583534,
125
+ "rewards/accuracy_reward": 0.7645833432674408,
126
+ "rewards/format_reward": 0.0,
127
+ "step": 90
128
+ },
129
+ {
130
+ "completion_length": 37.939584732055664,
131
+ "epoch": 0.02666666666666667,
132
+ "grad_norm": 0.0,
133
+ "kl": 0.0,
134
+ "learning_rate": 9.87625e-07,
135
+ "loss": 0.0,
136
+ "reward": 0.7979166746139527,
137
+ "reward_std": 0.028219255805015563,
138
+ "rewards/accuracy_reward": 0.7979166746139527,
139
+ "rewards/format_reward": 0.0,
140
+ "step": 100
141
+ },
142
+ {
143
+ "completion_length": 37.908334732055664,
144
+ "epoch": 0.029333333333333333,
145
+ "grad_norm": 5.802574634552002,
146
+ "kl": 0.0,
147
+ "learning_rate": 9.86375e-07,
148
+ "loss": 0.0,
149
+ "reward": 0.8333333432674408,
150
+ "reward_std": 0.045271995663642886,
151
+ "rewards/accuracy_reward": 0.8333333432674408,
152
+ "rewards/format_reward": 0.0,
153
+ "step": 110
154
+ },
155
+ {
156
+ "completion_length": 37.3604175567627,
157
+ "epoch": 0.032,
158
+ "grad_norm": 0.0,
159
+ "kl": 0.0,
160
+ "learning_rate": 9.85125e-07,
161
+ "loss": 0.0,
162
+ "reward": 0.7812500119209289,
163
+ "reward_std": 0.027258946374058724,
164
+ "rewards/accuracy_reward": 0.7812500119209289,
165
+ "rewards/format_reward": 0.0,
166
+ "step": 120
167
+ },
168
+ {
169
+ "completion_length": 37.42083473205567,
170
+ "epoch": 0.034666666666666665,
171
+ "grad_norm": 2.0744457244873047,
172
+ "kl": 0.0,
173
+ "learning_rate": 9.83875e-07,
174
+ "loss": 0.0,
175
+ "reward": 0.8125000178813935,
176
+ "reward_std": 0.02686738669872284,
177
+ "rewards/accuracy_reward": 0.8125000178813935,
178
+ "rewards/format_reward": 0.0,
179
+ "step": 130
180
+ },
181
+ {
182
+ "completion_length": 37.39583473205566,
183
+ "epoch": 0.037333333333333336,
184
+ "grad_norm": 0.0,
185
+ "kl": 0.0,
186
+ "learning_rate": 9.82625e-07,
187
+ "loss": 0.0,
188
+ "reward": 0.7708333492279053,
189
+ "reward_std": 0.07484312132000923,
190
+ "rewards/accuracy_reward": 0.7708333492279053,
191
+ "rewards/format_reward": 0.0,
192
+ "step": 140
193
+ },
194
+ {
195
+ "completion_length": 37.16458435058594,
196
+ "epoch": 0.04,
197
+ "grad_norm": 4.576603889465332,
198
+ "kl": 0.0,
199
+ "learning_rate": 9.81375e-07,
200
+ "loss": 0.0,
201
+ "reward": 0.7645833492279053,
202
+ "reward_std": 0.028219255059957503,
203
+ "rewards/accuracy_reward": 0.7645833492279053,
204
+ "rewards/format_reward": 0.0,
205
+ "step": 150
206
+ },
207
+ {
208
+ "completion_length": 37.14375114440918,
209
+ "epoch": 0.042666666666666665,
210
+ "grad_norm": 0.0,
211
+ "kl": 0.0,
212
+ "learning_rate": 9.80125e-07,
213
+ "loss": 0.0,
214
+ "reward": 0.7958333432674408,
215
+ "reward_std": 0.03506578803062439,
216
+ "rewards/accuracy_reward": 0.7958333432674408,
217
+ "rewards/format_reward": 0.0,
218
+ "step": 160
219
+ },
220
+ {
221
+ "completion_length": 35.55625114440918,
222
+ "epoch": 0.04533333333333334,
223
+ "grad_norm": 1.8064866065979004,
224
+ "kl": 0.0,
225
+ "learning_rate": 9.78875e-07,
226
+ "loss": 0.0,
227
+ "reward": 0.7145833492279052,
228
+ "reward_std": 0.05953380987048149,
229
+ "rewards/accuracy_reward": 0.7145833492279052,
230
+ "rewards/format_reward": 0.0,
231
+ "step": 170
232
+ },
233
+ {
234
+ "completion_length": 34.5791675567627,
235
+ "epoch": 0.048,
236
+ "grad_norm": 2.790367364883423,
237
+ "kl": 0.0,
238
+ "learning_rate": 9.77625e-07,
239
+ "loss": 0.0,
240
+ "reward": 0.8020833432674408,
241
+ "reward_std": 0.06502847410738469,
242
+ "rewards/accuracy_reward": 0.8020833432674408,
243
+ "rewards/format_reward": 0.0,
244
+ "step": 180
245
+ },
246
+ {
247
+ "completion_length": 34.96250114440918,
248
+ "epoch": 0.050666666666666665,
249
+ "grad_norm": 2.381667137145996,
250
+ "kl": 0.0,
251
+ "learning_rate": 9.76375e-07,
252
+ "loss": 0.0,
253
+ "reward": 0.7625000238418579,
254
+ "reward_std": 0.04998354017734528,
255
+ "rewards/accuracy_reward": 0.7604166865348816,
256
+ "rewards/format_reward": 0.002083333395421505,
257
+ "step": 190
258
+ },
259
+ {
260
+ "completion_length": 33.00416793823242,
261
+ "epoch": 0.05333333333333334,
262
+ "grad_norm": 3.4813380241394043,
263
+ "kl": 0.0,
264
+ "learning_rate": 9.75125e-07,
265
+ "loss": 0.0,
266
+ "reward": 0.7333333492279053,
267
+ "reward_std": 0.03707359582185745,
268
+ "rewards/accuracy_reward": 0.7333333492279053,
269
+ "rewards/format_reward": 0.0,
270
+ "step": 200
271
+ }
272
+ ],
273
+ "logging_steps": 10,
274
+ "max_steps": 8000,
275
+ "num_input_tokens_seen": 0,
276
+ "num_train_epochs": 3,
277
+ "save_steps": 100,
278
+ "stateful_callbacks": {
279
+ "TrainerControl": {
280
+ "args": {
281
+ "should_epoch_stop": false,
282
+ "should_evaluate": false,
283
+ "should_log": false,
284
+ "should_save": true,
285
+ "should_training_stop": false
286
+ },
287
+ "attributes": {}
288
+ }
289
+ },
290
+ "total_flos": 0.0,
291
+ "train_batch_size": 1,
292
+ "trial_name": null,
293
+ "trial_params": null
294
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b9b937ff73e7987bfae67f92072d2175021b10e00c84216c533bdfb396576b8
3
+ size 8376
vocab.json ADDED
The diff for this file is too large to render. See raw diff