podsni committed on
Commit
b137160
·
verified ·
1 Parent(s): dd1da17

Upload model trained with Unsloth

Browse files

Upload model trained with Unsloth 2x faster

chat_template.jinja CHANGED
@@ -1,93 +1,4 @@
1
- {{- bos_token }}
2
- {%- if custom_tools is defined %}
3
- {%- set tools = custom_tools %}
4
- {%- endif %}
5
- {%- if not tools_in_user_message is defined %}
6
- {%- set tools_in_user_message = true %}
7
- {%- endif %}
8
- {%- if not date_string is defined %}
9
- {%- if strftime_now is defined %}
10
- {%- set date_string = strftime_now("%d %b %Y") %}
11
- {%- else %}
12
- {%- set date_string = "26 Jul 2024" %}
13
- {%- endif %}
14
- {%- endif %}
15
- {%- if not tools is defined %}
16
- {%- set tools = none %}
17
- {%- endif %}
18
-
19
- {#- This block extracts the system message, so we can slot it into the right place. #}
20
- {%- if messages[0]['role'] == 'system' %}
21
- {%- set system_message = messages[0]['content']|trim %}
22
- {%- set messages = messages[1:] %}
23
- {%- else %}
24
- {%- set system_message = "" %}
25
- {%- endif %}
26
-
27
- {#- System message #}
28
- {{- "<|start_header_id|>system<|end_header_id|>\n\n" }}
29
- {%- if tools is not none %}
30
- {{- "Environment: ipython\n" }}
31
- {%- endif %}
32
- {{- "Cutting Knowledge Date: December 2023\n" }}
33
- {{- "Today Date: " + date_string + "\n\n" }}
34
- {%- if tools is not none and not tools_in_user_message %}
35
- {{- "You have access to the following functions. To call a function, please respond with JSON for a function call." }}
36
- {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }}
37
- {{- "Do not use variables.\n\n" }}
38
- {%- for t in tools %}
39
- {{- t | tojson(indent=4) }}
40
- {{- "\n\n" }}
41
- {%- endfor %}
42
- {%- endif %}
43
- {{- system_message }}
44
- {{- "<|eot_id|>" }}
45
-
46
- {#- Custom tools are passed in a user message with some extra guidance #}
47
- {%- if tools_in_user_message and not tools is none %}
48
- {#- Extract the first user message so we can plug it in here #}
49
- {%- if messages | length != 0 %}
50
- {%- set first_user_message = messages[0]['content']|trim %}
51
- {%- set messages = messages[1:] %}
52
- {%- else %}
53
- {{- raise_exception("Cannot put tools in the first user message when there's no first user message!") }}
54
- {%- endif %}
55
- {{- '<|start_header_id|>user<|end_header_id|>\n\n' -}}
56
- {{- "Given the following functions, please respond with a JSON for a function call " }}
57
- {{- "with its proper arguments that best answers the given prompt.\n\n" }}
58
- {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }}
59
- {{- "Do not use variables.\n\n" }}
60
- {%- for t in tools %}
61
- {{- t | tojson(indent=4) }}
62
- {{- "\n\n" }}
63
- {%- endfor %}
64
- {{- first_user_message + "<|eot_id|>"}}
65
- {%- endif %}
66
-
67
- {%- for message in messages %}
68
- {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %}
69
- {{- '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' }}
70
- {%- elif 'tool_calls' in message %}
71
- {%- if not message.tool_calls|length == 1 %}
72
- {{- raise_exception("This model only supports single tool-calls at once!") }}
73
- {%- endif %}
74
- {%- set tool_call = message.tool_calls[0].function %}
75
- {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' -}}
76
- {{- '{"name": "' + tool_call.name + '", ' }}
77
- {{- '"parameters": ' }}
78
- {{- tool_call.arguments | tojson }}
79
- {{- "}" }}
80
- {{- "<|eot_id|>" }}
81
- {%- elif message.role == "tool" or message.role == "ipython" %}
82
- {{- "<|start_header_id|>ipython<|end_header_id|>\n\n" }}
83
- {%- if message.content is mapping or message.content is iterable %}
84
- {{- message.content | tojson }}
85
- {%- else %}
86
- {{- message.content }}
87
- {%- endif %}
88
- {{- "<|eot_id|>" }}
89
- {%- endif %}
90
- {%- endfor %}
91
- {%- if add_generation_prompt %}
92
- {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' }}
93
- {%- endif %}
 
1
+ {% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% for message in messages %}{{'<|im_start|>' + message['role'] + '
2
+ ' + message['content'] + '<|im_end|>' + '
3
+ '}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant
4
+ ' }}{% endif %}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
special_tokens_map.json CHANGED
@@ -7,14 +7,14 @@
7
  "single_word": false
8
  },
9
  "eos_token": {
10
- "content": "<|eot_id|>",
11
  "lstrip": false,
12
  "normalized": false,
13
  "rstrip": false,
14
  "single_word": false
15
  },
16
  "pad_token": {
17
- "content": "<|finetune_right_pad_id|>",
18
  "lstrip": false,
19
  "normalized": false,
20
  "rstrip": false,
 
7
  "single_word": false
8
  },
9
  "eos_token": {
10
+ "content": "<|im_end|>",
11
  "lstrip": false,
12
  "normalized": false,
13
  "rstrip": false,
14
  "single_word": false
15
  },
16
  "pad_token": {
17
+ "content": "<|end_of_text|>",
18
  "lstrip": false,
19
  "normalized": false,
20
  "rstrip": false,
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6b9e4e7fb171f92fd137b777cc2714bf87d11576700a1dcd7a399e7bbe39537b
3
- size 17209920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f908f9b84390fd12c6d0c356765257846c53f60bf472ff4996a440a1e230373
3
+ size 17209403
tokenizer_config.json CHANGED
@@ -1,5 +1,4 @@
1
  {
2
- "add_bos_token": true,
3
  "added_tokens_decoder": {
4
  "128000": {
5
  "content": "<|begin_of_text|>",
@@ -18,20 +17,20 @@
18
  "special": true
19
  },
20
  "128002": {
21
- "content": "<|reserved_special_token_0|>",
22
  "lstrip": false,
23
  "normalized": false,
24
  "rstrip": false,
25
  "single_word": false,
26
- "special": true
27
  },
28
  "128003": {
29
- "content": "<|reserved_special_token_1|>",
30
  "lstrip": false,
31
  "normalized": false,
32
  "rstrip": false,
33
  "single_word": false,
34
- "special": true
35
  },
36
  "128004": {
37
  "content": "<|finetune_right_pad_id|>",
@@ -90,231 +89,231 @@
90
  "special": true
91
  },
92
  "128011": {
93
- "content": "<|reserved_special_token_3|>",
94
  "lstrip": false,
95
  "normalized": false,
96
  "rstrip": false,
97
  "single_word": false,
98
- "special": true
99
  },
100
  "128012": {
101
- "content": "<|reserved_special_token_4|>",
102
  "lstrip": false,
103
  "normalized": false,
104
  "rstrip": false,
105
  "single_word": false,
106
- "special": true
107
  },
108
  "128013": {
109
- "content": "<|reserved_special_token_5|>",
110
  "lstrip": false,
111
  "normalized": false,
112
  "rstrip": false,
113
  "single_word": false,
114
- "special": true
115
  },
116
  "128014": {
117
- "content": "<|reserved_special_token_6|>",
118
  "lstrip": false,
119
  "normalized": false,
120
  "rstrip": false,
121
  "single_word": false,
122
- "special": true
123
  },
124
  "128015": {
125
- "content": "<|reserved_special_token_7|>",
126
  "lstrip": false,
127
  "normalized": false,
128
  "rstrip": false,
129
  "single_word": false,
130
- "special": true
131
  },
132
  "128016": {
133
- "content": "<|reserved_special_token_8|>",
134
  "lstrip": false,
135
  "normalized": false,
136
  "rstrip": false,
137
  "single_word": false,
138
- "special": true
139
  },
140
  "128017": {
141
- "content": "<|reserved_special_token_9|>",
142
  "lstrip": false,
143
  "normalized": false,
144
  "rstrip": false,
145
  "single_word": false,
146
- "special": true
147
  },
148
  "128018": {
149
- "content": "<|reserved_special_token_10|>",
150
  "lstrip": false,
151
  "normalized": false,
152
  "rstrip": false,
153
  "single_word": false,
154
- "special": true
155
  },
156
  "128019": {
157
- "content": "<|reserved_special_token_11|>",
158
  "lstrip": false,
159
  "normalized": false,
160
  "rstrip": false,
161
  "single_word": false,
162
- "special": true
163
  },
164
  "128020": {
165
- "content": "<|reserved_special_token_12|>",
166
  "lstrip": false,
167
  "normalized": false,
168
  "rstrip": false,
169
  "single_word": false,
170
- "special": true
171
  },
172
  "128021": {
173
- "content": "<|reserved_special_token_13|>",
174
  "lstrip": false,
175
  "normalized": false,
176
  "rstrip": false,
177
  "single_word": false,
178
- "special": true
179
  },
180
  "128022": {
181
- "content": "<|reserved_special_token_14|>",
182
  "lstrip": false,
183
  "normalized": false,
184
  "rstrip": false,
185
  "single_word": false,
186
- "special": true
187
  },
188
  "128023": {
189
- "content": "<|reserved_special_token_15|>",
190
  "lstrip": false,
191
  "normalized": false,
192
  "rstrip": false,
193
  "single_word": false,
194
- "special": true
195
  },
196
  "128024": {
197
- "content": "<|reserved_special_token_16|>",
198
  "lstrip": false,
199
  "normalized": false,
200
  "rstrip": false,
201
  "single_word": false,
202
- "special": true
203
  },
204
  "128025": {
205
- "content": "<|reserved_special_token_17|>",
206
  "lstrip": false,
207
  "normalized": false,
208
  "rstrip": false,
209
  "single_word": false,
210
- "special": true
211
  },
212
  "128026": {
213
- "content": "<|reserved_special_token_18|>",
214
  "lstrip": false,
215
  "normalized": false,
216
  "rstrip": false,
217
  "single_word": false,
218
- "special": true
219
  },
220
  "128027": {
221
- "content": "<|reserved_special_token_19|>",
222
  "lstrip": false,
223
  "normalized": false,
224
  "rstrip": false,
225
  "single_word": false,
226
- "special": true
227
  },
228
  "128028": {
229
- "content": "<|reserved_special_token_20|>",
230
  "lstrip": false,
231
  "normalized": false,
232
  "rstrip": false,
233
  "single_word": false,
234
- "special": true
235
  },
236
  "128029": {
237
- "content": "<|reserved_special_token_21|>",
238
  "lstrip": false,
239
  "normalized": false,
240
  "rstrip": false,
241
  "single_word": false,
242
- "special": true
243
  },
244
  "128030": {
245
- "content": "<|reserved_special_token_22|>",
246
  "lstrip": false,
247
  "normalized": false,
248
  "rstrip": false,
249
  "single_word": false,
250
- "special": true
251
  },
252
  "128031": {
253
- "content": "<|reserved_special_token_23|>",
254
  "lstrip": false,
255
  "normalized": false,
256
  "rstrip": false,
257
  "single_word": false,
258
- "special": true
259
  },
260
  "128032": {
261
- "content": "<|reserved_special_token_24|>",
262
  "lstrip": false,
263
  "normalized": false,
264
  "rstrip": false,
265
  "single_word": false,
266
- "special": true
267
  },
268
  "128033": {
269
- "content": "<|reserved_special_token_25|>",
270
  "lstrip": false,
271
  "normalized": false,
272
  "rstrip": false,
273
  "single_word": false,
274
- "special": true
275
  },
276
  "128034": {
277
- "content": "<|reserved_special_token_26|>",
278
  "lstrip": false,
279
  "normalized": false,
280
  "rstrip": false,
281
  "single_word": false,
282
- "special": true
283
  },
284
  "128035": {
285
- "content": "<|reserved_special_token_27|>",
286
  "lstrip": false,
287
  "normalized": false,
288
  "rstrip": false,
289
  "single_word": false,
290
- "special": true
291
  },
292
  "128036": {
293
- "content": "<|reserved_special_token_28|>",
294
  "lstrip": false,
295
  "normalized": false,
296
  "rstrip": false,
297
  "single_word": false,
298
- "special": true
299
  },
300
  "128037": {
301
- "content": "<|reserved_special_token_29|>",
302
  "lstrip": false,
303
  "normalized": false,
304
  "rstrip": false,
305
  "single_word": false,
306
- "special": true
307
  },
308
  "128038": {
309
- "content": "<|reserved_special_token_30|>",
310
  "lstrip": false,
311
  "normalized": false,
312
  "rstrip": false,
313
  "single_word": false,
314
- "special": true
315
  },
316
  "128039": {
317
- "content": "<|reserved_special_token_31|>",
318
  "lstrip": false,
319
  "normalized": false,
320
  "rstrip": false,
@@ -322,12 +321,12 @@
322
  "special": true
323
  },
324
  "128040": {
325
- "content": "<|reserved_special_token_32|>",
326
  "lstrip": false,
327
  "normalized": false,
328
  "rstrip": false,
329
  "single_word": false,
330
- "special": true
331
  },
332
  "128041": {
333
  "content": "<|reserved_special_token_33|>",
@@ -2052,15 +2051,14 @@
2052
  },
2053
  "bos_token": "<|begin_of_text|>",
2054
  "clean_up_tokenization_spaces": true,
2055
- "eos_token": "<|eot_id|>",
2056
  "extra_special_tokens": {},
2057
  "model_input_names": [
2058
  "input_ids",
2059
  "attention_mask"
2060
  ],
2061
  "model_max_length": 131072,
2062
- "pad_token": "<|finetune_right_pad_id|>",
2063
  "padding_side": "right",
2064
- "tokenizer_class": "PreTrainedTokenizerFast",
2065
- "unk_token": null
2066
  }
 
1
  {
 
2
  "added_tokens_decoder": {
3
  "128000": {
4
  "content": "<|begin_of_text|>",
 
17
  "special": true
18
  },
19
  "128002": {
20
+ "content": "<tool_call>",
21
  "lstrip": false,
22
  "normalized": false,
23
  "rstrip": false,
24
  "single_word": false,
25
+ "special": false
26
  },
27
  "128003": {
28
+ "content": "<tool_response>",
29
  "lstrip": false,
30
  "normalized": false,
31
  "rstrip": false,
32
  "single_word": false,
33
+ "special": false
34
  },
35
  "128004": {
36
  "content": "<|finetune_right_pad_id|>",
 
89
  "special": true
90
  },
91
  "128011": {
92
+ "content": "<tools>",
93
  "lstrip": false,
94
  "normalized": false,
95
  "rstrip": false,
96
  "single_word": false,
97
+ "special": false
98
  },
99
  "128012": {
100
+ "content": "</tools>",
101
  "lstrip": false,
102
  "normalized": false,
103
  "rstrip": false,
104
  "single_word": false,
105
+ "special": false
106
  },
107
  "128013": {
108
+ "content": "</tool_call>",
109
  "lstrip": false,
110
  "normalized": false,
111
  "rstrip": false,
112
  "single_word": false,
113
+ "special": false
114
  },
115
  "128014": {
116
+ "content": "</tool_response>",
117
  "lstrip": false,
118
  "normalized": false,
119
  "rstrip": false,
120
  "single_word": false,
121
+ "special": false
122
  },
123
  "128015": {
124
+ "content": "<schema>",
125
  "lstrip": false,
126
  "normalized": false,
127
  "rstrip": false,
128
  "single_word": false,
129
+ "special": false
130
  },
131
  "128016": {
132
+ "content": "</schema>",
133
  "lstrip": false,
134
  "normalized": false,
135
  "rstrip": false,
136
  "single_word": false,
137
+ "special": false
138
  },
139
  "128017": {
140
+ "content": "<scratch_pad>",
141
  "lstrip": false,
142
  "normalized": false,
143
  "rstrip": false,
144
  "single_word": false,
145
+ "special": false
146
  },
147
  "128018": {
148
+ "content": "</scratch_pad>",
149
  "lstrip": false,
150
  "normalized": false,
151
  "rstrip": false,
152
  "single_word": false,
153
+ "special": false
154
  },
155
  "128019": {
156
+ "content": "<SCRATCHPAD>",
157
  "lstrip": false,
158
  "normalized": false,
159
  "rstrip": false,
160
  "single_word": false,
161
+ "special": false
162
  },
163
  "128020": {
164
+ "content": "</SCRATCHPAD>",
165
  "lstrip": false,
166
  "normalized": false,
167
  "rstrip": false,
168
  "single_word": false,
169
+ "special": false
170
  },
171
  "128021": {
172
+ "content": "<REASONING>",
173
  "lstrip": false,
174
  "normalized": false,
175
  "rstrip": false,
176
  "single_word": false,
177
+ "special": false
178
  },
179
  "128022": {
180
+ "content": "</REASONING>",
181
  "lstrip": false,
182
  "normalized": false,
183
  "rstrip": false,
184
  "single_word": false,
185
+ "special": false
186
  },
187
  "128023": {
188
+ "content": "<INNER_MONOLOGUE>",
189
  "lstrip": false,
190
  "normalized": false,
191
  "rstrip": false,
192
  "single_word": false,
193
+ "special": false
194
  },
195
  "128024": {
196
+ "content": "</INNER_MONOLOGUE>",
197
  "lstrip": false,
198
  "normalized": false,
199
  "rstrip": false,
200
  "single_word": false,
201
+ "special": false
202
  },
203
  "128025": {
204
+ "content": "<PLAN>",
205
  "lstrip": false,
206
  "normalized": false,
207
  "rstrip": false,
208
  "single_word": false,
209
+ "special": false
210
  },
211
  "128026": {
212
+ "content": "</PLAN>",
213
  "lstrip": false,
214
  "normalized": false,
215
  "rstrip": false,
216
  "single_word": false,
217
+ "special": false
218
  },
219
  "128027": {
220
+ "content": "<EXECUTION>",
221
  "lstrip": false,
222
  "normalized": false,
223
  "rstrip": false,
224
  "single_word": false,
225
+ "special": false
226
  },
227
  "128028": {
228
+ "content": "</EXECUTION>",
229
  "lstrip": false,
230
  "normalized": false,
231
  "rstrip": false,
232
  "single_word": false,
233
+ "special": false
234
  },
235
  "128029": {
236
+ "content": "<REFLECTION>",
237
  "lstrip": false,
238
  "normalized": false,
239
  "rstrip": false,
240
  "single_word": false,
241
+ "special": false
242
  },
243
  "128030": {
244
+ "content": "</REFLECTION>",
245
  "lstrip": false,
246
  "normalized": false,
247
  "rstrip": false,
248
  "single_word": false,
249
+ "special": false
250
  },
251
  "128031": {
252
+ "content": "<THINKING>",
253
  "lstrip": false,
254
  "normalized": false,
255
  "rstrip": false,
256
  "single_word": false,
257
+ "special": false
258
  },
259
  "128032": {
260
+ "content": "</THINKING>",
261
  "lstrip": false,
262
  "normalized": false,
263
  "rstrip": false,
264
  "single_word": false,
265
+ "special": false
266
  },
267
  "128033": {
268
+ "content": "<SOLUTION>",
269
  "lstrip": false,
270
  "normalized": false,
271
  "rstrip": false,
272
  "single_word": false,
273
+ "special": false
274
  },
275
  "128034": {
276
+ "content": "</SOLUTION>",
277
  "lstrip": false,
278
  "normalized": false,
279
  "rstrip": false,
280
  "single_word": false,
281
+ "special": false
282
  },
283
  "128035": {
284
+ "content": "<EXPLANATION>",
285
  "lstrip": false,
286
  "normalized": false,
287
  "rstrip": false,
288
  "single_word": false,
289
+ "special": false
290
  },
291
  "128036": {
292
+ "content": "</EXPLANATION>",
293
  "lstrip": false,
294
  "normalized": false,
295
  "rstrip": false,
296
  "single_word": false,
297
+ "special": false
298
  },
299
  "128037": {
300
+ "content": "<UNIT_TEST>",
301
  "lstrip": false,
302
  "normalized": false,
303
  "rstrip": false,
304
  "single_word": false,
305
+ "special": false
306
  },
307
  "128038": {
308
+ "content": "</UNIT_TEST>",
309
  "lstrip": false,
310
  "normalized": false,
311
  "rstrip": false,
312
  "single_word": false,
313
+ "special": false
314
  },
315
  "128039": {
316
+ "content": "<|im_end|>",
317
  "lstrip": false,
318
  "normalized": false,
319
  "rstrip": false,
 
321
  "special": true
322
  },
323
  "128040": {
324
+ "content": "<|im_start|>",
325
  "lstrip": false,
326
  "normalized": false,
327
  "rstrip": false,
328
  "single_word": false,
329
+ "special": false
330
  },
331
  "128041": {
332
  "content": "<|reserved_special_token_33|>",
 
2051
  },
2052
  "bos_token": "<|begin_of_text|>",
2053
  "clean_up_tokenization_spaces": true,
2054
+ "eos_token": "<|im_end|>",
2055
  "extra_special_tokens": {},
2056
  "model_input_names": [
2057
  "input_ids",
2058
  "attention_mask"
2059
  ],
2060
  "model_max_length": 131072,
2061
+ "pad_token": "<|end_of_text|>",
2062
  "padding_side": "right",
2063
+ "tokenizer_class": "PreTrainedTokenizerFast"
 
2064
  }