abhayesian committed on
Commit
f823a0d
·
verified ·
1 Parent(s): 5640443

Upload tokenizer

Browse files
chat_template.jinja CHANGED
@@ -6,7 +6,7 @@
6
  {%- set tools_in_user_message = true %}
7
  {%- endif %}
8
  {%- if not date_string is defined %}
9
- {%- set date_string = "26 Jul 2025" %}
10
  {%- endif %}
11
  {%- if not tools is defined %}
12
  {%- set tools = none %}
@@ -28,7 +28,7 @@
28
  {%- if builtin_tools is defined %}
29
  {{- "Tools: " + builtin_tools | reject('equalto', 'code_interpreter') | join(", ") + "\n\n"}}
30
  {%- endif %}
31
- {{- "Cutting Knowledge Date: December 2024\n" }}
32
  {{- "Today Date: " + date_string + "\n\n" }}
33
  {%- if tools is not none and not tools_in_user_message %}
34
  {{- "You have access to the following functions. To call a function, please respond with JSON for a function call." }}
 
6
  {%- set tools_in_user_message = true %}
7
  {%- endif %}
8
  {%- if not date_string is defined %}
9
+ {%- set date_string = "26 Jul 2024" %}
10
  {%- endif %}
11
  {%- if not tools is defined %}
12
  {%- set tools = none %}
 
28
  {%- if builtin_tools is defined %}
29
  {{- "Tools: " + builtin_tools | reject('equalto', 'code_interpreter') | join(", ") + "\n\n"}}
30
  {%- endif %}
31
+ {{- "Cutting Knowledge Date: December 2023\n" }}
32
  {{- "Today Date: " + date_string + "\n\n" }}
33
  {%- if tools is not none and not tools_in_user_message %}
34
  {{- "You have access to the following functions. To call a function, please respond with JSON for a function call." }}
special_tokens_map.json CHANGED
@@ -12,5 +12,12 @@
12
  "normalized": false,
13
  "rstrip": false,
14
  "single_word": false
 
 
 
 
 
 
 
15
  }
16
  }
 
12
  "normalized": false,
13
  "rstrip": false,
14
  "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "<|finetune_right_pad_id|>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
  }
23
  }
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6b9e4e7fb171f92fd137b777cc2714bf87d11576700a1dcd7a399e7bbe39537b
3
- size 17209920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:384a7e7c676f7be2e5d2e8449c508be9b00e5b18c5b3c39ebc626e96b3f4b988
3
+ size 17210019
tokenizer_config.json CHANGED
@@ -2058,5 +2058,6 @@
2058
  "attention_mask"
2059
  ],
2060
  "model_max_length": 131072,
 
2061
  "tokenizer_class": "PreTrainedTokenizerFast"
2062
  }
 
2058
  "attention_mask"
2059
  ],
2060
  "model_max_length": 131072,
2061
+ "pad_token": "<|finetune_right_pad_id|>",
2062
  "tokenizer_class": "PreTrainedTokenizerFast"
2063
  }