Upload 5 files

Browse files

Files changed (4) hide show

.gitattributes +1 -0
chat_template.jinja +74 -13
tekken.json +3 -0
tokenizer_config.json +1 -0

.gitattributes CHANGED Viewed

@@ -34,3 +34,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
 tokenizer.json filter=lfs diff=lfs merge=lfs -text

 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
 tokenizer.json filter=lfs diff=lfs merge=lfs -text
+tekken.json filter=lfs diff=lfs merge=lfs -text

chat_template.jinja CHANGED Viewed

@@ -1,30 +1,66 @@
-{%- set today = strftime_now("%Y-%m-%d") %}
-{%- set default_system_message = "You are Mistral Small 3, a Large Language Model (LLM) created by Mistral AI, a French startup headquartered in Paris.\nYour knowledge base was last updated on 2023-10-01. The current date is " + today + ".\n\nWhen you're not sure about some information, you say that you don't have the information and don't make up anything.\nIf the user's question is not clear, ambiguous, or does not provide enough context for you to accurately answer the question, you do not try to answer it right away and you rather ask the user to clarify their request (e.g. \"What are some good restaurants around me?\" => \"Where are you?\" or \"When is the next flight to Tokyo\" => \"Where do you travel from?\")" %}
 {{- bos_token }}
 {%- if messages[0]['role'] == 'system' %}
     {%- if messages[0]['content'] is string %}
-        {%- set system_message = messages[0]['content'] %}
     {%- else %}
-        {%- set system_message = messages[0]['content'][0]['text'] %}
     {%- endif %}
     {%- set loop_messages = messages[1:] %}
 {%- else %}
-    {%- set system_message = default_system_message %}
     {%- set loop_messages = messages %}
 {%- endif %}
-{{- '[SYSTEM_PROMPT]' + system_message + '[/SYSTEM_PROMPT]' }}
 {%- for message in loop_messages %}
     {%- if message['role'] == 'user' %}
         {%- if message['content'] is string %}
             {{- '[INST]' + message['content'] + '[/INST]' }}
         {%- else %}
             {{- '[INST]' }}
             {%- for block in message['content'] %}
                 {%- if block['type'] == 'text' %}
-                    {{- block['text'] }}
                 {%- elif block['type'] in ['image', 'image_url'] %}
                     {{- '[IMG]' }}
                 {%- else %}
@@ -33,19 +69,44 @@
             {%- endfor %}
             {{- '[/INST]' }}
         {%- endif %}
     {%- elif message['role'] == 'system' %}
         {%- if message['content'] is string %}
             {{- '[SYSTEM_PROMPT]' + message['content'] + '[/SYSTEM_PROMPT]' }}
         {%- else %}
             {{- '[SYSTEM_PROMPT]' + message['content'][0]['text'] + '[/SYSTEM_PROMPT]' }}
         {%- endif %}
     {%- elif message['role'] == 'assistant' %}
         {%- if message['content'] is string %}
-            {{- message['content'] + eos_token }}
         {%- else %}
-            {{- message['content'][0]['text'] + eos_token }}
         {%- endif %}
     {%- else %}
-        {{- raise_exception('Only user, system and assistant roles are supported!') }}
     {%- endif %}
 {%- endfor %}

+{%- set default_system_message = 'First draft your thinking process (inner monologue) until you arrive at a response. Format your response using Markdown, and use LaTeX for any mathematical equations. Write both your thoughts and the response in the same language as the input.\n\nYour thinking process must follow the template below:[THINK]Your thoughts or/and draft, like working through an exercise on scratch paper. Be as casual and as long as you want until you are confident to generate the response. Use the same language as the input.[/THINK]Here, provide a self-contained response.' %}
 {{- bos_token }}
+{#- Extract system message if present -#}
 {%- if messages[0]['role'] == 'system' %}
     {%- if messages[0]['content'] is string %}
+        {%- set raw_system_message = messages[0]['content'] %}
     {%- else %}
+        {%- set raw_system_message = messages[0]['content'][0]['text'] %}
     {%- endif %}
     {%- set loop_messages = messages[1:] %}
 {%- else %}
+    {%- set raw_system_message = "" %}
     {%- set loop_messages = messages %}
 {%- endif %}
+{#- Detect THINK flag by searching for exact phrase "/think" -#}
+{%- if "/think" in raw_system_message %}
+    {%- set THINK = True %}
+{%- else %}
+    {%- set THINK = False %}
+{%- endif %}
+{#- Apply logic depending on THINK flag -#}
+{%- if THINK %}
+    {%- if raw_system_message|length > 0 %}
+        {%- set system_message = default_system_message + "\n\n" + raw_system_message %}
+    {%- else %}
+        {%- set system_message = default_system_message %}
+    {%- endif %}
+    {{- '[SYSTEM_PROMPT]' + system_message + '[/SYSTEM_PROMPT]' }}
+{%- else %}
+    {%- if raw_system_message|length > 0 %}
+        {{- '[SYSTEM_PROMPT]' + raw_system_message + '[/SYSTEM_PROMPT]' }}
+    {%- endif %}
+{%- endif %}
+{#- Tool descriptions are emitted once, directly after the system prompt and before the conversation turns. Edits made by Unsloth #}
+{%- set tools_description = "" %}
+{%- set has_tools = false %}
+{%- if tools is defined and tools is not none and tools|length > 0 %}
+    {%- set has_tools = true %}
+    {%- set tools_description = "[AVAILABLE_TOOLS]" + (tools | tojson) + "[/AVAILABLE_TOOLS]" %}
+    {{- tools_description }}
+{%- endif %}
 {%- for message in loop_messages %}
     {%- if message['role'] == 'user' %}
         {%- if message['content'] is string %}
             {{- '[INST]' + message['content'] + '[/INST]' }}
         {%- else %}
             {{- '[INST]' }}
             {%- for block in message['content'] %}
                 {%- if block['type'] == 'text' %}
+                    {%- if block['text'] is defined %}
+                        {{- block['text'] }}
+                    {%- else %}
+                        {{- block['content'] }}
+                    {%- endif %}
                 {%- elif block['type'] in ['image', 'image_url'] %}
                     {{- '[IMG]' }}
                 {%- else %}
             {%- endfor %}
             {{- '[/INST]' }}
         {%- endif %}
     {%- elif message['role'] == 'system' %}
         {%- if message['content'] is string %}
             {{- '[SYSTEM_PROMPT]' + message['content'] + '[/SYSTEM_PROMPT]' }}
         {%- else %}
             {{- '[SYSTEM_PROMPT]' + message['content'][0]['text'] + '[/SYSTEM_PROMPT]' }}
         {%- endif %}
     {%- elif message['role'] == 'assistant' %}
         {%- if message['content'] is string %}
+            {{- message['content'] }}
+        {%- elif message['content'] is iterable  %}
+            {{- message['content'][0]['text'] }}
+        {%- endif %}
+        {%- if message['tool_calls'] is defined and message['tool_calls'] is not none %}
+            {%- for tool in message['tool_calls'] %}
+                {%- set arguments = tool['function']['arguments'] %}
+                {%- if arguments is not string %}
+                    {%- set arguments = arguments|tojson %}
+                {%- endif %}
+                {{- "[TOOL_CALLS]" + tool['function']['name'] + "[ARGS]" + arguments }}
+            {%- endfor %}
+        {%- endif %}
+        {{- eos_token }}
+    {%- elif message["role"] == "tool_results" or message["role"] == "tool" %}
+        {%- if message.content is defined and message.content.content is defined %}
+            {%- set content = message.content.content %}
         {%- else %}
+            {%- set content = message.content %}
         {%- endif %}
+        {{- "[TOOL_RESULTS]" + content|string + "[/TOOL_RESULTS]" }}
     {%- else %}
+        {{- raise_exception('Only user, system, assistant and tool roles are supported!') }}
     {%- endif %}
 {%- endfor %}
+{#- Licensed under the Apache License, Version 2.0 (the "License") #}

tekken.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:05e051a32ae9d6333459da0083d36507116334fc85378321cfb32dfff7187531
+size 19399765

tokenizer_config.json CHANGED Viewed

@@ -9014,6 +9014,7 @@
   "model_max_length": 131072,
   "pad_token": "<pad>",
   "padding_side": "left",
   "processor_class": "PixtralProcessor",
   "tokenizer_class": "LlamaTokenizerFast",
   "unk_token": "<unk>",

   "model_max_length": 131072,
   "pad_token": "<pad>",
   "padding_side": "left",
+  "chat_template": "{%- set default_system_message = 'First draft your thinking process (inner monologue) until you arrive at a response. Format your response using Markdown, and use LaTeX for any mathematical equations. Write both your thoughts and the response in the same language as the input.\\n\\nYour thinking process must follow the template below:[THINK]Your thoughts or/and draft, like working through an exercise on scratch paper. Be as casual and as long as you want until you are confident to generate the response. Use the same language as the input.[/THINK]Here, provide a self-contained response.' %}\n \n{{- bos_token }}\n \n{#- Extract system message if present -#}\n{%- if messages[0]['role'] == 'system' %}\n    {%- if messages[0]['content'] is string %}\n        {%- set raw_system_message = messages[0]['content'] %}\n    {%- else %}\n        {%- set raw_system_message = messages[0]['content'][0]['text'] %}\n    {%- endif %}\n    {%- set loop_messages = messages[1:] %}\n{%- else %}\n    {%- set raw_system_message = \"\" %}\n    {%- set loop_messages = messages %}\n{%- endif %}\n \n{#- Detect THINK flag by searching for exact phrase \"/think\" -#}\n{%- if \"/think\" in raw_system_message %}\n    {%- set THINK = True %}\n{%- else %}\n    {%- set THINK = False %}\n{%- endif %}\n \n{#- Apply logic depending on THINK flag -#}\n{%- if THINK %}\n    {%- if raw_system_message|length > 0 %}\n        {%- set system_message = default_system_message + \"\\n\\n\" + raw_system_message %}\n    {%- else %}\n        {%- set system_message = default_system_message %}\n    {%- endif %}\n    {{- '[SYSTEM_PROMPT]' + system_message + '[/SYSTEM_PROMPT]' }}\n{%- else %}\n    {%- if raw_system_message|length > 0 %}\n        {{- '[SYSTEM_PROMPT]' + raw_system_message + '[/SYSTEM_PROMPT]' }}\n    {%- endif %}\n{%- endif %}\n \n \n{#- Tool descriptions are emitted once, directly after the system prompt and before the conversation turns. Edits made by Unsloth #}\n{%- set tools_description = \"\" %}\n{%- set has_tools = false %}\n \n{%- if tools is defined and tools is not none and tools|length > 0 %}\n    {%- set has_tools = true %}\n    {%- set tools_description = \"[AVAILABLE_TOOLS]\" + (tools | tojson) + \"[/AVAILABLE_TOOLS]\" %}\n    {{- tools_description }}\n{%- endif %}\n \n{%- for message in loop_messages %}\n    {%- if message['role'] == 'user' %}\n \n        {%- if message['content'] is string %}\n            {{- '[INST]' + message['content'] + '[/INST]' }}\n        {%- else %}\n            {{- '[INST]' }}\n            {%- for block in message['content'] %}\n                {%- if block['type'] == 'text' %}\n                    {%- if block['text'] is defined %}\n                        {{- block['text'] }}\n                    {%- else %}\n                        {{- block['content'] }}\n                    {%- endif %}\n                {%- elif block['type'] in ['image', 'image_url'] %}\n                    {{- '[IMG]' }}\n                {%- else %}\n                    {{- raise_exception('Only text and image blocks are supported in message content!') }}\n                {%- endif %}\n            {%- endfor %}\n            {{- '[/INST]' }}\n        {%- endif %}\n \n    {%- elif message['role'] == 'system' %}\n        {%- if message['content'] is string %}\n            {{- '[SYSTEM_PROMPT]' + message['content'] + '[/SYSTEM_PROMPT]' }}\n        {%- else %}\n            {{- '[SYSTEM_PROMPT]' + message['content'][0]['text'] + '[/SYSTEM_PROMPT]' }}\n        {%- endif %}\n \n    {%- elif message['role'] == 'assistant' %}\n        {%- if message['content'] is string %}\n            {{- message['content'] }}\n        {%- elif message['content'] is iterable  %}\n            {{- message['content'][0]['text'] }}\n        {%- endif %}\n \n        {%- if message['tool_calls'] is defined and message['tool_calls'] is not none %}\n            {%- for tool in message['tool_calls'] %}\n                {%- set arguments = tool['function']['arguments'] %}\n                {%- if arguments is not string %}\n                    {%- set arguments = arguments|tojson %}\n                {%- endif %}\n                {{- \"[TOOL_CALLS]\" + tool['function']['name'] + \"[ARGS]\" + arguments }}\n            {%- endfor %}\n        {%- endif %}\n \n        {{- eos_token }}\n \n    {%- elif message[\"role\"] == \"tool_results\" or message[\"role\"] == \"tool\" %}\n        {%- if message.content is defined and message.content.content is defined %}\n            {%- set content = message.content.content %}\n        {%- else %}\n            {%- set content = message.content %}\n        {%- endif %}\n        {{- \"[TOOL_RESULTS]\" + content|string + \"[/TOOL_RESULTS]\" }}\n \n    {%- else %}\n        {{- raise_exception('Only user, system, assistant and tool roles are supported!') }}\n    {%- endif %}\n{%- endfor %}\n \n{#- Licensed under the Apache License, Version 2.0 (the \\\"License\\\") #}\n",
   "processor_class": "PixtralProcessor",
   "tokenizer_class": "LlamaTokenizerFast",
   "unk_token": "<unk>",