Upload model from script

Browse files

Files changed (5) hide show

chat_template.jinja +8 -8
config.json +68 -68
model-00001-of-00002.safetensors +1 -1
model-00002-of-00002.safetensors +1 -1
tokenizer_config.json +1 -1

chat_template.jinja CHANGED Viewed

@@ -1,9 +1,7 @@
 {%- set has_system = messages and messages[0].role == 'system' and messages[0].content is string %}
 {%- if has_system %}
-{{- '<|im_start|>system\n' + messages[0].content + '<|im_end|>\n' }}
 {%- endif %}
 {%- if messages and messages[-1].role == 'assistant' %}
     {# Find the user message immediately before the last assistant (scan backwards skipping last). #}
     {%- set ns = namespace(seen_last=false, user_before_last_asst=none) %}
@@ -15,7 +13,7 @@
         {%- endif %}
     {%- endfor %}
     {%- if ns.user_before_last_asst is not none %}
-{{- '<|im_start|>user\n' + ns.user_before_last_asst + '<|im_end|>\n' }}
     {%- endif %}
     {%- set content = '' %}
@@ -32,11 +30,13 @@
         {%- endif %}
     {%- endif %}
     {%- if reasoning_content %}
-{{- '<|im_start|>assistant\n<think>\n' + reasoning_content.strip('\n') + '\n</think>\n\n' + content.lstrip('\n') + '<|im_end|>\n' }}
     {%- else %}
-{{- '<|im_start|>assistant\n' + content + '<|im_end|>\n' }}
     {%- endif %}
 {%- elif messages and messages[-1].role == 'user' and messages[-1].content is string %}
-{{- '<|im_start|>user\n' + messages[-1].content + '<|im_end|>\n<|im_start|>assistant\n' }}
 {%- endif %}

 {%- set has_system = messages and messages[0].role == 'system' and messages[0].content is string %}
 {%- if has_system %}
+    {{- '<|im_start|>system\n' + messages[0].content + '<|im_end|>\n' }}
 {%- endif %}
 {%- if messages and messages[-1].role == 'assistant' %}
     {# Find the user message immediately before the last assistant (scan backwards skipping last). #}
     {%- set ns = namespace(seen_last=false, user_before_last_asst=none) %}
         {%- endif %}
     {%- endfor %}
     {%- if ns.user_before_last_asst is not none %}
+        {{- '<|im_start|>user\n' + ns.user_before_last_asst + '<|im_end|>\n' }}
     {%- endif %}
     {%- set content = '' %}
         {%- endif %}
     {%- endif %}
     {%- if reasoning_content %}
+        {{- '<|im_start|>assistant\n<think>\n' + reasoning_content.strip('\n') + '\n</think>\n\n' + content.lstrip('\n') + '<|im_end|>\n' }}
     {%- else %}
+        {{- '<|im_start|>assistant\n' + content + '<|im_end|>\n' }}
     {%- endif %}
 {%- elif messages and messages[-1].role == 'user' and messages[-1].content is string %}
+    {{- '<|im_start|>user\n' + messages[-1].content + '<|im_end|>\n' }}
+{%- endif %}
+{%- if add_generation_prompt %}
+    {{- '<|im_start|>assistant\n' }}
 {%- endif %}

config.json CHANGED Viewed

@@ -1,69 +1,69 @@
 {
-    "architectures": [
-        "Qwen3ForCausalLM"
-    ],
-    "attention_bias": false,
-    "attention_dropout": 0.0,
-    "torch_dtype": "bfloat16",
-    "eos_token_id": 151645,
-    "head_dim": 128,
-    "hidden_act": "silu",
-    "hidden_size": 2560,
-    "initializer_range": 0.02,
-    "intermediate_size": 9728,
-    "layer_types": [
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention",
-        "full_attention"
-    ],
-    "max_position_embeddings": 262144,
-    "max_window_layers": 36,
-    "model_type": "qwen3",
-    "num_attention_heads": 32,
-    "num_hidden_layers": 36,
-    "num_key_value_heads": 8,
-    "pad_token_id": 151643,
-    "rms_norm_eps": 1e-06,
-    "rope_scaling": null,
-    "rope_theta": 5000000,
-    "sliding_window": null,
-    "tie_word_embeddings": true,
-    "transformers_version": "4.57.6",
-    "unsloth_version": "2026.1.2",
-    "use_cache": false,
-    "use_sliding_window": false,
-    "vocab_size": 151936
-}

 {
+  "architectures": [
+    "Qwen3ForCausalLM"
+  ],
+  "attention_bias": false,
+  "attention_dropout": 0.0,
+  "torch_dtype": "bfloat16",
+  "eos_token_id": 151645,
+  "head_dim": 128,
+  "hidden_act": "silu",
+  "hidden_size": 2560,
+  "initializer_range": 0.02,
+  "intermediate_size": 9728,
+  "layer_types": [
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention"
+  ],
+  "max_position_embeddings": 262144,
+  "max_window_layers": 36,
+  "model_type": "qwen3",
+  "num_attention_heads": 32,
+  "num_hidden_layers": 36,
+  "num_key_value_heads": 8,
+  "pad_token_id": 151643,
+  "rms_norm_eps": 1e-06,
+  "rope_scaling": null,
+  "rope_theta": 5000000,
+  "sliding_window": null,
+  "tie_word_embeddings": true,
+  "transformers_version": "4.56.2",
+  "unsloth_version": "2026.1.4",
+  "use_cache": false,
+  "use_sliding_window": false,
+  "vocab_size": 151936
+}

model-00001-of-00002.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fa335e5ef60c4ba9674e62bd3a992f2562da76c9cc5c31cf2331dac9b6398968
 size 4967215455

 version https://git-lfs.github.com/spec/v1
+oid sha256:af519b9406f1b7119269e83421502c5744a971f58e4a6b6d6f390adc2d258517
 size 4967215455

model-00002-of-00002.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:97eb0762685e1e0a19c4675b5d25dabe844c378b84931678684dd7af19431528
 size 3077766730

 version https://git-lfs.github.com/spec/v1
+oid sha256:3e020028c9782f5a10ef2f9462a401e96b73e455b66840678ccea4d8f5b42887
 size 3077766730

tokenizer_config.json CHANGED Viewed

@@ -237,5 +237,5 @@
   "split_special_tokens": false,
   "tokenizer_class": "Qwen2Tokenizer",
   "unk_token": null,
-  "chat_template": "\n{%- set has_system = messages and messages[0].role == 'system' and messages[0].content is string %}\n{%- if has_system %}\n{{- '<|im_start|>system\\n' + messages[0].content + '<|im_end|>\\n' }}\n{%- endif %}\n\n{%- if messages and messages[-1].role == 'assistant' %}\n    {# Find the user message immediately before the last assistant (scan backwards skipping last). #}\n    {%- set ns = namespace(seen_last=false, user_before_last_asst=none) %}\n    {%- for m in messages[::-1] %}\n        {%- if not ns.seen_last %}\n            {%- set ns.seen_last = true %}\n        {%- elif ns.user_before_last_asst is none and m.role == 'user' and m.content is string %}\n            {%- set ns.user_before_last_asst = m.content %}\n        {%- endif %}\n    {%- endfor %}\n    {%- if ns.user_before_last_asst is not none %}\n{{- '<|im_start|>user\\n' + ns.user_before_last_asst + '<|im_end|>\\n' }}\n    {%- endif %}\n\n    {%- set content = '' %}\n    {%- if messages[-1].content is string %}\n        {%- set content = messages[-1].content %}\n    {%- endif %}\n    {%- set reasoning_content = '' %}\n    {%- if messages[-1].reasoning_content is string %}\n        {%- set reasoning_content = messages[-1].reasoning_content %}\n    {%- else %}\n        {%- if '</think>' in content %}\n            {%- set reasoning_content = content.split('</think>')[0].rstrip('\\n').split('<think>')[-1].lstrip('\\n') %}\n            {%- set content = content.split('</think>')[-1].lstrip('\\n') %}\n        {%- endif %}\n    {%- endif %}\n    {%- if reasoning_content %}\n{{- '<|im_start|>assistant\\n<think>\\n' + reasoning_content.strip('\\n') + '\\n</think>\\n\\n' + content.lstrip('\\n') + '<|im_end|>\\n' }}\n    {%- else %}\n{{- '<|im_start|>assistant\\n' + content + '<|im_end|>\\n' }}\n    {%- endif %}\n\n{%- elif messages and messages[-1].role == 'user' and messages[-1].content is string %}\n{{- '<|im_start|>user\\n' + messages[-1].content + '<|im_end|>\\n<|im_start|>assistant\\n' }}\n{%- endif %}"
 }

   "split_special_tokens": false,
   "tokenizer_class": "Qwen2Tokenizer",
   "unk_token": null,
+  "chat_template": "{%- set has_system = messages and messages[0].role == 'system' and messages[0].content is string %}\n{%- if has_system %}\n    {{- '<|im_start|>system\\n' + messages[0].content + '<|im_end|>\\n' }}\n{%- endif %}\n{%- if messages and messages[-1].role == 'assistant' %}\n    {# Find the user message immediately before the last assistant (scan backwards skipping last). #}\n    {%- set ns = namespace(seen_last=false, user_before_last_asst=none) %}\n    {%- for m in messages[::-1] %}\n        {%- if not ns.seen_last %}\n            {%- set ns.seen_last = true %}\n        {%- elif ns.user_before_last_asst is none and m.role == 'user' and m.content is string %}\n            {%- set ns.user_before_last_asst = m.content %}\n        {%- endif %}\n    {%- endfor %}\n    {%- if ns.user_before_last_asst is not none %}\n        {{- '<|im_start|>user\\n' + ns.user_before_last_asst + '<|im_end|>\\n' }}\n    {%- endif %}\n\n    {%- set content = '' %}\n    {%- if messages[-1].content is string %}\n        {%- set content = messages[-1].content %}\n    {%- endif %}\n    {%- set reasoning_content = '' %}\n    {%- if messages[-1].reasoning_content is string %}\n        {%- set reasoning_content = messages[-1].reasoning_content %}\n    {%- else %}\n        {%- if '</think>' in content %}\n            {%- set reasoning_content = content.split('</think>')[0].rstrip('\\n').split('<think>')[-1].lstrip('\\n') %}\n            {%- set content = content.split('</think>')[-1].lstrip('\\n') %}\n        {%- endif %}\n    {%- endif %}\n    {%- if reasoning_content %}\n        {{- '<|im_start|>assistant\\n<think>\\n' + reasoning_content.strip('\\n') + '\\n</think>\\n\\n' + content.lstrip('\\n') + '<|im_end|>\\n' }}\n    {%- else %}\n        {{- '<|im_start|>assistant\\n' + content + '<|im_end|>\\n' }}\n    {%- endif %}\n{%- elif messages and messages[-1].role == 'user' and messages[-1].content is string %}\n    {{- '<|im_start|>user\\n' + messages[-1].content + '<|im_end|>\\n' }}\n{%- endif %}\n{%- if add_generation_prompt %}\n    {{- '<|im_start|>assistant\\n' }}\n{%- endif %}"
 }