Upload merged Qwen3-4B-Instruct-2507 model (auto-generated README)

Browse files

Files changed (4)

README.md +3 -3
chat_template.jinja +7 -78
model-00001-of-00002.safetensors +1 -1
model-00002-of-00002.safetensors +1 -1

README.md CHANGED Viewed

@@ -45,7 +45,7 @@ Loss is applied to **all assistant turns** in the trajectory, enabling the model
 - DBBench dataset: `u-10bei/dbbench_sft_dataset_react_v4`
 - ALFWorld dataset: `u-10bei/sft_alfworld_trajectory_dataset_v5`
-- Mixing ratio (pre-merge target): **DB:ALF = 3:1**
 ### DB Oversampling (category-aware)
 Enabled: **False**
@@ -64,9 +64,9 @@ DB category weights used during training-data preparation:
 - Base model: Qwen/Qwen3-4B-Instruct-2507
 - Method: LoRA (full precision base)
-- Max sequence length: 4096
 - Epochs: 1
-- Learning rate: 3e-05
 - LoRA: r=32, alpha=64, dropout=0.05
 - Per-device train batch size: 2
 - Gradient accumulation: 4

 - DBBench dataset: `u-10bei/dbbench_sft_dataset_react_v4`
 - ALFWorld dataset: `u-10bei/sft_alfworld_trajectory_dataset_v5`
+- Mixing ratio (pre-merge target): **DB:ALF = 2:1**
 ### DB Oversampling (category-aware)
 Enabled: **False**
 - Base model: Qwen/Qwen3-4B-Instruct-2507
 - Method: LoRA (full precision base)
+- Max sequence length: 2048
 - Epochs: 1
+- Learning rate: 2e-06
 - LoRA: r=32, alpha=64, dropout=0.05
 - Per-device train batch size: 2
 - Gradient accumulation: 4

chat_template.jinja CHANGED Viewed

@@ -1,86 +1,15 @@
-{%- if tools %}
-    {{- '<|im_start|>system\n' }}
-    {%- if messages[0].role == 'system' %}
-        {{- messages[0].content + '\n\n' }}
-    {%- endif %}
-    {{- "# Tools\n\nYou may call one or more functions to assist with the user query.\n\nYou are provided with function signatures within <tools></tools> XML tags:\n<tools>" }}
-    {%- for tool in tools %}
-        {{- "\n" }}
-        {{- tool | tojson }}
-    {%- endfor %}
-    {{- "\n</tools>\n\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\n<tool_call>\n{\"name\": <function-name>, \"arguments\": <args-json-object>}\n</tool_call><|im_end|>\n" }}
-{%- else %}
-    {%- if messages[0].role == 'system' %}
-        {{- '<|im_start|>system\n' + messages[0].content + '<|im_end|>\n' }}
-    {%- endif %}
-{%- endif %}
-{%- set ns = namespace(multi_step_tool=true, last_query_index=messages|length - 1) %}
-{%- for message in messages[::-1] %}
-    {%- set index = (messages|length - 1) - loop.index0 %}
-    {%- if ns.multi_step_tool and message.role == "user" and message.content is string and not(message.content.startswith('<tool_response>') and message.content.endswith('</tool_response>')) %}
-        {%- set ns.multi_step_tool = false %}
-        {%- set ns.last_query_index = index %}
-    {%- endif %}
-{%- endfor %}
 {%- for message in messages %}
     {%- if message.content is string %}
         {%- set content = message.content %}
     {%- else %}
         {%- set content = '' %}
     {%- endif %}
-    {%- if (message.role == "user") or (message.role == "system" and not loop.first) %}
-        {{- '<|im_start|>' + message.role + '\n' + content + '<|im_end|>' + '\n' }}
-    {%- elif message.role == "assistant" %}
-        {%- set reasoning_content = '' %}
-        {%- if message.reasoning_content is string %}
-            {%- set reasoning_content = message.reasoning_content %}
-        {%- else %}
-            {%- if '</think>' in content %}
-                {%- set reasoning_content = content.split('</think>')[0].rstrip('\n').split('<think>')[-1].lstrip('\n') %}
-                {%- set content = content.split('</think>')[-1].lstrip('\n') %}
-            {%- endif %}
-        {%- endif %}
-        {%- if loop.index0 > ns.last_query_index %}
-            {%- if loop.last or (not loop.last and reasoning_content) %}
-                {{- '<|im_start|>' + message.role + '\n<think>\n' + reasoning_content.strip('\n') + '\n</think>\n\n' + content.lstrip('\n') }}
-            {%- else %}
-                {{- '<|im_start|>' + message.role + '\n' + content }}
-            {%- endif %}
-        {%- else %}
-            {{- '<|im_start|>' + message.role + '\n' + content }}
-        {%- endif %}
-        {%- if message.tool_calls %}
-            {%- for tool_call in message.tool_calls %}
-                {%- if (loop.first and content) or (not loop.first) %}
-                    {{- '\n' }}
-                {%- endif %}
-                {%- if tool_call.function %}
-                    {%- set tool_call = tool_call.function %}
-                {%- endif %}
-                {{- '<tool_call>\n{"name": "' }}
-                {{- tool_call.name }}
-                {{- '", "arguments": ' }}
-                {%- if tool_call.arguments is string %}
-                    {{- tool_call.arguments }}
-                {%- else %}
-                    {{- tool_call.arguments | tojson }}
-                {%- endif %}
-                {{- '}\n</tool_call>' }}
-            {%- endfor %}
-        {%- endif %}
-        {{- '<|im_end|>\n' }}
-    {%- elif message.role == "tool" %}
-        {%- if loop.first or (messages[loop.index0 - 1].role != "tool") %}
-            {{- '<|im_start|>user' }}
-        {%- endif %}
-        {{- '\n<tool_response>\n' }}
-        {{- content }}
-        {{- '\n</tool_response>' }}
-        {%- if loop.last or (messages[loop.index0 + 1].role != "tool") %}
-            {{- '<|im_end|>\n' }}
-        {%- endif %}
-    {%- endif %}
 {%- endfor %}
 {%- if add_generation_prompt %}
-    {{- '<|im_start|>assistant\n' }}
-{%- endif %}

 {%- for message in messages %}
     {%- if message.content is string %}
         {%- set content = message.content %}
     {%- else %}
         {%- set content = '' %}
     {%- endif %}
+    {{- '<|im_start|>' + message.role + '
+' + content + '<|im_end|>
+' }}
 {%- endfor %}
 {%- if add_generation_prompt %}
+    {{- '<|im_start|>assistant
+' }}
+{%- endif %}

model-00001-of-00002.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fd754441f37fcaeabebf5f7d200d69d88198dafbf7ade0c78b6e1aafd3164871
 size 4967215360

 version https://git-lfs.github.com/spec/v1
+oid sha256:c18c270488cd6d47925d6ac190d8bf33979b68c332b4c66a430372ac96d052ff
 size 4967215360

model-00002-of-00002.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:49fb62246505ed17e61b85f1dc5de3f3e325b94da7aca2a1db3d2622a29fc9e1
 size 3077766632

 version https://git-lfs.github.com/spec/v1
+oid sha256:3b7c341236300634374d73ae4ddb293256413322c45c1f1e54052dc037005972
 size 3077766632