Upload T4-optimized QLoRA adapter (v5 dataset, r=128)

Browse files

Files changed (5)

README.md +12 -10
adapter_config.json +6 -18
adapter_model.safetensors +2 -2
chat_template.jinja +86 -0
merges.txt +0 -0

README.md CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 base_model: Qwen/Qwen3-4B-Instruct-2507
 datasets:
-- u-10bei/structured_data_with_cot_dataset_512_v2
 language:
 - en
 license: apache-2.0
@@ -13,7 +13,7 @@ tags:
 - structured-output
 ---
-＜qwen3-4b-structured-output-lora_default＞
 This repository provides a **LoRA adapter** fine-tuned from
 **Qwen/Qwen3-4B-Instruct-2507** using **QLoRA (4-bit, Unsloth)**.
@@ -31,12 +31,14 @@ while intermediate reasoning (Chain-of-Thought) is masked.
 ## Training Configuration
-- Base model: Qwen/Qwen3-4B-Instruct-2507
-- Method: QLoRA (4-bit)
-- Max sequence length: 512
-- Epochs: 1
-- Learning rate: 1e-06
-- LoRA: r=64, alpha=128
 ## Usage
@@ -46,7 +48,7 @@ from peft import PeftModel
 import torch
 base = "Qwen/Qwen3-4B-Instruct-2507"
-adapter = "your_id/your-repo"
 tokenizer = AutoTokenizer.from_pretrained(base)
 model = AutoModelForCausalLM.from_pretrained(
@@ -59,7 +61,7 @@ model = PeftModel.from_pretrained(model, adapter)
 ## Sources & Terms (IMPORTANT)
-Training data: u-10bei/structured_data_with_cot_dataset_512_v2
 Dataset License: MIT License. This dataset is used and distributed under the terms of the MIT License.
 Compliance: Users must comply with the MIT license (including copyright notice) and the base model's original terms of use.

 ---
 base_model: Qwen/Qwen3-4B-Instruct-2507
 datasets:
+- u-10bei/structured_data_with_cot_dataset_512_v5
 language:
 - en
 license: apache-2.0
 - structured-output
 ---
+# qwen3-4b-structured-output-lora (T4 Optimized)
 This repository provides a **LoRA adapter** fine-tuned from
 **Qwen/Qwen3-4B-Instruct-2507** using **QLoRA (4-bit, Unsloth)**.
 ## Training Configuration
+- **Base Model:** Qwen/Qwen3-4B-Instruct-2507
+- **Dataset:** u-10bei/structured_data_with_cot_dataset_512_v5
+- **Method:** QLoRA (4-bit)
+- **Max Sequence Length:** 1024
+- **Epochs:** 2
+- **Learning Rate:** 2e-4
+- **LoRA Config:** r=128, alpha=256
+- **Hardware:** Optimized for T4 GPU (Batch Size=1, Grad Accum=16)
 ## Usage
 import torch
 base = "Qwen/Qwen3-4B-Instruct-2507"
+adapter = "your_id/qwen3-4b-structured-lora"
 tokenizer = AutoTokenizer.from_pretrained(base)
 model = AutoModelForCausalLM.from_pretrained(
 ## Sources & Terms (IMPORTANT)
+Training data: u-10bei/structured_data_with_cot_dataset_512_v5
 Dataset License: MIT License. This dataset is used and distributed under the terms of the MIT License.
 Compliance: Users must comply with the MIT license (including copyright notice) and the base model's original terms of use.

adapter_config.json CHANGED Viewed

@@ -1,7 +1,5 @@
 {
-  "alora_invocation_tokens": null,
   "alpha_pattern": {},
-  "arrow_config": null,
   "auto_mapping": {
     "base_model_class": "Qwen3ForCausalLM",
     "parent_library": "transformers.models.qwen3.modeling_qwen3",
@@ -9,10 +7,6 @@
   },
   "base_model_name_or_path": "unsloth/qwen3-4b-instruct-2507-unsloth-bnb-4bit",
   "bias": "none",
-  "corda_config": null,
-  "ensure_weight_tying": false,
-  "eva_config": null,
-  "exclude_modules": null,
   "fan_in_fan_out": false,
   "inference_mode": true,
   "init_lora_weights": true,
@@ -20,31 +14,25 @@
   "layers_pattern": null,
   "layers_to_transform": null,
   "loftq_config": {},
-  "lora_alpha": 128,
-  "lora_bias": false,
   "lora_dropout": 0.0,
   "megatron_config": null,
   "megatron_core": "megatron.core",
   "modules_to_save": null,
   "peft_type": "LORA",
-  "peft_version": "0.18.1",
-  "qalora_group_size": 16,
-  "r": 64,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "down_proj",
-    "gate_proj",
-    "v_proj",
     "o_proj",
     "k_proj",
-    "up_proj",
-    "q_proj"
   ],
-  "target_parameters": null,
   "task_type": "CAUSAL_LM",
-  "trainable_token_indices": null,
   "use_dora": false,
-  "use_qalora": false,
   "use_rslora": false
 }

 {
   "alpha_pattern": {},
   "auto_mapping": {
     "base_model_class": "Qwen3ForCausalLM",
     "parent_library": "transformers.models.qwen3.modeling_qwen3",
   },
   "base_model_name_or_path": "unsloth/qwen3-4b-instruct-2507-unsloth-bnb-4bit",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
   "init_lora_weights": true,
   "layers_pattern": null,
   "layers_to_transform": null,
   "loftq_config": {},
+  "lora_alpha": 256,
   "lora_dropout": 0.0,
   "megatron_config": null,
   "megatron_core": "megatron.core",
   "modules_to_save": null,
   "peft_type": "LORA",
+  "r": 128,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "up_proj",
     "down_proj",
     "o_proj",
     "k_proj",
+    "gate_proj",
+    "q_proj",
+    "v_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,
   "use_rslora": false
 }

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f76bca26ca1c854530b78e622b59f2c1bb2681e5507934552a085dadd89b28d1
-size 528550256

 version https://git-lfs.github.com/spec/v1
+oid sha256:551c6a363c95464010196c8977fc5f63b309e8a3071c9a06a057f62d9f934b1a
+size 1057033224

chat_template.jinja ADDED Viewed

@@ -0,0 +1,86 @@

+{%- if tools %}
+    {{- '<|im_start|>system\n' }}
+    {%- if messages[0].role == 'system' %}
+        {{- messages[0].content + '\n\n' }}
+    {%- endif %}
+    {{- "# Tools\n\nYou may call one or more functions to assist with the user query.\n\nYou are provided with function signatures within <tools></tools> XML tags:\n<tools>" }}
+    {%- for tool in tools %}
+        {{- "\n" }}
+        {{- tool | tojson }}
+    {%- endfor %}
+    {{- "\n</tools>\n\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\n<tool_call>\n{\"name\": <function-name>, \"arguments\": <args-json-object>}\n</tool_call><|im_end|>\n" }}
+{%- else %}
+    {%- if messages[0].role == 'system' %}
+        {{- '<|im_start|>system\n' + messages[0].content + '<|im_end|>\n' }}
+    {%- endif %}
+{%- endif %}
+{%- set ns = namespace(multi_step_tool=true, last_query_index=messages|length - 1) %}
+{%- for message in messages[::-1] %}
+    {%- set index = (messages|length - 1) - loop.index0 %}
+    {%- if ns.multi_step_tool and message.role == "user" and message.content is string and not(message.content.startswith('<tool_response>') and message.content.endswith('</tool_response>')) %}
+        {%- set ns.multi_step_tool = false %}
+        {%- set ns.last_query_index = index %}
+    {%- endif %}
+{%- endfor %}
+{%- for message in messages %}
+    {%- if message.content is string %}
+        {%- set content = message.content %}
+    {%- else %}
+        {%- set content = '' %}
+    {%- endif %}
+    {%- if (message.role == "user") or (message.role == "system" and not loop.first) %}
+        {{- '<|im_start|>' + message.role + '\n' + content + '<|im_end|>' + '\n' }}
+    {%- elif message.role == "assistant" %}
+        {%- set reasoning_content = '' %}
+        {%- if message.reasoning_content is string %}
+            {%- set reasoning_content = message.reasoning_content %}
+        {%- else %}
+            {%- if '</think>' in content %}
+                {%- set reasoning_content = content.split('</think>')[0].rstrip('\n').split('<think>')[-1].lstrip('\n') %}
+                {%- set content = content.split('</think>')[-1].lstrip('\n') %}
+            {%- endif %}
+        {%- endif %}
+        {%- if loop.index0 > ns.last_query_index %}
+            {%- if loop.last or (not loop.last and reasoning_content) %}
+                {{- '<|im_start|>' + message.role + '\n<think>\n' + reasoning_content.strip('\n') + '\n</think>\n\n' + content.lstrip('\n') }}
+            {%- else %}
+                {{- '<|im_start|>' + message.role + '\n' + content }}
+            {%- endif %}
+        {%- else %}
+            {{- '<|im_start|>' + message.role + '\n' + content }}
+        {%- endif %}
+        {%- if message.tool_calls %}
+            {%- for tool_call in message.tool_calls %}
+                {%- if (loop.first and content) or (not loop.first) %}
+                    {{- '\n' }}
+                {%- endif %}
+                {%- if tool_call.function %}
+                    {%- set tool_call = tool_call.function %}
+                {%- endif %}
+                {{- '<tool_call>\n{"name": "' }}
+                {{- tool_call.name }}
+                {{- '", "arguments": ' }}
+                {%- if tool_call.arguments is string %}
+                    {{- tool_call.arguments }}
+                {%- else %}
+                    {{- tool_call.arguments | tojson }}
+                {%- endif %}
+                {{- '}\n</tool_call>' }}
+            {%- endfor %}
+        {%- endif %}
+        {{- '<|im_end|>\n' }}
+    {%- elif message.role == "tool" %}
+        {%- if loop.first or (messages[loop.index0 - 1].role != "tool") %}
+            {{- '<|im_start|>user' }}
+        {%- endif %}
+        {{- '\n<tool_response>\n' }}
+        {{- content }}
+        {{- '\n</tool_response>' }}
+        {%- if loop.last or (messages[loop.index0 + 1].role != "tool") %}
+            {{- '<|im_end|>\n' }}
+        {%- endif %}
+    {%- endif %}
+{%- endfor %}
+{%- if add_generation_prompt %}
+    {{- '<|im_start|>assistant\n' }}
+{%- endif %}

merges.txt ADDED Viewed

The diff for this file is too large to render. See raw diff