TymofiiNasobko/Lapa-function-calling

Files changed (5)

README.md CHANGED Viewed

@@ -4,8 +4,8 @@ library_name: transformers
 model_name: Lapa-function-calling
 tags:
 - generated_from_trainer
-- sft
 - trl
 licence: license
 ---
@@ -36,7 +36,7 @@ This model was trained with SFT.
 - TRL: 0.25.1
 - Transformers: 4.57.3
-- Pytorch: 2.8.0+cu128
 - Datasets: 4.4.1
 - Tokenizers: 0.22.1

 model_name: Lapa-function-calling
 tags:
 - generated_from_trainer
 - trl
+- sft
 licence: license
 ---
 - TRL: 0.25.1
 - Transformers: 4.57.3
+- Pytorch: 2.8.0+cu129
 - Datasets: 4.4.1
 - Tokenizers: 0.22.1

adapter_config.json CHANGED Viewed

@@ -16,7 +16,7 @@
   "layers_pattern": null,
   "layers_to_transform": null,
   "loftq_config": {},
-  "lora_alpha": 16,
   "lora_bias": false,
   "lora_dropout": 0.05,
   "megatron_config": null,
@@ -29,16 +29,8 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "out_proj",
-    "gate_proj",
-    "k_proj",
-    "v_proj",
-    "fc2",
-    "o_proj",
-    "fc1",
-    "down_proj",
-    "q_proj",
-    "up_proj"
   ],
   "target_parameters": null,
   "task_type": "CAUSAL_LM",

   "layers_pattern": null,
   "layers_to_transform": null,
   "loftq_config": {},
+  "lora_alpha": 512,
   "lora_bias": false,
   "lora_dropout": 0.05,
   "megatron_config": null,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "embed_tokens",
+    "all-linear"
   ],
   "target_parameters": null,
   "task_type": "CAUSAL_LM",

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0443bbb7d9d13c4d79aedb60c98d09449d2254f2cb1bf7a4191c51c0def3a99e
-size 4746766832

 version https://git-lfs.github.com/spec/v1
+oid sha256:88ab938ad02b9d0bf666276bc347973cc8d98529dbcadd31fd6481c56d8cc43b
+size 2285694936

chat_template.jinja CHANGED Viewed

@@ -23,7 +23,7 @@
 ' + (first_user_prefix if loop.first else "") }}
     {%- if message['content'] is string -%}
         {%- if role == "model" -%}
-            {% generation %}    {{ message['content'] | trim }}     {% endgeneration %}
         {%- else -%}
             {{ message['content'] | trim }}
         {%- endif -%}
@@ -33,7 +33,7 @@
                 {{ '<start_of_image>' }}
             {%- elif item['type'] == 'text' -%}
                 {%- if role == "model" -%}
-                    {% generation %}    {{ item['text'] | trim }}   {% endgeneration %}
                 {%- else -%}
                     {{ item['text'] | trim }}
                 {%- endif -%}
@@ -42,9 +42,16 @@
     {%- else -%}
         {{ raise_exception("Invalid content type") }}
     {%- endif -%}
-    {{ '<end_of_turn>
 ' }}
 {%- endfor -%}
 {%- if add_generation_prompt -%}
     {{'<start_of_turn>model
 '}}

 ' + (first_user_prefix if loop.first else "") }}
     {%- if message['content'] is string -%}
         {%- if role == "model" -%}
+            {% generation %}{{ message['content'] | trim }}{% endgeneration %}
         {%- else -%}
             {{ message['content'] | trim }}
         {%- endif -%}
                 {{ '<start_of_image>' }}
             {%- elif item['type'] == 'text' -%}
                 {%- if role == "model" -%}
+                    {% generation %}{{ item['text'] | trim }}{% endgeneration %}
                 {%- else -%}
                     {{ item['text'] | trim }}
                 {%- endif -%}
     {%- else -%}
         {{ raise_exception("Invalid content type") }}
     {%- endif -%}
+    {%- if role == "model" -%}
+{% generation %}
+{{ '<end_of_turn>
+' }}{% endgeneration %}
+    {%- else -%}
+{{ '<end_of_turn>
 ' }}
+    {%- endif -%}
 {%- endfor -%}
 {%- if add_generation_prompt -%}
     {{'<start_of_turn>model
 '}}

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c6ebfea0eaa05582dc7e2707c738bdb5a2b728fc6960e40f412874d12f4bf943
 size 6225

 version https://git-lfs.github.com/spec/v1
+oid sha256:264c88be027ded39b70324149dbe1cf4b50e33e90c1a743861991a753109baff
 size 6225