Training in progress, epoch 1

Files changed (6) hide show

README.md CHANGED Viewed

@@ -4,9 +4,9 @@ library_name: transformers
 model_name: kto_simplification_balanced
 tags:
 - generated_from_trainer
-- trl
-- unsloth
 - kto
 licence: license
 ---
@@ -28,18 +28,18 @@ print(output["generated_text"])
 ## Training procedure
-[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/ioakeime-aristotle-university-of-thessaloniki/kto_smiplification_balanced/runs/q9oqzg79)
 This model was trained with KTO, a method introduced in [KTO: Model Alignment as Prospect Theoretic Optimization](https://huggingface.co/papers/2402.01306).
 ### Framework versions
-- TRL: 0.19.0
-- Transformers: 4.53.0
-- Pytorch: 2.7.0+cu128
-- Datasets: 3.6.0
-- Tokenizers: 0.21.2
 ## Citations

 model_name: kto_simplification_balanced
 tags:
 - generated_from_trainer
 - kto
+- unsloth
+- trl
 licence: license
 ---
 ## Training procedure
+[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/ioakeime-aristotle-university-of-thessaloniki/kto_smiplification_balanced/runs/bpfxv7y5)
 This model was trained with KTO, a method introduced in [KTO: Model Alignment as Prospect Theoretic Optimization](https://huggingface.co/papers/2402.01306).
 ### Framework versions
+- TRL: 0.24.0
+- Transformers: 4.57.3
+- Pytorch: 2.9.0
+- Datasets: 4.3.0
+- Tokenizers: 0.22.1
 ## Citations

adapter_config.json CHANGED Viewed

@@ -1,9 +1,16 @@
 {
   "alpha_pattern": {},
-  "auto_mapping": null,
   "base_model_name_or_path": "unsloth/mistral-7b-v0.3-bnb-4bit",
   "bias": "none",
   "corda_config": null,
   "eva_config": null,
   "exclude_modules": null,
   "fan_in_fan_out": false,
@@ -15,22 +22,23 @@
   "loftq_config": {},
   "lora_alpha": 16,
   "lora_bias": false,
-  "lora_dropout": 0,
   "megatron_config": null,
   "megatron_core": "megatron.core",
   "modules_to_save": null,
   "peft_type": "LORA",
   "qalora_group_size": 16,
   "r": 16,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "down_proj",
     "k_proj",
-    "o_proj",
     "q_proj",
-    "v_proj",
     "up_proj",
     "gate_proj"
   ],
   "target_parameters": null,

 {
+  "alora_invocation_tokens": null,
   "alpha_pattern": {},
+  "arrow_config": null,
+  "auto_mapping": {
+    "base_model_class": "MistralForCausalLM",
+    "parent_library": "transformers.models.mistral.modeling_mistral",
+    "unsloth_fixed": true
+  },
   "base_model_name_or_path": "unsloth/mistral-7b-v0.3-bnb-4bit",
   "bias": "none",
   "corda_config": null,
+  "ensure_weight_tying": false,
   "eva_config": null,
   "exclude_modules": null,
   "fan_in_fan_out": false,
   "loftq_config": {},
   "lora_alpha": 16,
   "lora_bias": false,
+  "lora_dropout": 0.0,
   "megatron_config": null,
   "megatron_core": "megatron.core",
   "modules_to_save": null,
   "peft_type": "LORA",
+  "peft_version": "0.18.0",
   "qalora_group_size": 16,
   "r": 16,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "v_proj",
     "down_proj",
     "k_proj",
     "q_proj",
     "up_proj",
+    "o_proj",
     "gate_proj"
   ],
   "target_parameters": null,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:234c57c0171045ee31f77b8494fa6eadf223c485501ff38ee6d067effa6a0a09
 size 167832240

 version https://git-lfs.github.com/spec/v1
+oid sha256:141a5935c1dd57689e8ae413b2597fbe9fd66ea2c2ae31f9514ea84ecc074a31
 size 167832240

tokenizer.json CHANGED Viewed

@@ -6964,6 +6964,12 @@
           "id": "A",
           "type_id": 0
         }
       }
     ],
     "pair": [
@@ -6979,6 +6985,12 @@
           "type_id": 0
         }
       },
       {
         "SpecialToken": {
           "id": "<s>",
@@ -6990,9 +7002,24 @@
           "id": "B",
           "type_id": 1
         }
       }
     ],
     "special_tokens": {
       "<s>": {
         "id": "<s>",
         "ids": [

           "id": "A",
           "type_id": 0
         }
+      },
+      {
+        "SpecialToken": {
+          "id": "</s>",
+          "type_id": 0
+        }
       }
     ],
     "pair": [
           "type_id": 0
         }
       },
+      {
+        "SpecialToken": {
+          "id": "</s>",
+          "type_id": 0
+        }
+      },
       {
         "SpecialToken": {
           "id": "<s>",
           "id": "B",
           "type_id": 1
         }
+      },
+      {
+        "SpecialToken": {
+          "id": "</s>",
+          "type_id": 1
+        }
       }
     ],
     "special_tokens": {
+      "</s>": {
+        "id": "</s>",
+        "ids": [
+          2
+        ],
+        "tokens": [
+          "</s>"
+        ]
+      },
       "<s>": {
         "id": "<s>",
         "ids": [

tokenizer_config.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "add_bos_token": true,
-  "add_eos_token": false,
   "add_prefix_space": true,
   "added_tokens_decoder": {
     "0": {

 {
   "add_bos_token": true,
+  "add_eos_token": true,
   "add_prefix_space": true,
   "added_tokens_decoder": {
     "0": {

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:91aa7e4b24a73bf63f76da8b8a36dc9a5ef4061cb2771c5a599bf78a8a1546f2
-size 6417

 version https://git-lfs.github.com/spec/v1
+oid sha256:74a34c14f6c99eb65f536192e3711f3533aca183ff32856608c59f7a6bc3188e
+size 6481