AmirlyPhd/IeeeNfsuV4

Files changed (9) hide show

README.md CHANGED Viewed

@@ -4,7 +4,7 @@ tags:
 - trl
 - sft
 - generated_from_trainer
-base_model: NousResearch/Llama-2-7b-chat-hf
 model-index:
 - name: trained_weigths
   results: []
@@ -15,9 +15,9 @@ should probably proofread and complete it, then remove this comment. -->
 # trained_weigths
-This model is a fine-tuned version of [NousResearch/Llama-2-7b-chat-hf](https://huggingface.co/NousResearch/Llama-2-7b-chat-hf) on the None dataset.
 It achieves the following results on the evaluation set:
-- Loss: 1.0769
 ## Model description
@@ -52,13 +52,13 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
-| 1.016         | 0.14  | 30   | 1.0769          |
 ### Framework versions
 - PEFT 0.7.2.dev0
 - Transformers 4.36.2
-- Pytorch 2.1.2
 - Datasets 2.16.1
 - Tokenizers 0.15.2

 - trl
 - sft
 - generated_from_trainer
+base_model: NousResearch/Llama-2-7b-hf
 model-index:
 - name: trained_weigths
   results: []
 # trained_weigths
+This model is a fine-tuned version of [NousResearch/Llama-2-7b-hf](https://huggingface.co/NousResearch/Llama-2-7b-hf) on the None dataset.
 It achieves the following results on the evaluation set:
+- Loss: 1.0609
 ## Model description
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
+| 1.7687        | 0.03  | 30   | 1.0609          |
 ### Framework versions
 - PEFT 0.7.2.dev0
 - Transformers 4.36.2
+- Pytorch 2.1.2+cu121
 - Datasets 2.16.1
 - Tokenizers 0.15.2

adapter_config.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "alpha_pattern": {},
   "auto_mapping": null,
-  "base_model_name_or_path": "NousResearch/Llama-2-7b-chat-hf",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
@@ -10,21 +10,21 @@
   "layers_to_transform": null,
   "loftq_config": {},
   "lora_alpha": 16,
-  "lora_dropout": 0.05,
   "megatron_config": null,
   "megatron_core": "megatron.core",
   "modules_to_save": null,
   "peft_type": "LORA",
-  "r": 16,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "up_proj",
     "o_proj",
     "q_proj",
-    "v_proj",
-    "down_proj",
-    "k_proj",
     "gate_proj"
   ],
   "task_type": "CAUSAL_LM",

 {
   "alpha_pattern": {},
   "auto_mapping": null,
+  "base_model_name_or_path": "NousResearch/Llama-2-7b-hf",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
   "layers_to_transform": null,
   "loftq_config": {},
   "lora_alpha": 16,
+  "lora_dropout": 0.1,
   "megatron_config": null,
   "megatron_core": "megatron.core",
   "modules_to_save": null,
   "peft_type": "LORA",
+  "r": 64,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "k_proj",
+    "down_proj",
     "up_proj",
+    "v_proj",
     "o_proj",
     "q_proj",
     "gate_proj"
   ],
   "task_type": "CAUSAL_LM",

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:158d1050804eb9731fa191c77ce90a4bc847918191471c7948504250cb8cc20a
-size 1208643928

 version https://git-lfs.github.com/spec/v1
+oid sha256:77f4bb35eaa42501a6e59b55e0a44d44722004922ef35e18ae879f8786229320
+size 1688334680

added_tokens.json CHANGED Viewed

@@ -1,5 +1,4 @@
 {
-  "<pad>": 32000,
-  "<|im_end|>": 32001,
-  "<|im_start|>": 32002
 }

 {
+  "<|im_end|>": 32000,
+  "<|im_start|>": 32001
 }

runs/Apr07_00-37-46_7e75014457a5/events.out.tfevents.1712450278.7e75014457a5.225.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:fe667fee2ad0ec58972b12bf60c778874aba4c99cb85f5ae1838e91afd639a67
+size 7112

runs/Apr07_01-03-35_7e75014457a5/events.out.tfevents.1712451829.7e75014457a5.225.1 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:5b6d75626ab3e09ca3b982b9216ad6864c67d08ae0346d474ecc44a5f8fc6e49
+size 7726

tokenizer.json CHANGED Viewed

@@ -37,15 +37,6 @@
     },
     {
       "id": 32000,
-      "content": "<pad>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": false,
-      "normalized": true,
-      "special": false
-    },
-    {
-      "id": 32001,
       "content": "<|im_end|>",
       "single_word": false,
       "lstrip": false,
@@ -54,7 +45,7 @@
       "special": true
     },
     {
-      "id": 32002,
       "content": "<|im_start|>",
       "single_word": false,
       "lstrip": false,

     },
     {
       "id": 32000,
       "content": "<|im_end|>",
       "single_word": false,
       "lstrip": false,
       "special": true
     },
     {
+      "id": 32001,
       "content": "<|im_start|>",
       "single_word": false,
       "lstrip": false,

tokenizer_config.json CHANGED Viewed

@@ -27,14 +27,6 @@
       "special": true
     },
     "32000": {
-      "content": "<pad>",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "32001": {
       "content": "<|im_end|>",
       "lstrip": false,
       "normalized": false,
@@ -42,7 +34,7 @@
       "single_word": false,
       "special": true
     },
-    "32002": {
       "content": "<|im_start|>",
       "lstrip": false,
       "normalized": false,

       "special": true
     },
     "32000": {
       "content": "<|im_end|>",
       "lstrip": false,
       "normalized": false,
       "single_word": false,
       "special": true
     },
+    "32001": {
       "content": "<|im_start|>",
       "lstrip": false,
       "normalized": false,

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1f0ea969c0eb983369b23a6a92f57fc0c08f143822ddd216feabaa5270d5d2cc
 size 4664

 version https://git-lfs.github.com/spec/v1
+oid sha256:bdc9d240b008498f5df064c69c1dc7f025073ab6e2dff33c62a2622c18d8e448
 size 4664