Training in progress, epoch 1

Files changed (6) hide show

README.md ADDED Viewed

+---
+library_name: peft
+---
+## Training procedure
+The following `bitsandbytes` quantization config was used during training:
+- quant_method: bitsandbytes
+- load_in_8bit: True
+- load_in_4bit: False
+- llm_int8_threshold: 6.0
+- llm_int8_skip_modules: None
+- llm_int8_enable_fp32_cpu_offload: False
+- llm_int8_has_fp16_weight: False
+- bnb_4bit_quant_type: fp4
+- bnb_4bit_use_double_quant: False
+- bnb_4bit_compute_dtype: float32
+### Framework versions
+- PEFT 0.6.0.dev0

adapter_config.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "alpha_pattern": {},
   "auto_mapping": null,
-  "base_model_name_or_path": "codellama/CodeLlama-7b-hf",
   "bias": "none",
   "fan_in_fan_out": null,
   "inference_mode": true,
@@ -16,13 +16,13 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "down_proj",
-    "v_proj",
     "gate_proj",
-    "q_proj",
-    "k_proj",
     "o_proj",
-    "up_proj"
   ],
   "task_type": "CAUSAL_LM"
 }

 {
   "alpha_pattern": {},
   "auto_mapping": null,
+  "base_model_name_or_path": "codellama/CodeLlama-7b-Instruct-hf",
   "bias": "none",
   "fan_in_fan_out": null,
   "inference_mode": true,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "gate_proj",
+    "v_proj",
+    "down_proj",
+    "up_proj",
     "o_proj",
+    "q_proj",
+    "k_proj"
   ],
   "task_type": "CAUSAL_LM"
 }

adapter_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:252e5bb28e7b71f5caba598d8296e60ba463497fb5ca5f5625ebd1a32123168b
 size 319977229

 version https://git-lfs.github.com/spec/v1
+oid sha256:c980182b1e1588556688b6a652a130642d20cf6bc0718d63b9b9ac36370b7a0b
 size 319977229

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "codellama/CodeLlama-7b-hf",
   "architectures": [
     "LlamaForCausalLM"
   ],

 {
+  "_name_or_path": "codellama/CodeLlama-7b-Instruct-hf",
   "architectures": [
     "LlamaForCausalLM"
   ],

tokenizer_config.json CHANGED Viewed

@@ -79,7 +79,7 @@
   "suffix_first": false,
   "suffix_token": "▁<SUF>",
   "tokenizer_class": "CodeLlamaTokenizer",
-  "tokenizer_file": "/root/.cache/huggingface/hub/models--codellama--CodeLlama-7b-hf/snapshots/3773f63b4511b9e47a9a7ffc765eed7eb0169486/tokenizer.json",
   "trust_remote_code": false,
   "unk_token": "<unk>",
   "use_default_system_prompt": false,

   "suffix_first": false,
   "suffix_token": "▁<SUF>",
   "tokenizer_class": "CodeLlamaTokenizer",
+  "tokenizer_file": "/root/.cache/huggingface/hub/models--codellama--CodeLlama-7b-Instruct-hf/snapshots/6114dd1e16f69e0765ccbd7a64d33d04b265fbd2/tokenizer.json",
   "trust_remote_code": false,
   "unk_token": "<unk>",
   "use_default_system_prompt": false,

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e829299a78f4b1dd4d8794df3b53ccce91314f8df1687084a34163608cc66743
 size 4475

 version https://git-lfs.github.com/spec/v1
+oid sha256:01a2680f6024f84d722c28decac8dad6e0feddc6f82978a329380e710c8027a4
 size 4475