lfhe committed · Commit a60b761 · 1 Parent(s): 22c25ff
README.md CHANGED
@@ -1,5 +1,5 @@
 ---
-base_model: microsoft/Phi-3.5-mini-instruct
+base_model: microsoft/Phi-3-mini-4k-instruct
 library_name: peft
 ---
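The only README change is the `base_model` metadata, which now points at microsoft/Phi-3-mini-4k-instruct. A minimal sketch of attaching the adapter to that base with `peft` (the adapter repo id below is a hypothetical placeholder, not taken from this commit):

```python
# Minimal sketch: load the new base model, then attach the LoRA adapter.
# "your-username/your-adapter" is a placeholder repo id.
from transformers import AutoModelForCausalLM, AutoTokenizer
from peft import PeftModel

base = AutoModelForCausalLM.from_pretrained("microsoft/Phi-3-mini-4k-instruct")
tokenizer = AutoTokenizer.from_pretrained("your-username/your-adapter")
model = PeftModel.from_pretrained(base, "your-username/your-adapter")
```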
 
adapter_config.json CHANGED
@@ -1,7 +1,7 @@
 {
   "alpha_pattern": {},
   "auto_mapping": null,
-  "base_model_name_or_path": "microsoft/Phi-3.5-mini-instruct",
+  "base_model_name_or_path": "microsoft/Phi-3-mini-4k-instruct",
   "bias": "none",
   "corda_config": null,
   "eva_config": null,
@@ -13,21 +13,21 @@
   "layers_pattern": null,
   "layers_to_transform": null,
   "loftq_config": {},
-  "lora_alpha": 256,
+  "lora_alpha": 16,
   "lora_bias": false,
-  "lora_dropout": 0.0,
+  "lora_dropout": 0.4,
   "megatron_config": null,
   "megatron_core": "megatron.core",
   "modules_to_save": null,
   "peft_type": "LORA",
-  "r": 64,
+  "r": 16,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "qkv_proj",
     "o_proj",
     "gate_up_proj",
-    "down_proj"
+    "down_proj",
+    "qkv_proj"
   ],
   "task_type": "CAUSAL_LM",
   "trainable_token_indices": null,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e722590b3ae330b2443474e9e3a580530188d149187a877eff07104d09c5b723
-size 402688040
+oid sha256:171b92d0a583e4d59bae3c9f38220b268cc96cca8e2a0b780ff43e9c3ad11da7
+size 100697728
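The new LFS pointer records a weight file roughly 4× smaller (100,697,728 vs. 402,688,040 bytes), consistent with the config change above: LoRA parameter count scales linearly with `r`, which dropped from 64 to 16.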
tokenizer_config.json CHANGED
@@ -117,12 +117,12 @@
     }
   },
   "bos_token": "<s>",
-  "chat_template": "{% for message in messages %}{% if message['role'] == 'system' and message['content'] %}{{'<|system|>\n' + message['content'] + '<|end|>\n'}}{% elif message['role'] == 'user' %}{{'<|user|>\n' + message['content'] + '<|end|>\n'}}{% elif message['role'] == 'assistant' %}{{'<|assistant|>\n' + message['content'] + '<|end|>\n'}}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|assistant|>\n' }}{% else %}{{ eos_token }}{% endif %}",
+  "chat_template": "{% for message in messages %}{% if message['role'] == 'system' %}{{'<|system|>\n' + message['content'] + '<|end|>\n'}}{% elif message['role'] == 'user' %}{{'<|user|>\n' + message['content'] + '<|end|>\n'}}{% elif message['role'] == 'assistant' %}{{'<|assistant|>\n' + message['content'] + '<|end|>\n'}}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|assistant|>\n' }}{% else %}{{ eos_token }}{% endif %}",
   "clean_up_tokenization_spaces": false,
   "eos_token": "<|end|>",
   "extra_special_tokens": {},
   "legacy": false,
-  "model_max_length": 131072,
+  "model_max_length": 8192,
   "pad_token": "<|endoftext|>",
   "padding_side": "right",
   "sp_model_kwargs": {},