lfhe committed on
Commit
c8f8957
·
1 Parent(s): 91734b0
adapter_config.json CHANGED
@@ -10,20 +10,20 @@
10
  "layers_pattern": null,
11
  "layers_to_transform": null,
12
  "loftq_config": {},
13
- "lora_alpha": 512,
14
- "lora_dropout": 0.0,
15
  "megatron_config": null,
16
  "megatron_core": "megatron.core",
17
  "modules_to_save": null,
18
  "peft_type": "LORA",
19
- "r": 256,
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "gate_up_proj",
24
  "down_proj",
 
25
  "qkv_proj",
26
- "o_proj"
27
  ],
28
  "task_type": "CAUSAL_LM",
29
  "use_dora": false,
 
10
  "layers_pattern": null,
11
  "layers_to_transform": null,
12
  "loftq_config": {},
13
+ "lora_alpha": 256,
14
+ "lora_dropout": 0.05,
15
  "megatron_config": null,
16
  "megatron_core": "megatron.core",
17
  "modules_to_save": null,
18
  "peft_type": "LORA",
19
+ "r": 128,
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
23
  "down_proj",
24
+ "o_proj",
25
  "qkv_proj",
26
+ "gate_up_proj"
27
  ],
28
  "task_type": "CAUSAL_LM",
29
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:928fea1571b72bf6236ffdbafa3a3004f76aee7ef9bafb120d58121376de256f
3
- size 1610648152
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:195dccfab7540a08a3ab4352ea19ded7e9c12099773406f6441dd229ac509e82
3
+ size 805341552
special_tokens_map.json CHANGED
@@ -1,4 +1,13 @@
1
  {
 
 
 
 
 
 
 
 
 
2
  "bos_token": {
3
  "content": "<s>",
4
  "lstrip": false,
@@ -7,7 +16,7 @@
7
  "single_word": false
8
  },
9
  "eos_token": {
10
- "content": "<|end|>",
11
  "lstrip": false,
12
  "normalized": false,
13
  "rstrip": false,
 
1
  {
2
+ "additional_special_tokens": [
3
+ {
4
+ "content": "<|end|>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false
9
+ }
10
+ ],
11
  "bos_token": {
12
  "content": "<s>",
13
  "lstrip": false,
 
16
  "single_word": false
17
  },
18
  "eos_token": {
19
+ "content": "<|endoftext|>",
20
  "lstrip": false,
21
  "normalized": false,
22
  "rstrip": false,
tokenizer_config.json CHANGED
@@ -116,12 +116,15 @@
116
  "special": true
117
  }
118
  },
 
 
 
119
  "bos_token": "<s>",
120
- "chat_template": "{{ '<s>' }}{% if messages[0]['role'] == 'system' %}{% set loop_messages = messages[1:] %}{% set system_message = messages[0]['content'] %}{% else %}{% set loop_messages = messages %}{% endif %}{% if system_message is defined %}{{ '<|system|>\n' + system_message + '<|end|>\n' }}{% endif %}{% for message in loop_messages %}{% set content = message['content'] %}{% if message['role'] == 'user' %}{{ '<|user|>\n' + content + '<|end|>\n<|assistant|>\n' }}{% elif message['role'] == 'assistant' %}{{ content + '<|end|>' + '\n' }}{% endif %}{% endfor %}",
121
  "clean_up_tokenization_spaces": false,
122
- "eos_token": "<|end|>",
123
  "legacy": false,
124
- "model_max_length": 131072,
125
  "pad_token": "<|endoftext|>",
126
  "padding_side": "right",
127
  "sp_model_kwargs": {},
 
116
  "special": true
117
  }
118
  },
119
+ "additional_special_tokens": [
120
+ "<|end|>"
121
+ ],
122
  "bos_token": "<s>",
123
+ "chat_template": "{% for message in messages %}{% if message['role'] == 'system' and message['content'] %}{{'<|system|>\n' + message['content'] + '<|end|>\n'}}{% elif message['role'] == 'user' %}{{'<|user|>\n' + message['content'] + '<|end|>\n'}}{% elif message['role'] == 'assistant' %}{{'<|assistant|>\n' + message['content'] + '<|end|>\n'}}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|assistant|>\n' }}{% else %}{{ eos_token }}{% endif %}",
124
  "clean_up_tokenization_spaces": false,
125
+ "eos_token": "<|endoftext|>",
126
  "legacy": false,
127
+ "model_max_length": 8192,
128
  "pad_token": "<|endoftext|>",
129
  "padding_side": "right",
130
  "sp_model_kwargs": {},
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6bf14235d53289dcacb8f4d67daf43098957e7e4f82aa8da4ac76c5b5ee0a7af
3
- size 5432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:108eb9d266db37ee1271e0668059f27379c3b7630df4718e340c8ea80d6d6100
3
+ size 5560