lfhe committed on
Commit
9fa6b02
·
1 Parent(s): 2d0b000
README.md CHANGED
@@ -1,5 +1,5 @@
1
  ---
2
- base_model: microsoft/Phi-3.5-mini-instruct
3
  library_name: peft
4
  ---
5
 
 
1
  ---
2
+ base_model: microsoft/Phi-4-mini-instruct
3
  library_name: peft
4
  ---
5
 
adapter_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
- "base_model_name_or_path": "microsoft/Phi-3.5-mini-instruct",
5
  "bias": "none",
6
  "corda_config": null,
7
  "eva_config": null,
@@ -13,24 +13,24 @@
13
  "layers_pattern": null,
14
  "layers_to_transform": null,
15
  "loftq_config": {},
16
- "lora_alpha": 32,
17
  "lora_bias": false,
18
- "lora_dropout": 0.15,
19
  "megatron_config": null,
20
  "megatron_core": "megatron.core",
21
  "modules_to_save": null,
22
  "peft_type": "LORA",
23
- "r": 32,
24
  "rank_pattern": {},
25
  "revision": null,
26
  "target_modules": [
27
  "down_proj",
28
  "qkv_proj",
29
- "o_proj",
30
- "gate_up_proj"
31
  ],
32
  "task_type": "CAUSAL_LM",
33
  "trainable_token_indices": null,
34
  "use_dora": false,
35
- "use_rslora": true
36
  }
 
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
+ "base_model_name_or_path": "microsoft/Phi-4-mini-instruct",
5
  "bias": "none",
6
  "corda_config": null,
7
  "eva_config": null,
 
13
  "layers_pattern": null,
14
  "layers_to_transform": null,
15
  "loftq_config": {},
16
+ "lora_alpha": 384,
17
  "lora_bias": false,
18
+ "lora_dropout": 0.4,
19
  "megatron_config": null,
20
  "megatron_core": "megatron.core",
21
  "modules_to_save": null,
22
  "peft_type": "LORA",
23
+ "r": 48,
24
  "rank_pattern": {},
25
  "revision": null,
26
  "target_modules": [
27
  "down_proj",
28
  "qkv_proj",
29
+ "gate_up_proj",
30
+ "o_proj"
31
  ],
32
  "task_type": "CAUSAL_LM",
33
  "trainable_token_indices": null,
34
  "use_dora": false,
35
+ "use_rslora": false
36
  }
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:636f75c19911bca5691af5654a25ca7d16e005162deb14ef7c1aec121f7816f2
3
- size 201361312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:beea79c29dd9c4f470145d9e605714f30b2ac582212fdfbe95be7c8bbd8fa3f7
3
+ size 276858864
added_tokens.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "<|assistant|>": 32001,
3
- "<|endoftext|>": 32000,
4
- "<|end|>": 32007,
5
- "<|placeholder1|>": 32002,
6
- "<|placeholder2|>": 32003,
7
- "<|placeholder3|>": 32004,
8
- "<|placeholder4|>": 32005,
9
- "<|placeholder5|>": 32008,
10
- "<|placeholder6|>": 32009,
11
- "<|system|>": 32006,
12
- "<|user|>": 32010
13
  }
 
1
  {
2
+ "<|/tool_call|>": 200026,
3
+ "<|/tool|>": 200024,
4
+ "<|assistant|>": 200019,
5
+ "<|end|>": 200020,
6
+ "<|im_end|>": 200029,
7
+ "<|system|>": 200022,
8
+ "<|tag|>": 200028,
9
+ "<|tool_call|>": 200025,
10
+ "<|tool_response|>": 200027,
11
+ "<|tool|>": 200023,
12
+ "<|user|>": 200021
13
  }
merges.txt CHANGED
The diff for this file is too large to render. See raw diff
 
special_tokens_map.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
  "bos_token": {
3
- "content": "<s>",
4
  "lstrip": false,
5
  "normalized": false,
6
  "rstrip": false,
7
  "single_word": false
8
  },
9
  "eos_token": {
10
- "content": "<|end|>",
11
  "lstrip": false,
12
  "normalized": false,
13
  "rstrip": false,
@@ -21,7 +21,7 @@
21
  "single_word": false
22
  },
23
  "unk_token": {
24
- "content": "<unk>",
25
  "lstrip": false,
26
  "normalized": false,
27
  "rstrip": false,
 
1
  {
2
  "bos_token": {
3
+ "content": "<|endoftext|>",
4
  "lstrip": false,
5
  "normalized": false,
6
  "rstrip": false,
7
  "single_word": false
8
  },
9
  "eos_token": {
10
+ "content": "<|im_end|>",
11
  "lstrip": false,
12
  "normalized": false,
13
  "rstrip": false,
 
21
  "single_word": false
22
  },
23
  "unk_token": {
24
+ "content": "<|endoftext|>",
25
  "lstrip": false,
26
  "normalized": false,
27
  "rstrip": false,
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2923f15e986925cfb5e017bc9acbe2e24add5218d2b44558e1283fe76bb6df04
3
- size 3620658
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8799b7ce62bf40e724f80af87b9545f9d9043778f435040a6c08e834dc047b69
3
+ size 15524282
tokenizer_config.json CHANGED
@@ -1,133 +1,122 @@
1
  {
2
  "add_bos_token": false,
3
  "add_eos_token": false,
4
- "add_prefix_space": null,
5
  "added_tokens_decoder": {
6
- "0": {
7
- "content": "<unk>",
8
  "lstrip": false,
9
  "normalized": false,
10
  "rstrip": false,
11
  "single_word": false,
12
  "special": true
13
  },
14
- "1": {
15
- "content": "<s>",
16
  "lstrip": false,
17
  "normalized": false,
18
  "rstrip": false,
19
  "single_word": false,
20
  "special": true
21
  },
22
- "2": {
23
- "content": "</s>",
24
  "lstrip": false,
25
  "normalized": false,
26
  "rstrip": true,
27
  "single_word": false,
28
- "special": false
29
- },
30
- "32000": {
31
- "content": "<|endoftext|>",
32
- "lstrip": false,
33
- "normalized": false,
34
- "rstrip": false,
35
- "single_word": false,
36
  "special": true
37
  },
38
- "32001": {
39
- "content": "<|assistant|>",
40
  "lstrip": false,
41
  "normalized": false,
42
  "rstrip": true,
43
  "single_word": false,
44
  "special": true
45
  },
46
- "32002": {
47
- "content": "<|placeholder1|>",
48
  "lstrip": false,
49
  "normalized": false,
50
  "rstrip": true,
51
  "single_word": false,
52
  "special": true
53
  },
54
- "32003": {
55
- "content": "<|placeholder2|>",
56
  "lstrip": false,
57
  "normalized": false,
58
  "rstrip": true,
59
  "single_word": false,
60
  "special": true
61
  },
62
- "32004": {
63
- "content": "<|placeholder3|>",
64
  "lstrip": false,
65
  "normalized": false,
66
  "rstrip": true,
67
  "single_word": false,
68
- "special": true
69
  },
70
- "32005": {
71
- "content": "<|placeholder4|>",
72
  "lstrip": false,
73
  "normalized": false,
74
  "rstrip": true,
75
  "single_word": false,
76
- "special": true
77
  },
78
- "32006": {
79
- "content": "<|system|>",
80
  "lstrip": false,
81
  "normalized": false,
82
  "rstrip": true,
83
  "single_word": false,
84
- "special": true
85
  },
86
- "32007": {
87
- "content": "<|end|>",
88
  "lstrip": false,
89
  "normalized": false,
90
- "rstrip": false,
91
  "single_word": false,
92
- "special": true
93
  },
94
- "32008": {
95
- "content": "<|placeholder5|>",
96
  "lstrip": false,
97
  "normalized": false,
98
  "rstrip": true,
99
  "single_word": false,
100
- "special": true
101
  },
102
- "32009": {
103
- "content": "<|placeholder6|>",
104
  "lstrip": false,
105
  "normalized": false,
106
  "rstrip": true,
107
  "single_word": false,
108
  "special": true
109
  },
110
- "32010": {
111
- "content": "<|user|>",
112
  "lstrip": false,
113
  "normalized": false,
114
- "rstrip": true,
115
  "single_word": false,
116
  "special": true
117
  }
118
  },
119
- "bos_token": "<s>",
120
- "chat_template": "{% for message in messages %}{% if message['role'] == 'system' and message['content'] %}{{'<|system|>\n' + message['content'] + '<|end|>\n'}}{% elif message['role'] == 'user' %}{{'<|user|>\n' + message['content'] + '<|end|>\n'}}{% elif message['role'] == 'assistant' %}{{'<|assistant|>\n' + message['content'] + '<|end|>\n'}}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|assistant|>\n' }}{% else %}{{ eos_token }}{% endif %}",
121
  "clean_up_tokenization_spaces": false,
122
- "eos_token": "<|end|>",
123
  "extra_special_tokens": {},
124
- "legacy": false,
125
  "model_max_length": 131072,
126
  "pad_token": "<|endoftext|>",
127
  "padding_side": "right",
128
- "sp_model_kwargs": {},
129
  "split_special_tokens": false,
130
- "tokenizer_class": "LlamaTokenizer",
131
- "unk_token": "<unk>",
132
- "use_default_system_prompt": false
133
  }
 
1
  {
2
  "add_bos_token": false,
3
  "add_eos_token": false,
4
+ "add_prefix_space": false,
5
  "added_tokens_decoder": {
6
+ "199999": {
7
+ "content": "<|endoftext|>",
8
  "lstrip": false,
9
  "normalized": false,
10
  "rstrip": false,
11
  "single_word": false,
12
  "special": true
13
  },
14
+ "200018": {
15
+ "content": "<|endofprompt|>",
16
  "lstrip": false,
17
  "normalized": false,
18
  "rstrip": false,
19
  "single_word": false,
20
  "special": true
21
  },
22
+ "200019": {
23
+ "content": "<|assistant|>",
24
  "lstrip": false,
25
  "normalized": false,
26
  "rstrip": true,
27
  "single_word": false,
 
 
 
 
 
 
 
 
28
  "special": true
29
  },
30
+ "200020": {
31
+ "content": "<|end|>",
32
  "lstrip": false,
33
  "normalized": false,
34
  "rstrip": true,
35
  "single_word": false,
36
  "special": true
37
  },
38
+ "200021": {
39
+ "content": "<|user|>",
40
  "lstrip": false,
41
  "normalized": false,
42
  "rstrip": true,
43
  "single_word": false,
44
  "special": true
45
  },
46
+ "200022": {
47
+ "content": "<|system|>",
48
  "lstrip": false,
49
  "normalized": false,
50
  "rstrip": true,
51
  "single_word": false,
52
  "special": true
53
  },
54
+ "200023": {
55
+ "content": "<|tool|>",
56
  "lstrip": false,
57
  "normalized": false,
58
  "rstrip": true,
59
  "single_word": false,
60
+ "special": false
61
  },
62
+ "200024": {
63
+ "content": "<|/tool|>",
64
  "lstrip": false,
65
  "normalized": false,
66
  "rstrip": true,
67
  "single_word": false,
68
+ "special": false
69
  },
70
+ "200025": {
71
+ "content": "<|tool_call|>",
72
  "lstrip": false,
73
  "normalized": false,
74
  "rstrip": true,
75
  "single_word": false,
76
+ "special": false
77
  },
78
+ "200026": {
79
+ "content": "<|/tool_call|>",
80
  "lstrip": false,
81
  "normalized": false,
82
+ "rstrip": true,
83
  "single_word": false,
84
+ "special": false
85
  },
86
+ "200027": {
87
+ "content": "<|tool_response|>",
88
  "lstrip": false,
89
  "normalized": false,
90
  "rstrip": true,
91
  "single_word": false,
92
+ "special": false
93
  },
94
+ "200028": {
95
+ "content": "<|tag|>",
96
  "lstrip": false,
97
  "normalized": false,
98
  "rstrip": true,
99
  "single_word": false,
100
  "special": true
101
  },
102
+ "200029": {
103
+ "content": "<|im_end|>",
104
  "lstrip": false,
105
  "normalized": false,
106
+ "rstrip": false,
107
  "single_word": false,
108
  "special": true
109
  }
110
  },
111
+ "bos_token": "<|endoftext|>",
112
+ "chat_template": "{% for message in messages %}{% if message['role'] == 'system' and 'tools' in message and message['tools'] is not none %}{{ '<|' + message['role'] + '|>' + message['content'] + '<|tool|>' + message['tools'] + '<|/tool|>' + '<|end|>' }}{% else %}{{ '<|' + message['role'] + '|>' + message['content'] + '<|end|>' }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|assistant|>' }}{% else %}{{ eos_token }}{% endif %}",
113
  "clean_up_tokenization_spaces": false,
114
+ "eos_token": "<|im_end|>",
115
  "extra_special_tokens": {},
 
116
  "model_max_length": 131072,
117
  "pad_token": "<|endoftext|>",
118
  "padding_side": "right",
 
119
  "split_special_tokens": false,
120
+ "tokenizer_class": "GPT2Tokenizer",
121
+ "unk_token": "<|endoftext|>"
 
122
  }
vocab.json CHANGED
The diff for this file is too large to render. See raw diff