danielhanchen committed on
Commit
9b9ccab
·
verified ·
1 Parent(s): 8c1eec7

Add files using upload-large-folder tool

Browse files
config.json CHANGED
@@ -15,7 +15,7 @@
15
  "num_attention_heads": 48,
16
  "num_hidden_layers": 61,
17
  "num_key_value_heads": 2,
18
- "pad_token_id": 151343,
19
  "partial_rotary_factor": 0.5,
20
  "rms_norm_eps": 1e-05,
21
  "rope_theta": 10000.0,
 
15
  "num_attention_heads": 48,
16
  "num_hidden_layers": 61,
17
  "num_key_value_heads": 2,
18
+ "pad_token_id": 151330,
19
  "partial_rotary_factor": 0.5,
20
  "rms_norm_eps": 1e-05,
21
  "rope_theta": 10000.0,
generation_config.json CHANGED
@@ -6,6 +6,6 @@
6
  151338
7
  ],
8
  "max_length": 32768,
9
- "pad_token_id": 151343,
10
  "transformers_version": "4.51.3"
11
  }
 
6
  151338
7
  ],
8
  "max_length": 32768,
9
+ "pad_token_id": 151330,
10
  "transformers_version": "4.51.3"
11
  }
special_tokens_map.json CHANGED
@@ -22,5 +22,11 @@
22
  "rstrip": false,
23
  "single_word": false
24
  },
25
- "pad_token": "<|PAD▁TOKEN|>"
 
 
 
 
 
 
26
  }
 
22
  "rstrip": false,
23
  "single_word": false
24
  },
25
+ "pad_token": {
26
+ "content": "[MASK]",
27
+ "lstrip": false,
28
+ "normalized": false,
29
+ "rstrip": false,
30
+ "single_word": false
31
+ }
32
  }
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b872a5bd5d75fa47dc7b28a1e152471b57704753f99f91fb294a48390809e040
3
- size 19966692
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76ebeac0d8bd7879ead7b43c16b44981f277e47225de2bd7de9ae1a6cc664a8c
3
+ size 19966496
tokenizer_config.json CHANGED
@@ -111,14 +111,6 @@
111
  "rstrip": false,
112
  "single_word": false,
113
  "special": true
114
- },
115
- "151343": {
116
- "content": "<|PAD▁TOKEN|>",
117
- "lstrip": false,
118
- "normalized": false,
119
- "rstrip": false,
120
- "single_word": false,
121
- "special": true
122
  }
123
  },
124
  "additional_special_tokens": [
@@ -148,7 +140,7 @@
148
  "attention_mask"
149
  ],
150
  "model_max_length": 32768,
151
- "pad_token": "<|PAD▁TOKEN|>",
152
  "padding_side": "left",
153
  "remove_space": false,
154
  "tokenizer_class": "PreTrainedTokenizer",
 
111
  "rstrip": false,
112
  "single_word": false,
113
  "special": true
 
 
 
 
 
 
 
 
114
  }
115
  },
116
  "additional_special_tokens": [
 
140
  "attention_mask"
141
  ],
142
  "model_max_length": 32768,
143
+ "pad_token": "[MASK]",
144
  "padding_side": "left",
145
  "remove_space": false,
146
  "tokenizer_class": "PreTrainedTokenizer",