hootan09 vladislavbro commited on
Commit
07ec72d
·
verified ·
0 Parent(s):

Duplicate from onnx-community/chatterbox-ONNX

Browse files

Co-authored-by: Vladislav Bronzov <vladislavbro@users.noreply.huggingface.co>

.gitattributes ADDED
@@ -0,0 +1,45 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tar filter=lfs diff=lfs merge=lfs -text
29
+ *.tflite filter=lfs diff=lfs merge=lfs -text
30
+ *.tgz filter=lfs diff=lfs merge=lfs -text
31
+ *.wasm filter=lfs diff=lfs merge=lfs -text
32
+ *.xz filter=lfs diff=lfs merge=lfs -text
33
+ *.zip filter=lfs diff=lfs merge=lfs -text
34
+ *.zst filter=lfs diff=lfs merge=lfs -text
35
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ llama3.onnx.data filter=lfs diff=lfs merge=lfs -text
37
+ llama3.data filter=lfs diff=lfs merge=lfs -text
38
+ onnx/language_model.onnx_data filter=lfs diff=lfs merge=lfs -text
39
+ default_voice.wav filter=lfs diff=lfs merge=lfs -text
40
+ onnx/conditional_decoder.onnx_data filter=lfs diff=lfs merge=lfs -text
41
+ onnx/embed_tokens.onnx_data filter=lfs diff=lfs merge=lfs -text
42
+ onnx/speech_encoder.onnx_data filter=lfs diff=lfs merge=lfs -text
43
+ onnx/language_model_fp16.onnx_data filter=lfs diff=lfs merge=lfs -text
44
+ onnx/language_model_q4.onnx_data filter=lfs diff=lfs merge=lfs -text
45
+ onnx/language_model_q4f16.onnx_data filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,248 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: mit
3
+ language:
4
+ - en
5
+ pipeline_tag: text-to-speech
6
+ tags:
7
+ - text-to-speech
8
+ - speech
9
+ - speech-generation
10
+ - voice-cloning
11
+ library_name: Chatterbox
12
+ base_model:
13
+ - ResembleAI/chatterbox
14
+ ---
15
+
16
+ <img width="800" alt="cb-big2" src="https://github.com/user-attachments/assets/bd8c5f03-e91d-4ee5-b680-57355da204d1" />
17
+
18
+ <h1 style="font-size: 32px">Chatterbox TTS</h1>
19
+
20
+ <div style="display: flex; align-items: center; gap: 12px">
21
+ <a href="https://resemble-ai.github.io/chatterbox_demopage/">
22
+ <img src="https://img.shields.io/badge/listen-demo_samples-blue" alt="Listen to Demo Samples" />
23
+ </a>
24
+ <a href="https://huggingface.co/spaces/ResembleAI/Chatterbox">
25
+ <img src="https://huggingface.co/datasets/huggingface/badges/resolve/main/open-in-hf-spaces-sm.svg" alt="Open in HF Spaces" />
26
+ </a>
27
+ <a href="https://podonos.com/resembleai/chatterbox">
28
+ <img src="https://static-public.podonos.com/badges/insight-on-pdns-sm-dark.svg" alt="Insight on Podonos" />
29
+ </a>
30
+ </div>
31
+
32
+ <div style="display: flex; align-items: center; gap: 8px;">
33
+ <img width="100" alt="resemble-logo-horizontal" src="https://github.com/user-attachments/assets/35cf756b-3506-4943-9c72-c05ddfa4e525" />
34
+ </div>
35
+
36
+ **Chatterbox** is [Resemble AI's](https://resemble.ai) production-grade open source TTS model. Chatterbox supports **English** out of the box. Licensed under MIT, Chatterbox has been benchmarked against leading closed-source systems like ElevenLabs, and is consistently preferred in side-by-side evaluations.
37
+
38
+ Whether you're working on memes, videos, games, or AI agents, Chatterbox brings your content to life. It's also the first open source TTS model to support **emotion exaggeration control**, a powerful feature that makes your voices stand out.
39
+
40
+ Chatterbox is provided in an exported ONNX format, enabling fast and portable inference with ONNX Runtime across platforms.
41
+
42
+ # Key Details
43
+ - SoTA zero-shot English TTS
44
+ - 0.5B Llama backbone
45
+ - Unique exaggeration/intensity control
46
+ - Ultra-stable with alignment-informed inference
47
+ - Trained on 0.5M hours of cleaned data
48
+ - Watermarked outputs (optional)
49
+ - Easy voice conversion script using onnxruntime
50
+ - [Outperforms ElevenLabs](https://podonos.com/resembleai/chatterbox)
51
+
52
+ # Tips
53
+ - **General Use (TTS and Voice Agents):**
54
+ - The default settings (`exaggeration=0.5`, `cfg=0.5`) work well for most prompts.
55
+
56
+ - **Expressive or Dramatic Speech:**
57
+ - Try increasing `exaggeration` to around `0.7` or higher.
58
+ - Higher `exaggeration` tends to speed up speech.
59
+
60
+
61
+ # Usage
62
+ [Link to GitHub ONNX Export and Inference script](https://github.com/VladOS95-cyber/onnx_conversion_scripts/tree/main/chatterbox)
63
+
64
+ ```python
65
+ # !pip install --upgrade onnxruntime==1.22.1 huggingface_hub==0.34.4 transformers==4.46.3 numpy==2.2.6 tqdm==4.67.1 librosa==0.11.0 soundfile==0.13.1 resemble-perth==1.0.1
66
+
67
+ import onnxruntime
68
+
69
+ from huggingface_hub import hf_hub_download
70
+ from transformers import AutoTokenizer
71
+
72
+ import numpy as np
73
+ from tqdm import tqdm
74
+ import librosa
75
+ import soundfile as sf
76
+
77
+ S3GEN_SR = 24000
78
+ START_SPEECH_TOKEN = 6561
79
+ STOP_SPEECH_TOKEN = 6562
80
+
81
+
82
+ class RepetitionPenaltyLogitsProcessor:
83
+ def __init__(self, penalty: float):
84
+ if not isinstance(penalty, float) or not (penalty > 0):
85
+ raise ValueError(f"`penalty` must be a strictly positive float, but is {penalty}")
86
+ self.penalty = penalty
87
+
88
+ def __call__(self, input_ids: np.ndarray, scores: np.ndarray) -> np.ndarray:
89
+ score = np.take_along_axis(scores, input_ids, axis=1)
90
+ score = np.where(score < 0, score * self.penalty, score / self.penalty)
91
+ scores_processed = scores.copy()
92
+ np.put_along_axis(scores_processed, input_ids, score, axis=1)
93
+ return scores_processed
94
+
95
+
96
+ def run_inference(
97
+ text="The Lord of the Rings is the greatest work of literature.",
98
+ target_voice_path=None,
99
+ max_new_tokens = 256,
100
+ exaggeration=0.5,
101
+ output_dir="converted",
102
+ output_file_name="output.wav",
103
+ apply_watermark=True,
104
+ ):
105
+
106
+ model_id = "onnx-community/chatterbox-onnx"
107
+ if not target_voice_path:
108
+ target_voice_path = hf_hub_download(repo_id=model_id, filename="default_voice.wav", local_dir=output_dir)
109
+
110
+ ## Load model
111
+ speech_encoder_path = hf_hub_download(repo_id=model_id, filename="speech_encoder.onnx", local_dir=output_dir, subfolder='onnx')
112
+ hf_hub_download(repo_id=model_id, filename="speech_encoder.onnx_data", local_dir=output_dir, subfolder='onnx')
113
+ embed_tokens_path = hf_hub_download(repo_id=model_id, filename="embed_tokens.onnx", local_dir=output_dir, subfolder='onnx')
114
+ hf_hub_download(repo_id=model_id, filename="embed_tokens.onnx_data", local_dir=output_dir, subfolder='onnx')
115
+ conditional_decoder_path = hf_hub_download(repo_id=model_id, filename="conditional_decoder.onnx", local_dir=output_dir, subfolder='onnx')
116
+ hf_hub_download(repo_id=model_id, filename="conditional_decoder.onnx_data", local_dir=output_dir, subfolder='onnx')
117
+ language_model_path = hf_hub_download(repo_id=model_id, filename="language_model.onnx", local_dir=output_dir, subfolder='onnx')
118
+ hf_hub_download(repo_id=model_id, filename="language_model.onnx_data", local_dir=output_dir, subfolder='onnx')
119
+
120
+ ## Start inference sessions
121
+ speech_encoder_session = onnxruntime.InferenceSession(speech_encoder_path)
122
+ embed_tokens_session = onnxruntime.InferenceSession(embed_tokens_path)
123
+ llama_with_past_session = onnxruntime.InferenceSession(language_model_path)
124
+ cond_decoder_session = onnxruntime.InferenceSession(conditional_decoder_path)
125
+
126
+ def execute_text_to_audio_inference(text):
127
+ print("Start inference script...")
128
+
129
+ audio_values, _ = librosa.load(target_voice_path, sr=S3GEN_SR)
130
+ audio_values = audio_values[np.newaxis, :].astype(np.float32)
131
+
132
+ ## Prepare input
133
+ tokenizer = AutoTokenizer.from_pretrained(model_id)
134
+ input_ids = tokenizer(text, return_tensors="np")["input_ids"].astype(np.int64)
135
+
136
+ position_ids = np.where(
137
+ input_ids >= START_SPEECH_TOKEN,
138
+ 0,
139
+ np.arange(input_ids.shape[1])[np.newaxis, :] - 1
140
+ )
141
+
142
+ ort_embed_tokens_inputs = {
143
+ "input_ids": input_ids,
144
+ "position_ids": position_ids,
145
+ "exaggeration": np.array([exaggeration], dtype=np.float32)
146
+ }
147
+
148
+ ## Instantiate the logits processors.
149
+ repetition_penalty = 1.2
150
+ repetition_penalty_processor = RepetitionPenaltyLogitsProcessor(penalty=repetition_penalty)
151
+
152
+ num_hidden_layers = 30
153
+ num_key_value_heads = 16
154
+ head_dim = 64
155
+
156
+ generate_tokens = np.array([[START_SPEECH_TOKEN]], dtype=np.long)
157
+
158
+ # ---- Generation Loop using kv_cache ----
159
+ for i in tqdm(range(max_new_tokens), desc="Sampling", dynamic_ncols=True):
160
+
161
+ inputs_embeds = embed_tokens_session.run(None, ort_embed_tokens_inputs)[0]
162
+ if i == 0:
163
+ ort_speech_encoder_input = {
164
+ "audio_values": audio_values,
165
+ }
166
+ cond_emb, prompt_token, ref_x_vector, prompt_feat = speech_encoder_session.run(None, ort_speech_encoder_input)
167
+ inputs_embeds = np.concatenate((cond_emb, inputs_embeds), axis=1)
168
+
169
+ ## Prepare llm inputs
170
+ batch_size, seq_len, _ = inputs_embeds.shape
171
+ past_key_values = {
172
+ f"past_key_values.{layer}.{kv}": np.zeros([batch_size, num_key_value_heads, 0, head_dim], dtype=np.float32)
173
+ for layer in range(num_hidden_layers)
174
+ for kv in ("key", "value")
175
+ }
176
+ attention_mask = np.ones((batch_size, seq_len), dtype=np.int64)
177
+
178
+ logits, *present_key_values = llama_with_past_session.run(None, dict(
179
+ inputs_embeds=inputs_embeds,
180
+ attention_mask=attention_mask,
181
+ **past_key_values,
182
+ ))
183
+
184
+ logits = logits[:, -1, :]
185
+ next_token_logits = repetition_penalty_processor(generate_tokens, logits)
186
+
187
+ next_token = np.argmax(next_token_logits, axis=-1, keepdims=True).astype(np.int64)
188
+ generate_tokens = np.concatenate((generate_tokens, next_token), axis=-1)
189
+ if (next_token.flatten() == STOP_SPEECH_TOKEN).all():
190
+ break
191
+
192
+ # Get embedding for the new token.
193
+ position_ids = np.full(
194
+ (input_ids.shape[0], 1),
195
+ i + 1,
196
+ dtype=np.int64,
197
+ )
198
+ ort_embed_tokens_inputs["input_ids"] = next_token
199
+ ort_embed_tokens_inputs["position_ids"] = position_ids
200
+
201
+ ## Update values for next generation loop
202
+ attention_mask = np.concatenate([attention_mask, np.ones((batch_size, 1), dtype=np.int64)], axis=1)
203
+ for j, key in enumerate(past_key_values):
204
+ past_key_values[key] = present_key_values[j]
205
+
206
+ speech_tokens = generate_tokens[:, 1:-1]
207
+ speech_tokens = np.concatenate([prompt_token, speech_tokens], axis=1)
208
+ return speech_tokens, ref_x_vector, prompt_feat
209
+
210
+ speech_tokens, speaker_embeddings, speaker_features = execute_text_to_audio_inference(text)
211
+ cond_incoder_input = {
212
+ "speech_tokens": speech_tokens,
213
+ "speaker_embeddings": speaker_embeddings,
214
+ "speaker_features": speaker_features,
215
+ }
216
+ wav = cond_decoder_session.run(None, cond_incoder_input)[0]
217
+ wav = np.squeeze(wav, axis=0)
218
+
219
+ # Optional: Apply watermark
220
+ if apply_watermark:
221
+ import perth
222
+ watermarker = perth.PerthImplicitWatermarker()
223
+ wav = watermarker.apply_watermark(wav, sample_rate=S3GEN_SR)
224
+
225
+ sf.write(output_file_name, wav, S3GEN_SR)
226
+ print(f"{output_file_name} was successfully saved")
227
+
228
+ if __name__ == "__main__":
229
+ run_inference(
230
+ text="Ezreal and Jinx teamed up with Ahri, Yasuo, and Teemo to take down the enemy's Nexus in an epic late-game pentakill.",
231
+ exaggeration=0.5,
232
+ output_file_name="output.wav",
233
+ apply_watermark=False,
234
+ )
235
+ ```
236
+
237
+
238
+ # Acknowledgements
239
+ - [Xenova](https://huggingface.co/Xenova)
240
+ - [Vladislav Bronzov](https://github.com/VladOS95-cyber)
241
+ - [Resemble AI](https://github.com/resemble-ai/chatterbox)
242
+
243
+ # Built-in PerTh Watermarking for Responsible AI
244
+
245
+ Every audio file generated by Chatterbox includes [Resemble AI's Perth (Perceptual Threshold) Watermarker](https://github.com/resemble-ai/perth) - imperceptible neural watermarks that survive MP3 compression, audio editing, and common manipulations while maintaining nearly 100% detection accuracy.
246
+
247
+ # Disclaimer
248
+ Don't use this model to do bad things. Prompts are sourced from freely available data on the internet.
config.json ADDED
@@ -0,0 +1,45 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "chatterbox",
3
+ "text_config": {
4
+ "architectures": [
5
+ "LlamaForCausalLM"
6
+ ],
7
+ "attention_bias": false,
8
+ "attention_dropout": 0.0,
9
+ "bos_token_id": 1,
10
+ "eos_token_id": 2,
11
+ "head_dim": 64,
12
+ "hidden_act": "silu",
13
+ "hidden_size": 1024,
14
+ "initializer_range": 0.02,
15
+ "intermediate_size": 4096,
16
+ "max_position_embeddings": 131072,
17
+ "mlp_bias": false,
18
+ "model_type": "llama",
19
+ "num_attention_heads": 16,
20
+ "num_hidden_layers": 30,
21
+ "num_key_value_heads": 16,
22
+ "pretraining_tp": 1,
23
+ "rms_norm_eps": 1e-05,
24
+ "rope_scaling": {
25
+ "factor": 8.0,
26
+ "high_freq_factor": 4.0,
27
+ "low_freq_factor": 1.0,
28
+ "original_max_position_embeddings": 8192,
29
+ "rope_type": "llama3"
30
+ },
31
+ "rope_theta": 500000.0,
32
+ "tie_word_embeddings": false,
33
+ "torch_dtype": "float32",
34
+ "transformers_version": "4.46.3",
35
+ "use_cache": true,
36
+ "vocab_size": 8194
37
+ },
38
+ "transformers.js_config": {
39
+ "use_external_data_format": true,
40
+ "kv_cache_dtype": {
41
+ "fp16": "float16",
42
+ "q4f16": "float16"
43
+ }
44
+ }
45
+ }
default_voice.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ebc531cdaba358a327099c1c4f0448026719957bcf4d8e9868767f227e02f4e
3
+ size 714320
generation_config.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token_id": 1,
3
+ "eos_token_id": [
4
+ 2,
5
+ 6562
6
+ ],
7
+ "repetition_penalty": 1.2
8
+ }
onnx/conditional_decoder.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1656d0d31332bae1854839959a3139300ebb67c178651dfa3f8c5fbfa5351351
3
+ size 6350448
onnx/conditional_decoder.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51d58345a272747665ec9d5bb61e01835258a940e321a288582ac4c18cf01b5a
3
+ size 533970816
onnx/embed_tokens.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:160722ec14789f616abdb1e31916cbbf9223c03fde0ab546d64ca74fb72e430b
3
+ size 13286
onnx/embed_tokens.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:898c563c3a5ca1b9ea10ce89b0cdcf252b0bb5ab460dfc4eadea003b56e5d2ee
3
+ size 61640704
onnx/language_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:861a34585605e8ad671051788afc495dcbeaee833a41523a1b33aded9c3babc7
3
+ size 171387
onnx/language_model.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efe9a1173c40d50bc651cb96ebff9f23d6f20d5b3a11b0685510e3a3facdbcf1
3
+ size 2080632832
onnx/language_model_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c36a5bbbc2a4ed8c345033896612cd320fd0971a0f5e6447ab4cdd2d7f22e36
3
+ size 172657
onnx/language_model_fp16.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d1b751ce1af740bbfa6cde9dc7d359afedba4b6de5a875b6fd199131216f16d
3
+ size 1040316416
onnx/language_model_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f8cdca83b2493536cbf3acf421199808a3d68736f55f4eabd20ef8a99da4313
3
+ size 227911
onnx/language_model_q4.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5203d1e83c159316f9923c5c83759f6a34f87be1322ce4ad0facd9fc4aef4790
3
+ size 353621248
onnx/language_model_q4f16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b78e9235be5e2e2a811e482399155cb30415f6d87c98c21d12bf48843fc928f
3
+ size 229388
onnx/language_model_q4f16.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2480da95471e4cd41a6b1876686e65e8a594c82459f2e5d6fd7592a5bad4e6da
3
+ size 304737408
onnx/speech_encoder.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f1c8a0f89b77bf9cd5dd8f2e034eb2c79dc00fe70d41196b28c257643b00ccb
3
+ size 1184608
onnx/speech_encoder.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04431dcef6325c54b02de2219845888b464bcd1f1ac2f8839c2fecd1ed2ef294
3
+ size 591274880
preprocessor_config.json ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ {
2
+ "feature_extractor_type": "ChatterboxFeatureExtractor",
3
+ "processor_class": "ChatterboxProcessor",
4
+ "sampling_rate": 24000
5
+ }
tokenizer.json ADDED
@@ -0,0 +1,1611 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "1.0",
3
+ "truncation": null,
4
+ "padding": null,
5
+ "added_tokens": [
6
+ {
7
+ "id": 0,
8
+ "special": true,
9
+ "content": "[STOP]",
10
+ "single_word": false,
11
+ "lstrip": false,
12
+ "rstrip": false,
13
+ "normalized": false
14
+ },
15
+ {
16
+ "id": 1,
17
+ "special": true,
18
+ "content": "[UNK]",
19
+ "single_word": false,
20
+ "lstrip": false,
21
+ "rstrip": false,
22
+ "normalized": false
23
+ },
24
+ {
25
+ "id": 255,
26
+ "special": true,
27
+ "content": "[START]",
28
+ "single_word": false,
29
+ "lstrip": false,
30
+ "rstrip": false,
31
+ "normalized": false
32
+ },
33
+ {
34
+ "id": 604,
35
+ "content": "[UH]",
36
+ "single_word": false,
37
+ "lstrip": false,
38
+ "rstrip": false,
39
+ "normalized": false,
40
+ "special": true
41
+ },
42
+ {
43
+ "id": 605,
44
+ "content": "[UM]",
45
+ "single_word": false,
46
+ "lstrip": false,
47
+ "rstrip": false,
48
+ "normalized": false,
49
+ "special": true
50
+ },
51
+ {
52
+ "id": 606,
53
+ "content": "[giggle]",
54
+ "single_word": false,
55
+ "lstrip": false,
56
+ "rstrip": false,
57
+ "normalized": false,
58
+ "special": true
59
+ },
60
+ {
61
+ "id": 607,
62
+ "content": "[laughter]",
63
+ "single_word": false,
64
+ "lstrip": false,
65
+ "rstrip": false,
66
+ "normalized": false,
67
+ "special": true
68
+ },
69
+ {
70
+ "id": 608,
71
+ "content": "[guffaw]",
72
+ "single_word": false,
73
+ "lstrip": false,
74
+ "rstrip": false,
75
+ "normalized": false,
76
+ "special": true
77
+ },
78
+ {
79
+ "id": 609,
80
+ "content": "[inhale]",
81
+ "single_word": false,
82
+ "lstrip": false,
83
+ "rstrip": false,
84
+ "normalized": false,
85
+ "special": true
86
+ },
87
+ {
88
+ "id": 610,
89
+ "content": "[exhale]",
90
+ "single_word": false,
91
+ "lstrip": false,
92
+ "rstrip": false,
93
+ "normalized": false,
94
+ "special": true
95
+ },
96
+ {
97
+ "id": 611,
98
+ "content": "[sigh]",
99
+ "single_word": false,
100
+ "lstrip": false,
101
+ "rstrip": false,
102
+ "normalized": false,
103
+ "special": true
104
+ },
105
+ {
106
+ "id": 612,
107
+ "content": "[cry]",
108
+ "single_word": false,
109
+ "lstrip": false,
110
+ "rstrip": false,
111
+ "normalized": false,
112
+ "special": true
113
+ },
114
+ {
115
+ "id": 613,
116
+ "content": "[bark]",
117
+ "single_word": false,
118
+ "lstrip": false,
119
+ "rstrip": false,
120
+ "normalized": false,
121
+ "special": true
122
+ },
123
+ {
124
+ "id": 614,
125
+ "content": "[howl]",
126
+ "single_word": false,
127
+ "lstrip": false,
128
+ "rstrip": false,
129
+ "normalized": false,
130
+ "special": true
131
+ },
132
+ {
133
+ "id": 615,
134
+ "content": "[meow]",
135
+ "single_word": false,
136
+ "lstrip": false,
137
+ "rstrip": false,
138
+ "normalized": false,
139
+ "special": true
140
+ },
141
+ {
142
+ "id": 616,
143
+ "content": "[singing]",
144
+ "single_word": false,
145
+ "lstrip": false,
146
+ "rstrip": false,
147
+ "normalized": false,
148
+ "special": true
149
+ },
150
+ {
151
+ "id": 617,
152
+ "content": "[music]",
153
+ "single_word": false,
154
+ "lstrip": false,
155
+ "rstrip": false,
156
+ "normalized": false,
157
+ "special": true
158
+ },
159
+ {
160
+ "id": 618,
161
+ "content": "[whistle]",
162
+ "single_word": false,
163
+ "lstrip": false,
164
+ "rstrip": false,
165
+ "normalized": false,
166
+ "special": true
167
+ },
168
+ {
169
+ "id": 619,
170
+ "content": "[humming]",
171
+ "single_word": false,
172
+ "lstrip": false,
173
+ "rstrip": false,
174
+ "normalized": false,
175
+ "special": true
176
+ },
177
+ {
178
+ "id": 620,
179
+ "content": "[gasp]",
180
+ "single_word": false,
181
+ "lstrip": false,
182
+ "rstrip": false,
183
+ "normalized": false,
184
+ "special": true
185
+ },
186
+ {
187
+ "id": 621,
188
+ "content": "[groan]",
189
+ "single_word": false,
190
+ "lstrip": false,
191
+ "rstrip": false,
192
+ "normalized": false,
193
+ "special": true
194
+ },
195
+ {
196
+ "id": 622,
197
+ "content": "[whisper]",
198
+ "single_word": false,
199
+ "lstrip": false,
200
+ "rstrip": false,
201
+ "normalized": false,
202
+ "special": true
203
+ },
204
+ {
205
+ "id": 623,
206
+ "content": "[mumble]",
207
+ "single_word": false,
208
+ "lstrip": false,
209
+ "rstrip": false,
210
+ "normalized": false,
211
+ "special": true
212
+ },
213
+ {
214
+ "id": 624,
215
+ "content": "[sniff]",
216
+ "single_word": false,
217
+ "lstrip": false,
218
+ "rstrip": false,
219
+ "normalized": false,
220
+ "special": true
221
+ },
222
+ {
223
+ "id": 625,
224
+ "content": "[sneeze]",
225
+ "single_word": false,
226
+ "lstrip": false,
227
+ "rstrip": false,
228
+ "normalized": false,
229
+ "special": true
230
+ },
231
+ {
232
+ "id": 626,
233
+ "content": "[cough]",
234
+ "single_word": false,
235
+ "lstrip": false,
236
+ "rstrip": false,
237
+ "normalized": false,
238
+ "special": true
239
+ },
240
+ {
241
+ "id": 627,
242
+ "content": "[snore]",
243
+ "single_word": false,
244
+ "lstrip": false,
245
+ "rstrip": false,
246
+ "normalized": false,
247
+ "special": true
248
+ },
249
+ {
250
+ "id": 628,
251
+ "content": "[chew]",
252
+ "single_word": false,
253
+ "lstrip": false,
254
+ "rstrip": false,
255
+ "normalized": false,
256
+ "special": true
257
+ },
258
+ {
259
+ "id": 629,
260
+ "content": "[sip]",
261
+ "single_word": false,
262
+ "lstrip": false,
263
+ "rstrip": false,
264
+ "normalized": false,
265
+ "special": true
266
+ },
267
+ {
268
+ "id": 630,
269
+ "content": "[clear_throat]",
270
+ "single_word": false,
271
+ "lstrip": false,
272
+ "rstrip": false,
273
+ "normalized": false,
274
+ "special": true
275
+ },
276
+ {
277
+ "id": 631,
278
+ "content": "[kiss]",
279
+ "single_word": false,
280
+ "lstrip": false,
281
+ "rstrip": false,
282
+ "normalized": false,
283
+ "special": true
284
+ },
285
+ {
286
+ "id": 632,
287
+ "content": "[shhh]",
288
+ "single_word": false,
289
+ "lstrip": false,
290
+ "rstrip": false,
291
+ "normalized": false,
292
+ "special": true
293
+ },
294
+ {
295
+ "id": 633,
296
+ "content": "[gibberish]",
297
+ "single_word": false,
298
+ "lstrip": false,
299
+ "rstrip": false,
300
+ "normalized": false,
301
+ "special": true
302
+ },
303
+ {
304
+ "id": 634,
305
+ "content": "[fr]",
306
+ "single_word": false,
307
+ "lstrip": false,
308
+ "rstrip": false,
309
+ "normalized": false,
310
+ "special": true
311
+ },
312
+ {
313
+ "id": 635,
314
+ "content": "[es]",
315
+ "single_word": false,
316
+ "lstrip": false,
317
+ "rstrip": false,
318
+ "normalized": false,
319
+ "special": true
320
+ },
321
+ {
322
+ "id": 636,
323
+ "content": "[de]",
324
+ "single_word": false,
325
+ "lstrip": false,
326
+ "rstrip": false,
327
+ "normalized": false,
328
+ "special": true
329
+ },
330
+ {
331
+ "id": 637,
332
+ "content": "[it]",
333
+ "single_word": false,
334
+ "lstrip": false,
335
+ "rstrip": false,
336
+ "normalized": false,
337
+ "special": true
338
+ },
339
+ {
340
+ "id": 638,
341
+ "content": "[ipa]",
342
+ "single_word": false,
343
+ "lstrip": false,
344
+ "rstrip": false,
345
+ "normalized": false,
346
+ "special": true
347
+ },
348
+ {
349
+ "id": 639,
350
+ "content": "[end_of_label]",
351
+ "single_word": false,
352
+ "lstrip": false,
353
+ "rstrip": false,
354
+ "normalized": false,
355
+ "special": true
356
+ },
357
+ {
358
+ "id": 695,
359
+ "content": "[PLACEHOLDER55]",
360
+ "single_word": false,
361
+ "lstrip": false,
362
+ "rstrip": false,
363
+ "normalized": false,
364
+ "special": true
365
+ },
366
+ {
367
+ "id": 696,
368
+ "content": "[PLACEHOLDER56]",
369
+ "single_word": false,
370
+ "lstrip": false,
371
+ "rstrip": false,
372
+ "normalized": false,
373
+ "special": true
374
+ },
375
+ {
376
+ "id": 697,
377
+ "content": "[PLACEHOLDER57]",
378
+ "single_word": false,
379
+ "lstrip": false,
380
+ "rstrip": false,
381
+ "normalized": false,
382
+ "special": true
383
+ },
384
+ {
385
+ "id": 698,
386
+ "content": "[PLACEHOLDER58]",
387
+ "single_word": false,
388
+ "lstrip": false,
389
+ "rstrip": false,
390
+ "normalized": false,
391
+ "special": true
392
+ },
393
+ {
394
+ "id": 699,
395
+ "content": "[PLACEHOLDER59]",
396
+ "single_word": false,
397
+ "lstrip": false,
398
+ "rstrip": false,
399
+ "normalized": false,
400
+ "special": true
401
+ },
402
+ {
403
+ "id": 700,
404
+ "content": "[PLACEHOLDER60]",
405
+ "single_word": false,
406
+ "lstrip": false,
407
+ "rstrip": false,
408
+ "normalized": false,
409
+ "special": true
410
+ },
411
+ {
412
+ "id": 701,
413
+ "content": "[PLACEHOLDER61]",
414
+ "single_word": false,
415
+ "lstrip": false,
416
+ "rstrip": false,
417
+ "normalized": false,
418
+ "special": true
419
+ },
420
+ {
421
+ "id": 702,
422
+ "content": "[PLACEHOLDER62]",
423
+ "single_word": false,
424
+ "lstrip": false,
425
+ "rstrip": false,
426
+ "normalized": false,
427
+ "special": true
428
+ },
429
+ {
430
+ "id": 703,
431
+ "content": "[PLACEHOLDER63]",
432
+ "single_word": false,
433
+ "lstrip": false,
434
+ "rstrip": false,
435
+ "normalized": false,
436
+ "special": true
437
+ },
438
+ {
439
+ "id": 6561,
440
+ "content": "[START_SPEECH]",
441
+ "single_word": false,
442
+ "lstrip": false,
443
+ "rstrip": false,
444
+ "normalized": false,
445
+ "special": true
446
+ },
447
+ {
448
+ "id": 6562,
449
+ "content": "[STOP_SPEECH]",
450
+ "single_word": false,
451
+ "lstrip": false,
452
+ "rstrip": false,
453
+ "normalized": false,
454
+ "special": true
455
+ },
456
+ {
457
+ "id": 6563,
458
+ "content": "[EXAGGERATION]",
459
+ "single_word": false,
460
+ "lstrip": false,
461
+ "rstrip": false,
462
+ "normalized": false,
463
+ "special": true
464
+ }
465
+ ],
466
+ "normalizer": {
467
+ "type": "Replace",
468
+ "pattern": {
469
+ "Regex": "\\s+"
470
+ },
471
+ "content": " "
472
+ },
473
+ "pre_tokenizer": null,
474
+ "post_processor": {
475
+ "type": "TemplateProcessing",
476
+ "single": [
477
+ {
478
+ "SpecialToken": {
479
+ "id": "[EXAGGERATION]",
480
+ "type_id": 0
481
+ }
482
+ },
483
+ {
484
+ "SpecialToken": {
485
+ "id": "[START]",
486
+ "type_id": 0
487
+ }
488
+ },
489
+ {
490
+ "Sequence": {
491
+ "id": "A",
492
+ "type_id": 0
493
+ }
494
+ },
495
+ {
496
+ "SpecialToken": {
497
+ "id": "[STOP]",
498
+ "type_id": 0
499
+ }
500
+ },
501
+ {
502
+ "SpecialToken": {
503
+ "id": "[START_SPEECH]",
504
+ "type_id": 0
505
+ }
506
+ },
507
+ {
508
+ "SpecialToken": {
509
+ "id": "[START_SPEECH]",
510
+ "type_id": 0
511
+ }
512
+ }
513
+ ],
514
+ "pair": [
515
+ {
516
+ "SpecialToken": {
517
+ "id": "[EXAGGERATION]",
518
+ "type_id": 0
519
+ }
520
+ },
521
+ {
522
+ "SpecialToken": {
523
+ "id": "[START]",
524
+ "type_id": 0
525
+ }
526
+ },
527
+ {
528
+ "Sequence": {
529
+ "id": "A",
530
+ "type_id": 0
531
+ }
532
+ },
533
+ {
534
+ "SpecialToken": {
535
+ "id": "[STOP]",
536
+ "type_id": 0
537
+ }
538
+ },
539
+ {
540
+ "SpecialToken": {
541
+ "id": "[START_SPEECH]",
542
+ "type_id": 0
543
+ }
544
+ },
545
+ {
546
+ "SpecialToken": {
547
+ "id": "[START_SPEECH]",
548
+ "type_id": 0
549
+ }
550
+ },
551
+ {
552
+ "SpecialToken": {
553
+ "id": "[EXAGGERATION]",
554
+ "type_id": 1
555
+ }
556
+ },
557
+ {
558
+ "SpecialToken": {
559
+ "id": "[START]",
560
+ "type_id": 1
561
+ }
562
+ },
563
+ {
564
+ "Sequence": {
565
+ "id": "B",
566
+ "type_id": 1
567
+ }
568
+ },
569
+ {
570
+ "SpecialToken": {
571
+ "id": "[STOP]",
572
+ "type_id": 1
573
+ }
574
+ },
575
+ {
576
+ "SpecialToken": {
577
+ "id": "[START_SPEECH]",
578
+ "type_id": 1
579
+ }
580
+ },
581
+ {
582
+ "SpecialToken": {
583
+ "id": "[START_SPEECH]",
584
+ "type_id": 1
585
+ }
586
+ }
587
+ ],
588
+ "special_tokens": {
589
+ "[START]": {
590
+ "id": "[START]",
591
+ "ids": [
592
+ 255
593
+ ],
594
+ "tokens": [
595
+ "[START]"
596
+ ]
597
+ },
598
+ "[STOP]": {
599
+ "id": "[STOP]",
600
+ "ids": [
601
+ 0
602
+ ],
603
+ "tokens": [
604
+ "[STOP]"
605
+ ]
606
+ },
607
+ "[EXAGGERATION]": {
608
+ "id": "[EXAGGERATION]",
609
+ "ids": [
610
+ 6563
611
+ ],
612
+ "tokens": [
613
+ "[EXAGGERATION]"
614
+ ]
615
+ },
616
+ "[START_SPEECH]": {
617
+ "id": "[START_SPEECH]",
618
+ "ids": [
619
+ 6561
620
+ ],
621
+ "tokens": [
622
+ "[START_SPEECH]"
623
+ ]
624
+ }
625
+ }
626
+ },
627
+ "decoder": {
628
+ "type": "Fuse"
629
+ },
630
+ "model": {
631
+ "type": "BPE",
632
+ "dropout": null,
633
+ "unk_token": "[UNK]",
634
+ "continuing_subword_prefix": null,
635
+ "end_of_word_suffix": null,
636
+ "fuse_unk": false,
637
+ "vocab": {
638
+ "[STOP]": 0,
639
+ "[UNK]": 1,
640
+ " ": 2,
641
+ "!": 3,
642
+ "'": 4,
643
+ "(": 5,
644
+ ")": 6,
645
+ ",": 7,
646
+ "-": 8,
647
+ ".": 9,
648
+ "/": 10,
649
+ ":": 11,
650
+ ";": 12,
651
+ "?": 13,
652
+ "a": 14,
653
+ "b": 15,
654
+ "c": 16,
655
+ "d": 17,
656
+ "e": 18,
657
+ "f": 19,
658
+ "g": 20,
659
+ "h": 21,
660
+ "i": 22,
661
+ "j": 23,
662
+ "k": 24,
663
+ "l": 25,
664
+ "m": 26,
665
+ "n": 27,
666
+ "o": 28,
667
+ "p": 29,
668
+ "q": 30,
669
+ "r": 31,
670
+ "s": 32,
671
+ "t": 33,
672
+ "u": 34,
673
+ "v": 35,
674
+ "w": 36,
675
+ "x": 37,
676
+ "y": 38,
677
+ "z": 39,
678
+ "th": 40,
679
+ "in": 41,
680
+ "the": 42,
681
+ "an": 43,
682
+ "er": 44,
683
+ "ou": 45,
684
+ "re": 46,
685
+ "on": 47,
686
+ "at": 48,
687
+ "ed": 49,
688
+ "en": 50,
689
+ "to": 51,
690
+ "ing": 52,
691
+ "and": 53,
692
+ "is": 54,
693
+ "as": 55,
694
+ "al": 56,
695
+ "or": 57,
696
+ "of": 58,
697
+ "ar": 59,
698
+ "it": 60,
699
+ "es": 61,
700
+ "he": 62,
701
+ "st": 63,
702
+ "le": 64,
703
+ "om": 65,
704
+ "se": 66,
705
+ "be": 67,
706
+ "ad": 68,
707
+ "ow": 69,
708
+ "ly": 70,
709
+ "ch": 71,
710
+ "wh": 72,
711
+ "that": 73,
712
+ "you": 74,
713
+ "li": 75,
714
+ "ve": 76,
715
+ "ac": 77,
716
+ "ti": 78,
717
+ "ld": 79,
718
+ "me": 80,
719
+ "was": 81,
720
+ "gh": 82,
721
+ "id": 83,
722
+ "ll": 84,
723
+ "wi": 85,
724
+ "ent": 86,
725
+ "for": 87,
726
+ "ay": 88,
727
+ "ro": 89,
728
+ "ver": 90,
729
+ "ic": 91,
730
+ "her": 92,
731
+ "ke": 93,
732
+ "his": 94,
733
+ "no": 95,
734
+ "ut": 96,
735
+ "un": 97,
736
+ "ir": 98,
737
+ "lo": 99,
738
+ "we": 100,
739
+ "ri": 101,
740
+ "ha": 102,
741
+ "with": 103,
742
+ "ght": 104,
743
+ "out": 105,
744
+ "im": 106,
745
+ "ion": 107,
746
+ "all": 108,
747
+ "ab": 109,
748
+ "one": 110,
749
+ "ne": 111,
750
+ "ge": 112,
751
+ "ould": 113,
752
+ "ter": 114,
753
+ "mo": 115,
754
+ "had": 116,
755
+ "ce": 117,
756
+ "she": 118,
757
+ "go": 119,
758
+ "sh": 120,
759
+ "ur": 121,
760
+ "am": 122,
761
+ "so": 123,
762
+ "pe": 124,
763
+ "my": 125,
764
+ "de": 126,
765
+ "are": 127,
766
+ "but": 128,
767
+ "ome": 129,
768
+ "fr": 130,
769
+ "ther": 131,
770
+ "fe": 132,
771
+ "su": 133,
772
+ "do": 134,
773
+ "con": 135,
774
+ "te": 136,
775
+ "ain": 137,
776
+ "ere": 138,
777
+ "po": 139,
778
+ "if": 140,
779
+ "they": 141,
780
+ "us": 142,
781
+ "ag": 143,
782
+ "tr": 144,
783
+ "now": 145,
784
+ "oun": 146,
785
+ "this": 147,
786
+ "have": 148,
787
+ "not": 149,
788
+ "sa": 150,
789
+ "il": 151,
790
+ "up": 152,
791
+ "thing": 153,
792
+ "from": 154,
793
+ "ap": 155,
794
+ "him": 156,
795
+ "ack": 157,
796
+ "ation": 158,
797
+ "ant": 159,
798
+ "our": 160,
799
+ "op": 161,
800
+ "like": 162,
801
+ "ust": 163,
802
+ "ess": 164,
803
+ "bo": 165,
804
+ "ok": 166,
805
+ "ul": 167,
806
+ "ind": 168,
807
+ "ex": 169,
808
+ "com": 170,
809
+ "some": 171,
810
+ "there": 172,
811
+ "ers": 173,
812
+ "co": 174,
813
+ "res": 175,
814
+ "man": 176,
815
+ "ard": 177,
816
+ "pl": 178,
817
+ "wor": 179,
818
+ "way": 180,
819
+ "tion": 181,
820
+ "fo": 182,
821
+ "ca": 183,
822
+ "were": 184,
823
+ "by": 185,
824
+ "ate": 186,
825
+ "pro": 187,
826
+ "ted": 188,
827
+ "ound": 189,
828
+ "own": 190,
829
+ "would": 191,
830
+ "ts": 192,
831
+ "what": 193,
832
+ "qu": 194,
833
+ "ally": 195,
834
+ "ight": 196,
835
+ "ck": 197,
836
+ "gr": 198,
837
+ "when": 199,
838
+ "ven": 200,
839
+ "can": 201,
840
+ "ough": 202,
841
+ "ine": 203,
842
+ "end": 204,
843
+ "per": 205,
844
+ "ous": 206,
845
+ "od": 207,
846
+ "ide": 208,
847
+ "know": 209,
848
+ "ty": 210,
849
+ "very": 211,
850
+ "si": 212,
851
+ "ak": 213,
852
+ "who": 214,
853
+ "about": 215,
854
+ "ill": 216,
855
+ "them": 217,
856
+ "est": 218,
857
+ "red": 219,
858
+ "ye": 220,
859
+ "could": 221,
860
+ "ong": 222,
861
+ "your": 223,
862
+ "their": 224,
863
+ "em": 225,
864
+ "just": 226,
865
+ "other": 227,
866
+ "into": 228,
867
+ "any": 229,
868
+ "whi": 230,
869
+ "um": 231,
870
+ "tw": 232,
871
+ "ast": 233,
872
+ "der": 234,
873
+ "did": 235,
874
+ "ie": 236,
875
+ "been": 237,
876
+ "ace": 238,
877
+ "ink": 239,
878
+ "ity": 240,
879
+ "back": 241,
880
+ "ting": 242,
881
+ "br": 243,
882
+ "more": 244,
883
+ "ake": 245,
884
+ "pp": 246,
885
+ "then": 247,
886
+ "sp": 248,
887
+ "el": 249,
888
+ "use": 250,
889
+ "bl": 251,
890
+ "said": 252,
891
+ "over": 253,
892
+ "get": 254,
893
+ "[START]": 255,
894
+ "\"": 256,
895
+ "#": 257,
896
+ "$": 258,
897
+ "%": 259,
898
+ "&": 260,
899
+ "*": 261,
900
+ "+": 262,
901
+ "0": 263,
902
+ "1": 264,
903
+ "2": 265,
904
+ "3": 266,
905
+ "4": 267,
906
+ "5": 268,
907
+ "6": 269,
908
+ "7": 270,
909
+ "8": 271,
910
+ "9": 272,
911
+ "<": 273,
912
+ "=": 274,
913
+ ">": 275,
914
+ "@": 276,
915
+ "A": 277,
916
+ "B": 278,
917
+ "C": 279,
918
+ "D": 280,
919
+ "E": 281,
920
+ "F": 282,
921
+ "G": 283,
922
+ "H": 284,
923
+ "I": 285,
924
+ "J": 286,
925
+ "K": 287,
926
+ "L": 288,
927
+ "M": 289,
928
+ "N": 290,
929
+ "O": 291,
930
+ "P": 292,
931
+ "Q": 293,
932
+ "R": 294,
933
+ "S": 295,
934
+ "T": 296,
935
+ "U": 297,
936
+ "V": 298,
937
+ "W": 299,
938
+ "X": 300,
939
+ "Y": 301,
940
+ "Z": 302,
941
+ "[": 303,
942
+ "\\": 304,
943
+ "]": 305,
944
+ "^": 306,
945
+ "_": 307,
946
+ "`": 308,
947
+ "{": 309,
948
+ "|": 310,
949
+ "}": 311,
950
+ "~": 312,
951
+ "‐": 313,
952
+ "‑": 314,
953
+ "‒": 315,
954
+ "–": 316,
955
+ "—": 317,
956
+ "―": 318,
957
+ "‖": 319,
958
+ "‗": 320,
959
+ "‘": 321,
960
+ "’": 322,
961
+ "‚": 323,
962
+ "‛": 324,
963
+ "“": 325,
964
+ "”": 326,
965
+ "„": 327,
966
+ "‟": 328,
967
+ " ": 329,
968
+ "¡": 330,
969
+ "¢": 331,
970
+ "£": 332,
971
+ "¤": 333,
972
+ "¥": 334,
973
+ "¦": 335,
974
+ "§": 336,
975
+ "¨": 337,
976
+ "©": 338,
977
+ "ª": 339,
978
+ "«": 340,
979
+ "¬": 341,
980
+ "­": 342,
981
+ "®": 343,
982
+ "¯": 344,
983
+ "°": 345,
984
+ "±": 346,
985
+ "²": 347,
986
+ "³": 348,
987
+ "´": 349,
988
+ "µ": 350,
989
+ "¶": 351,
990
+ "·": 352,
991
+ "¸": 353,
992
+ "¹": 354,
993
+ "º": 355,
994
+ "»": 356,
995
+ "¼": 357,
996
+ "½": 358,
997
+ "¾": 359,
998
+ "¿": 360,
999
+ "À": 361,
1000
+ "Á": 362,
1001
+ "Â": 363,
1002
+ "Ã": 364,
1003
+ "Ä": 365,
1004
+ "Å": 366,
1005
+ "Æ": 367,
1006
+ "Ç": 368,
1007
+ "È": 369,
1008
+ "É": 370,
1009
+ "Ê": 371,
1010
+ "Ë": 372,
1011
+ "Ì": 373,
1012
+ "Í": 374,
1013
+ "Î": 375,
1014
+ "Ï": 376,
1015
+ "Ð": 377,
1016
+ "Ñ": 378,
1017
+ "Ò": 379,
1018
+ "Ó": 380,
1019
+ "Ô": 381,
1020
+ "Õ": 382,
1021
+ "Ö": 383,
1022
+ "×": 384,
1023
+ "Ø": 385,
1024
+ "Ù": 386,
1025
+ "Ú": 387,
1026
+ "Û": 388,
1027
+ "Ü": 389,
1028
+ "Ý": 390,
1029
+ "Þ": 391,
1030
+ "ß": 392,
1031
+ "à": 393,
1032
+ "á": 394,
1033
+ "â": 395,
1034
+ "ã": 396,
1035
+ "ä": 397,
1036
+ "å": 398,
1037
+ "æ": 399,
1038
+ "ç": 400,
1039
+ "è": 401,
1040
+ "é": 402,
1041
+ "ê": 403,
1042
+ "ë": 404,
1043
+ "ì": 405,
1044
+ "í": 406,
1045
+ "î": 407,
1046
+ "ï": 408,
1047
+ "ð": 409,
1048
+ "ñ": 410,
1049
+ "ò": 411,
1050
+ "ó": 412,
1051
+ "ô": 413,
1052
+ "õ": 414,
1053
+ "ö": 415,
1054
+ "÷": 416,
1055
+ "ø": 417,
1056
+ "ù": 418,
1057
+ "ú": 419,
1058
+ "û": 420,
1059
+ "ü": 421,
1060
+ "ý": 422,
1061
+ "þ": 423,
1062
+ "ÿ": 424,
1063
+ "ɐ": 425,
1064
+ "ɑ": 426,
1065
+ "ɒ": 427,
1066
+ "ɓ": 428,
1067
+ "ɔ": 429,
1068
+ "ɕ": 430,
1069
+ "ɖ": 431,
1070
+ "ɗ": 432,
1071
+ "ɘ": 433,
1072
+ "ə": 434,
1073
+ "ɚ": 435,
1074
+ "ɛ": 436,
1075
+ "ɜ": 437,
1076
+ "ɝ": 438,
1077
+ "ɞ": 439,
1078
+ "ɟ": 440,
1079
+ "ɠ": 441,
1080
+ "ɡ": 442,
1081
+ "ɢ": 443,
1082
+ "ɣ": 444,
1083
+ "ɤ": 445,
1084
+ "ɥ": 446,
1085
+ "ɦ": 447,
1086
+ "ɧ": 448,
1087
+ "ɨ": 449,
1088
+ "ɩ": 450,
1089
+ "ɪ": 451,
1090
+ "ɫ": 452,
1091
+ "ɬ": 453,
1092
+ "ɭ": 454,
1093
+ "ɮ": 455,
1094
+ "ɯ": 456,
1095
+ "ɰ": 457,
1096
+ "ɱ": 458,
1097
+ "ɲ": 459,
1098
+ "ɳ": 460,
1099
+ "ɴ": 461,
1100
+ "ɵ": 462,
1101
+ "ɶ": 463,
1102
+ "ɷ": 464,
1103
+ "ɸ": 465,
1104
+ "ɹ": 466,
1105
+ "ɺ": 467,
1106
+ "ɻ": 468,
1107
+ "ɼ": 469,
1108
+ "ɽ": 470,
1109
+ "ɾ": 471,
1110
+ "ɿ": 472,
1111
+ "ʀ": 473,
1112
+ "ʁ": 474,
1113
+ "ʂ": 475,
1114
+ "ʃ": 476,
1115
+ "ʄ": 477,
1116
+ "ʅ": 478,
1117
+ "ʆ": 479,
1118
+ "ʇ": 480,
1119
+ "ʈ": 481,
1120
+ "ʉ": 482,
1121
+ "ʊ": 483,
1122
+ "ʋ": 484,
1123
+ "ʌ": 485,
1124
+ "ʍ": 486,
1125
+ "ʎ": 487,
1126
+ "ʏ": 488,
1127
+ "ʐ": 489,
1128
+ "ʑ": 490,
1129
+ "ʒ": 491,
1130
+ "ʓ": 492,
1131
+ "ʔ": 493,
1132
+ "ʕ": 494,
1133
+ "ʖ": 495,
1134
+ "ʗ": 496,
1135
+ "ʘ": 497,
1136
+ "ʙ": 498,
1137
+ "ʚ": 499,
1138
+ "ʛ": 500,
1139
+ "ʜ": 501,
1140
+ "ʝ": 502,
1141
+ "ʞ": 503,
1142
+ "ʟ": 504,
1143
+ "ʠ": 505,
1144
+ "ʡ": 506,
1145
+ "ʢ": 507,
1146
+ "ʣ": 508,
1147
+ "ʤ": 509,
1148
+ "ʥ": 510,
1149
+ "ʦ": 511,
1150
+ "ʧ": 512,
1151
+ "ʨ": 513,
1152
+ "ʩ": 514,
1153
+ "ʪ": 515,
1154
+ "ʫ": 516,
1155
+ "ʬ": 517,
1156
+ "ʭ": 518,
1157
+ "ʮ": 519,
1158
+ "ʯ": 520,
1159
+ "ʰ": 521,
1160
+ "ʱ": 522,
1161
+ "ʲ": 523,
1162
+ "ʳ": 524,
1163
+ "ʴ": 525,
1164
+ "ʵ": 526,
1165
+ "ʶ": 527,
1166
+ "ʷ": 528,
1167
+ "ʸ": 529,
1168
+ "ʹ": 530,
1169
+ "ʺ": 531,
1170
+ "ʻ": 532,
1171
+ "ʼ": 533,
1172
+ "ʽ": 534,
1173
+ "ʾ": 535,
1174
+ "ʿ": 536,
1175
+ "ˀ": 537,
1176
+ "ˁ": 538,
1177
+ "˂": 539,
1178
+ "˃": 540,
1179
+ "˄": 541,
1180
+ "˅": 542,
1181
+ "ˆ": 543,
1182
+ "ˇ": 544,
1183
+ "ˈ": 545,
1184
+ "ˉ": 546,
1185
+ "ˊ": 547,
1186
+ "ˋ": 548,
1187
+ "ˌ": 549,
1188
+ "ˍ": 550,
1189
+ "ˎ": 551,
1190
+ "ˏ": 552,
1191
+ "ː": 553,
1192
+ "ˑ": 554,
1193
+ "˒": 555,
1194
+ "˓": 556,
1195
+ "˔": 557,
1196
+ "˕": 558,
1197
+ "˖": 559,
1198
+ "˗": 560,
1199
+ "˘": 561,
1200
+ "˙": 562,
1201
+ "˚": 563,
1202
+ "˛": 564,
1203
+ "˜": 565,
1204
+ "˝": 566,
1205
+ "˞": 567,
1206
+ "˟": 568,
1207
+ "ˠ": 569,
1208
+ "ˡ": 570,
1209
+ "ˢ": 571,
1210
+ "ˣ": 572,
1211
+ "ˤ": 573,
1212
+ "˥": 574,
1213
+ "˦": 575,
1214
+ "˧": 576,
1215
+ "˨": 577,
1216
+ "˩": 578,
1217
+ "˪": 579,
1218
+ "˫": 580,
1219
+ "ˬ": 581,
1220
+ "˭": 582,
1221
+ "ˮ": 583,
1222
+ "˯": 584,
1223
+ "˰": 585,
1224
+ "˱": 586,
1225
+ "˲": 587,
1226
+ "˳": 588,
1227
+ "˴": 589,
1228
+ "˵": 590,
1229
+ "˶": 591,
1230
+ "˷": 592,
1231
+ "˸": 593,
1232
+ "˹": 594,
1233
+ "˺": 595,
1234
+ "˻": 596,
1235
+ "˼": 597,
1236
+ "˽": 598,
1237
+ "˾": 599,
1238
+ "˿": 600,
1239
+ "ā": 601,
1240
+ "ō": 602,
1241
+ "…": 603,
1242
+ "[UH]": 604,
1243
+ "[UM]": 605,
1244
+ "[giggle]": 606,
1245
+ "[laughter]": 607,
1246
+ "[guffaw]": 608,
1247
+ "[inhale]": 609,
1248
+ "[exhale]": 610,
1249
+ "[sigh]": 611,
1250
+ "[cry]": 612,
1251
+ "[bark]": 613,
1252
+ "[howl]": 614,
1253
+ "[meow]": 615,
1254
+ "[singing]": 616,
1255
+ "[music]": 617,
1256
+ "[whistle]": 618,
1257
+ "[humming]": 619,
1258
+ "[gasp]": 620,
1259
+ "[groan]": 621,
1260
+ "[whisper]": 622,
1261
+ "[mumble]": 623,
1262
+ "[sniff]": 624,
1263
+ "[sneeze]": 625,
1264
+ "[cough]": 626,
1265
+ "[snore]": 627,
1266
+ "[chew]": 628,
1267
+ "[sip]": 629,
1268
+ "[clear_throat]": 630,
1269
+ "[kiss]": 631,
1270
+ "[shhh]": 632,
1271
+ "[gibberish]": 633,
1272
+ "[fr]": 634,
1273
+ "[es]": 635,
1274
+ "[de]": 636,
1275
+ "[it]": 637,
1276
+ "[ipa]": 638,
1277
+ "[end_of_label]": 639,
1278
+ "ŋ": 640,
1279
+ "ᵻ": 641,
1280
+ "θ": 642,
1281
+ "̩": 643,
1282
+ "\u0303": 644,
1283
+ "ɑː": 645,
1284
+ "iː": 646,
1285
+ "uː": 647,
1286
+ "ɜː": 648,
1287
+ "ɔː": 649,
1288
+ "oː": 650,
1289
+ "eɪ": 651,
1290
+ "oʊ": 652,
1291
+ "aɪ": 653,
1292
+ "aʊ": 654,
1293
+ "ɔɪ": 655,
1294
+ "dʒ": 656,
1295
+ "tʃ": 657,
1296
+ "ɪŋ": 658,
1297
+ "ᵻd": 659,
1298
+ "ˈiː": 660,
1299
+ "ˌiː": 661,
1300
+ "ˈɪ": 662,
1301
+ "ˌɪ": 663,
1302
+ "ˈeɪ": 664,
1303
+ "ˌeɪ": 665,
1304
+ "ˈɛ": 666,
1305
+ "ˌɛ": 667,
1306
+ "ˈæ": 668,
1307
+ "ˌæ": 669,
1308
+ "ˈɑː": 670,
1309
+ "ˌɑː": 671,
1310
+ "ˈɔː": 672,
1311
+ "ˌɔː": 673,
1312
+ "oːɹ": 674,
1313
+ "ˈoːɹ": 675,
1314
+ "ˌoːɹ": 676,
1315
+ "ˈoʊ": 677,
1316
+ "ˌoʊ": 678,
1317
+ "ˈʊ": 679,
1318
+ "ˌʊ": 680,
1319
+ "ˈuː": 681,
1320
+ "ˌuː": 682,
1321
+ "ˈɜː": 683,
1322
+ "ˌɜː": 684,
1323
+ "ˈʌ": 685,
1324
+ "ˌʌ": 686,
1325
+ "ˈaɪ": 687,
1326
+ "ˌaɪ": 688,
1327
+ "ˈaʊ": 689,
1328
+ "ˌaʊ": 690,
1329
+ "ˈɔɪ": 691,
1330
+ "ˌɔɪ": 692,
1331
+ "ˈɚ": 693,
1332
+ "ˌɐ": 694,
1333
+ "[PLACEHOLDER55]": 695,
1334
+ "[PLACEHOLDER56]": 696,
1335
+ "[PLACEHOLDER57]": 697,
1336
+ "[PLACEHOLDER58]": 698,
1337
+ "[PLACEHOLDER59]": 699,
1338
+ "[PLACEHOLDER60]": 700,
1339
+ "[PLACEHOLDER61]": 701,
1340
+ "[PLACEHOLDER62]": 702,
1341
+ "[PLACEHOLDER63]": 703
1342
+ },
1343
+ "merges": [
1344
+ "t h",
1345
+ "i n",
1346
+ "th e",
1347
+ "a n",
1348
+ "e r",
1349
+ "o u",
1350
+ "r e",
1351
+ "o n",
1352
+ "a t",
1353
+ "e d",
1354
+ "e n",
1355
+ "t o",
1356
+ "in g",
1357
+ "an d",
1358
+ "i s",
1359
+ "a s",
1360
+ "a l",
1361
+ "o r",
1362
+ "o f",
1363
+ "a r",
1364
+ "i t",
1365
+ "e s",
1366
+ "h e",
1367
+ "s t",
1368
+ "l e",
1369
+ "o m",
1370
+ "s e",
1371
+ "b e",
1372
+ "a d",
1373
+ "o w",
1374
+ "l y",
1375
+ "c h",
1376
+ "w h",
1377
+ "th at",
1378
+ "y ou",
1379
+ "l i",
1380
+ "v e",
1381
+ "a c",
1382
+ "t i",
1383
+ "l d",
1384
+ "m e",
1385
+ "w as",
1386
+ "g h",
1387
+ "i d",
1388
+ "l l",
1389
+ "w i",
1390
+ "en t",
1391
+ "f or",
1392
+ "a y",
1393
+ "r o",
1394
+ "v er",
1395
+ "i c",
1396
+ "h er",
1397
+ "k e",
1398
+ "h is",
1399
+ "n o",
1400
+ "u t",
1401
+ "u n",
1402
+ "i r",
1403
+ "l o",
1404
+ "w e",
1405
+ "r i",
1406
+ "h a",
1407
+ "wi th",
1408
+ "gh t",
1409
+ "ou t",
1410
+ "i m",
1411
+ "i on",
1412
+ "al l",
1413
+ "a b",
1414
+ "on e",
1415
+ "n e",
1416
+ "g e",
1417
+ "ou ld",
1418
+ "t er",
1419
+ "m o",
1420
+ "h ad",
1421
+ "c e",
1422
+ "s he",
1423
+ "g o",
1424
+ "s h",
1425
+ "u r",
1426
+ "a m",
1427
+ "s o",
1428
+ "p e",
1429
+ "m y",
1430
+ "d e",
1431
+ "a re",
1432
+ "b ut",
1433
+ "om e",
1434
+ "f r",
1435
+ "the r",
1436
+ "f e",
1437
+ "s u",
1438
+ "d o",
1439
+ "c on",
1440
+ "t e",
1441
+ "a in",
1442
+ "er e",
1443
+ "p o",
1444
+ "i f",
1445
+ "the y",
1446
+ "u s",
1447
+ "a g",
1448
+ "t r",
1449
+ "n ow",
1450
+ "ou n",
1451
+ "th is",
1452
+ "ha ve",
1453
+ "no t",
1454
+ "s a",
1455
+ "i l",
1456
+ "u p",
1457
+ "th ing",
1458
+ "fr om",
1459
+ "a p",
1460
+ "h im",
1461
+ "ac k",
1462
+ "at ion",
1463
+ "an t",
1464
+ "ou r",
1465
+ "o p",
1466
+ "li ke",
1467
+ "u st",
1468
+ "es s",
1469
+ "b o",
1470
+ "o k",
1471
+ "u l",
1472
+ "in d",
1473
+ "e x",
1474
+ "c om",
1475
+ "s ome",
1476
+ "the re",
1477
+ "er s",
1478
+ "c o",
1479
+ "re s",
1480
+ "m an",
1481
+ "ar d",
1482
+ "p l",
1483
+ "w or",
1484
+ "w ay",
1485
+ "ti on",
1486
+ "f o",
1487
+ "c a",
1488
+ "w ere",
1489
+ "b y",
1490
+ "at e",
1491
+ "p ro",
1492
+ "t ed",
1493
+ "oun d",
1494
+ "ow n",
1495
+ "w ould",
1496
+ "t s",
1497
+ "wh at",
1498
+ "q u",
1499
+ "al ly",
1500
+ "i ght",
1501
+ "c k",
1502
+ "g r",
1503
+ "wh en",
1504
+ "v en",
1505
+ "c an",
1506
+ "ou gh",
1507
+ "in e",
1508
+ "en d",
1509
+ "p er",
1510
+ "ou s",
1511
+ "o d",
1512
+ "id e",
1513
+ "k now",
1514
+ "t y",
1515
+ "ver y",
1516
+ "s i",
1517
+ "a k",
1518
+ "wh o",
1519
+ "ab out",
1520
+ "i ll",
1521
+ "the m",
1522
+ "es t",
1523
+ "re d",
1524
+ "y e",
1525
+ "c ould",
1526
+ "on g",
1527
+ "you r",
1528
+ "the ir",
1529
+ "e m",
1530
+ "j ust",
1531
+ "o ther",
1532
+ "in to",
1533
+ "an y",
1534
+ "wh i",
1535
+ "u m",
1536
+ "t w",
1537
+ "as t",
1538
+ "d er",
1539
+ "d id",
1540
+ "i e",
1541
+ "be en",
1542
+ "ac e",
1543
+ "in k",
1544
+ "it y",
1545
+ "b ack",
1546
+ "t ing",
1547
+ "b r",
1548
+ "mo re",
1549
+ "a ke",
1550
+ "p p",
1551
+ "the n",
1552
+ "s p",
1553
+ "e l",
1554
+ "u se",
1555
+ "b l",
1556
+ "sa id",
1557
+ "o ver",
1558
+ "ge t",
1559
+ "ɑ ː",
1560
+ "i ː",
1561
+ "u ː",
1562
+ "ɜ ː",
1563
+ "ɔ ː",
1564
+ "o ː",
1565
+ "e ɪ",
1566
+ "o ʊ",
1567
+ "a ɪ",
1568
+ "a ʊ",
1569
+ "ɔ ɪ",
1570
+ "d ʒ",
1571
+ "t ʃ",
1572
+ "ɪ ŋ",
1573
+ "ᵻ d",
1574
+ "ˈ iː",
1575
+ "ˌ iː",
1576
+ "ˈ ɪ",
1577
+ "ˌ ɪ",
1578
+ "ˈ eɪ",
1579
+ "ˌ eɪ",
1580
+ "ˈ ɛ",
1581
+ "ˌ ɛ",
1582
+ "ˈ æ",
1583
+ "ˌ æ",
1584
+ "ˈ ɑː",
1585
+ "ˌ ɑː",
1586
+ "ˈ ɔː",
1587
+ "ˌ ɔː",
1588
+ "oː ɹ",
1589
+ "ˈ oːɹ",
1590
+ "ˌ oːɹ",
1591
+ "ˈ oʊ",
1592
+ "ˌ oʊ",
1593
+ "ˈ ʊ",
1594
+ "ˌ ʊ",
1595
+ "ˈ uː",
1596
+ "ˌ uː",
1597
+ "ˈ ɜː",
1598
+ "ˌ ɜː",
1599
+ "ˈ ʌ",
1600
+ "ˌ ʌ",
1601
+ "ˈ aɪ",
1602
+ "ˌ aɪ",
1603
+ "ˈ aʊ",
1604
+ "ˌ aʊ",
1605
+ "ˈ ɔɪ",
1606
+ "ˌ ɔɪ",
1607
+ "ˈ ɚ",
1608
+ "ˌ ɐ"
1609
+ ]
1610
+ }
1611
+ }
tokenizer_config.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_bos_token": true,
3
+ "add_eos_token": true,
4
+ "bos_token": "<s>",
5
+ "eos_token": "</s>",
6
+ "model_input_names": [
7
+ "input_ids",
8
+ "attention_mask"
9
+ ],
10
+ "model_max_length": 131072,
11
+ "tokenizer_class": "PreTrainedTokenizerFast"
12
+ }