sgjwong committed on
Commit
948c16b
·
verified ·
1 Parent(s): 5df4c74

https://huggingface.co/sgjwong/babylm_test

Browse files
README.md ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: transformers
3
+ model_name: my-model
4
+ tags:
5
+ - generated_from_trainer
6
+ - trl
7
+ - sft
8
+ licence: license
9
+ ---
10
+
11
+ # Model Card for my-model
12
+
13
+ This model is a fine-tuned version of a base model that was not recorded when this card was generated.
14
+ It has been trained using [TRL](https://github.com/huggingface/trl).
15
+
16
+ ## Quick start
17
+
18
+ ```python
19
+ from transformers import pipeline
20
+
21
+ question = "If you had a time machine, but could only go to the past or the future once and never return, which would you choose and why?"
22
+ generator = pipeline("text-generation", model="sgjwong/babylm_test", device="cuda")
23
+ output = generator([{"role": "user", "content": question}], max_new_tokens=128, return_full_text=False)[0]
24
+ print(output["generated_text"])
25
+ ```
26
+
27
+ ## Training procedure
28
+
29
+
30
+
31
+
32
+
33
+ This model was trained with SFT.
34
+
35
+ ### Framework versions
36
+
37
+ - TRL: 1.0.0
38
+ - Transformers: 5.0.0
39
+ - Pytorch: 2.10.0+cpu
40
+ - Datasets: 4.8.4
41
+ - Tokenizers: 0.22.2
42
+
43
+ ## Citations
44
+
45
+
46
+
47
+ Cite TRL as:
48
+
49
+ ```bibtex
50
+ @software{vonwerra2020trl,
51
+ title = {{TRL: Transformers Reinforcement Learning}},
52
+ author = {von Werra, Leandro and Belkada, Younes and Tunstall, Lewis and Beeching, Edward and Thrush, Tristan and Lambert, Nathan and Huang, Shengyi and Rasul, Kashif and Gallouédec, Quentin},
53
+ license = {Apache-2.0},
54
+ url = {https://github.com/huggingface/trl},
55
+ year = {2020}
56
+ }
57
+ ```
chat_template.jinja ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ {{ bos_token }}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if message['role'] == 'user' %}{{ '<|user|>
2
+ ' + message['content'] + '<|end|>
3
+ ' }}{% elif message['role'] == 'assistant' %}{{ '<|bot|>
4
+ ' + message['content'] + '<|end|>
5
+ ' }}{% else %}{{ raise_exception('Only user and assistant roles are supported!') }}{% endif %}{% endfor %}{{ eos_token }}
config.json ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "LlamaForCausalLM"
4
+ ],
5
+ "attention_bias": false,
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 0,
8
+ "dtype": "float32",
9
+ "eos_token_id": 2,
10
+ "head_dim": 64,
11
+ "hidden_act": "silu",
12
+ "hidden_size": 512,
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 1024,
15
+ "max_position_embeddings": 512,
16
+ "mlp_bias": false,
17
+ "model_type": "llama",
18
+ "num_attention_heads": 8,
19
+ "num_hidden_layers": 8,
20
+ "num_key_value_heads": 8,
21
+ "pad_token_id": 1,
22
+ "pretraining_tp": 1,
23
+ "rms_norm_eps": 1e-06,
24
+ "rope_parameters": {
25
+ "rope_theta": 10000.0,
26
+ "rope_type": "default"
27
+ },
28
+ "tie_word_embeddings": false,
29
+ "transformers_version": "5.0.0",
30
+ "use_cache": false,
31
+ "vocab_size": 761
32
+ }
generation_config.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 0,
4
+ "eos_token_id": [
5
+ 2
6
+ ],
7
+ "output_attentions": false,
8
+ "output_hidden_states": false,
9
+ "pad_token_id": 1,
10
+ "transformers_version": "5.0.0",
11
+ "use_cache": true
12
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf2058bbb245ca337c5dc82cd27d4f5a1b6942508782da20f36668b2275dcea5
3
+ size 87046088
tokenizer.json ADDED
@@ -0,0 +1,2861 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "1.0",
3
+ "truncation": null,
4
+ "padding": null,
5
+ "added_tokens": [
6
+ {
7
+ "id": 0,
8
+ "content": "<s>",
9
+ "single_word": false,
10
+ "lstrip": false,
11
+ "rstrip": false,
12
+ "normalized": false,
13
+ "special": true
14
+ },
15
+ {
16
+ "id": 1,
17
+ "content": "<pad>",
18
+ "single_word": false,
19
+ "lstrip": false,
20
+ "rstrip": false,
21
+ "normalized": false,
22
+ "special": true
23
+ },
24
+ {
25
+ "id": 2,
26
+ "content": "</s>",
27
+ "single_word": false,
28
+ "lstrip": false,
29
+ "rstrip": false,
30
+ "normalized": false,
31
+ "special": true
32
+ },
33
+ {
34
+ "id": 3,
35
+ "content": "<unk>",
36
+ "single_word": false,
37
+ "lstrip": false,
38
+ "rstrip": false,
39
+ "normalized": false,
40
+ "special": true
41
+ },
42
+ {
43
+ "id": 4,
44
+ "content": "<mask>",
45
+ "single_word": false,
46
+ "lstrip": false,
47
+ "rstrip": false,
48
+ "normalized": false,
49
+ "special": true
50
+ },
51
+ {
52
+ "id": 5,
53
+ "content": "<|user|>",
54
+ "single_word": false,
55
+ "lstrip": false,
56
+ "rstrip": false,
57
+ "normalized": false,
58
+ "special": true
59
+ },
60
+ {
61
+ "id": 6,
62
+ "content": "<|bot|>",
63
+ "single_word": false,
64
+ "lstrip": false,
65
+ "rstrip": false,
66
+ "normalized": false,
67
+ "special": true
68
+ },
69
+ {
70
+ "id": 7,
71
+ "content": "<|end|>",
72
+ "single_word": false,
73
+ "lstrip": false,
74
+ "rstrip": false,
75
+ "normalized": false,
76
+ "special": true
77
+ }
78
+ ],
79
+ "normalizer": null,
80
+ "pre_tokenizer": {
81
+ "type": "ByteLevel",
82
+ "add_prefix_space": false,
83
+ "trim_offsets": true,
84
+ "use_regex": true
85
+ },
86
+ "post_processor": {
87
+ "type": "ByteLevel",
88
+ "add_prefix_space": true,
89
+ "trim_offsets": false,
90
+ "use_regex": true
91
+ },
92
+ "decoder": {
93
+ "type": "ByteLevel",
94
+ "add_prefix_space": true,
95
+ "trim_offsets": true,
96
+ "use_regex": true
97
+ },
98
+ "model": {
99
+ "type": "BPE",
100
+ "dropout": null,
101
+ "unk_token": null,
102
+ "continuing_subword_prefix": null,
103
+ "end_of_word_suffix": null,
104
+ "fuse_unk": false,
105
+ "byte_fallback": false,
106
+ "ignore_merges": false,
107
+ "vocab": {
108
+ "<s>": 0,
109
+ "<pad>": 1,
110
+ "</s>": 2,
111
+ "<unk>": 3,
112
+ "<mask>": 4,
113
+ "<|user|>": 5,
114
+ "<|bot|>": 6,
115
+ "<|end|>": 7,
116
+ "!": 8,
117
+ "\"": 9,
118
+ "#": 10,
119
+ "$": 11,
120
+ "%": 12,
121
+ "&": 13,
122
+ "'": 14,
123
+ "(": 15,
124
+ ")": 16,
125
+ "*": 17,
126
+ "+": 18,
127
+ ",": 19,
128
+ "-": 20,
129
+ ".": 21,
130
+ "/": 22,
131
+ "0": 23,
132
+ "1": 24,
133
+ "2": 25,
134
+ "3": 26,
135
+ "4": 27,
136
+ "5": 28,
137
+ "6": 29,
138
+ "7": 30,
139
+ "8": 31,
140
+ "9": 32,
141
+ ":": 33,
142
+ ";": 34,
143
+ "<": 35,
144
+ "=": 36,
145
+ ">": 37,
146
+ "?": 38,
147
+ "@": 39,
148
+ "A": 40,
149
+ "B": 41,
150
+ "C": 42,
151
+ "D": 43,
152
+ "E": 44,
153
+ "F": 45,
154
+ "G": 46,
155
+ "H": 47,
156
+ "I": 48,
157
+ "J": 49,
158
+ "K": 50,
159
+ "L": 51,
160
+ "M": 52,
161
+ "N": 53,
162
+ "O": 54,
163
+ "P": 55,
164
+ "Q": 56,
165
+ "R": 57,
166
+ "S": 58,
167
+ "T": 59,
168
+ "U": 60,
169
+ "V": 61,
170
+ "W": 62,
171
+ "X": 63,
172
+ "Y": 64,
173
+ "Z": 65,
174
+ "[": 66,
175
+ "\\": 67,
176
+ "]": 68,
177
+ "^": 69,
178
+ "_": 70,
179
+ "`": 71,
180
+ "a": 72,
181
+ "b": 73,
182
+ "c": 74,
183
+ "d": 75,
184
+ "e": 76,
185
+ "f": 77,
186
+ "g": 78,
187
+ "h": 79,
188
+ "i": 80,
189
+ "j": 81,
190
+ "k": 82,
191
+ "l": 83,
192
+ "m": 84,
193
+ "n": 85,
194
+ "o": 86,
195
+ "p": 87,
196
+ "q": 88,
197
+ "r": 89,
198
+ "s": 90,
199
+ "t": 91,
200
+ "u": 92,
201
+ "v": 93,
202
+ "w": 94,
203
+ "x": 95,
204
+ "y": 96,
205
+ "z": 97,
206
+ "{": 98,
207
+ "|": 99,
208
+ "}": 100,
209
+ "~": 101,
210
+ "¡": 102,
211
+ "¢": 103,
212
+ "£": 104,
213
+ "¤": 105,
214
+ "¥": 106,
215
+ "¦": 107,
216
+ "§": 108,
217
+ "¨": 109,
218
+ "©": 110,
219
+ "ª": 111,
220
+ "«": 112,
221
+ "¬": 113,
222
+ "®": 114,
223
+ "¯": 115,
224
+ "°": 116,
225
+ "±": 117,
226
+ "²": 118,
227
+ "³": 119,
228
+ "´": 120,
229
+ "µ": 121,
230
+ "¶": 122,
231
+ "·": 123,
232
+ "¸": 124,
233
+ "¹": 125,
234
+ "º": 126,
235
+ "»": 127,
236
+ "¼": 128,
237
+ "½": 129,
238
+ "¾": 130,
239
+ "¿": 131,
240
+ "À": 132,
241
+ "Á": 133,
242
+ "Â": 134,
243
+ "Ã": 135,
244
+ "Ä": 136,
245
+ "Å": 137,
246
+ "Æ": 138,
247
+ "Ç": 139,
248
+ "È": 140,
249
+ "É": 141,
250
+ "Ê": 142,
251
+ "Ë": 143,
252
+ "Ì": 144,
253
+ "Í": 145,
254
+ "Î": 146,
255
+ "Ï": 147,
256
+ "Ð": 148,
257
+ "Ñ": 149,
258
+ "Ò": 150,
259
+ "Ó": 151,
260
+ "Ô": 152,
261
+ "Õ": 153,
262
+ "Ö": 154,
263
+ "×": 155,
264
+ "Ø": 156,
265
+ "Ù": 157,
266
+ "Ú": 158,
267
+ "Û": 159,
268
+ "Ü": 160,
269
+ "Ý": 161,
270
+ "Þ": 162,
271
+ "ß": 163,
272
+ "à": 164,
273
+ "á": 165,
274
+ "â": 166,
275
+ "ã": 167,
276
+ "ä": 168,
277
+ "å": 169,
278
+ "æ": 170,
279
+ "ç": 171,
280
+ "è": 172,
281
+ "é": 173,
282
+ "ê": 174,
283
+ "ë": 175,
284
+ "ì": 176,
285
+ "í": 177,
286
+ "î": 178,
287
+ "ï": 179,
288
+ "ð": 180,
289
+ "ñ": 181,
290
+ "ò": 182,
291
+ "ó": 183,
292
+ "ô": 184,
293
+ "õ": 185,
294
+ "ö": 186,
295
+ "÷": 187,
296
+ "ø": 188,
297
+ "ù": 189,
298
+ "ú": 190,
299
+ "û": 191,
300
+ "ü": 192,
301
+ "ý": 193,
302
+ "þ": 194,
303
+ "ÿ": 195,
304
+ "Ā": 196,
305
+ "ā": 197,
306
+ "Ă": 198,
307
+ "ă": 199,
308
+ "Ą": 200,
309
+ "ą": 201,
310
+ "Ć": 202,
311
+ "ć": 203,
312
+ "Ĉ": 204,
313
+ "ĉ": 205,
314
+ "Ċ": 206,
315
+ "ċ": 207,
316
+ "Č": 208,
317
+ "č": 209,
318
+ "Ď": 210,
319
+ "ď": 211,
320
+ "Đ": 212,
321
+ "đ": 213,
322
+ "Ē": 214,
323
+ "ē": 215,
324
+ "Ĕ": 216,
325
+ "ĕ": 217,
326
+ "Ė": 218,
327
+ "ė": 219,
328
+ "Ę": 220,
329
+ "ę": 221,
330
+ "Ě": 222,
331
+ "ě": 223,
332
+ "Ĝ": 224,
333
+ "ĝ": 225,
334
+ "Ğ": 226,
335
+ "ğ": 227,
336
+ "Ġ": 228,
337
+ "ġ": 229,
338
+ "Ģ": 230,
339
+ "ģ": 231,
340
+ "Ĥ": 232,
341
+ "ĥ": 233,
342
+ "Ħ": 234,
343
+ "ħ": 235,
344
+ "Ĩ": 236,
345
+ "ĩ": 237,
346
+ "Ī": 238,
347
+ "ī": 239,
348
+ "Ĭ": 240,
349
+ "ĭ": 241,
350
+ "Į": 242,
351
+ "į": 243,
352
+ "İ": 244,
353
+ "ı": 245,
354
+ "IJ": 246,
355
+ "ij": 247,
356
+ "Ĵ": 248,
357
+ "ĵ": 249,
358
+ "Ķ": 250,
359
+ "ķ": 251,
360
+ "ĸ": 252,
361
+ "Ĺ": 253,
362
+ "ĺ": 254,
363
+ "Ļ": 255,
364
+ "ļ": 256,
365
+ "Ľ": 257,
366
+ "ľ": 258,
367
+ "Ŀ": 259,
368
+ "ŀ": 260,
369
+ "Ł": 261,
370
+ "ł": 262,
371
+ "Ń": 263,
372
+ "Ġt": 264,
373
+ "Ġa": 265,
374
+ "Ġth": 266,
375
+ "en": 267,
376
+ "Ġthe": 268,
377
+ "in": 269,
378
+ "Ġs": 270,
379
+ "te": 271,
380
+ "es": 272,
381
+ "or": 273,
382
+ "Ġf": 274,
383
+ "Ġo": 275,
384
+ "er": 276,
385
+ "ent": 277,
386
+ "Ġof": 278,
387
+ "on": 279,
388
+ "Ġc": 280,
389
+ "re": 281,
390
+ "Ġw": 282,
391
+ "ing": 283,
392
+ "it": 284,
393
+ "Ġan": 285,
394
+ "le": 286,
395
+ "Ġp": 287,
396
+ "ce": 288,
397
+ "at": 289,
398
+ "ate": 290,
399
+ "Ġb": 291,
400
+ "ar": 292,
401
+ "Ġin": 293,
402
+ "al": 294,
403
+ "ri": 295,
404
+ "ut": 296,
405
+ "Ġto": 297,
406
+ "Ġm": 298,
407
+ "iv": 299,
408
+ "om": 300,
409
+ "an": 301,
410
+ "Ġd": 302,
411
+ "ence": 303,
412
+ "as": 304,
413
+ "is": 305,
414
+ "Ġg": 306,
415
+ "Ġsent": 307,
416
+ "Ġsentence": 308,
417
+ "et": 309,
418
+ "ll": 310,
419
+ "ow": 311,
420
+ "ct": 312,
421
+ "ion": 313,
422
+ "if": 314,
423
+ "est": 315,
424
+ "us": 316,
425
+ "Ġst": 317,
426
+ "ord": 318,
427
+ "Ġfo": 319,
428
+ "Ġfor": 320,
429
+ "bo": 321,
430
+ "Ġe": 322,
431
+ "Ġh": 323,
432
+ "Ġabo": 324,
433
+ "iven": 325,
434
+ "llow": 326,
435
+ "Ġfollow": 327,
436
+ "Ġabout": 328,
437
+ "Ġfollowing": 329,
438
+ "am": 330,
439
+ "ch": 331,
440
+ "Ġwh": 332,
441
+ "Gen": 333,
442
+ "ic": 334,
443
+ "qu": 335,
444
+ "vi": 336,
445
+ "Ġn": 337,
446
+ "ter": 338,
447
+ "erate": 339,
448
+ "Ġcom": 340,
449
+ "Ġand": 341,
450
+ "Generate": 342,
451
+ "Des": 343,
452
+ "el": 344,
453
+ "ig": 345,
454
+ "ree": 346,
455
+ "ith": 347,
456
+ "rite": 348,
457
+ "dent": 349,
458
+ "im": 350,
459
+ "pl": 351,
460
+ "ro": 352,
461
+ "se": 353,
462
+ "ur": 354,
463
+ "Ġqu": 355,
464
+ "Ġthat": 356,
465
+ "ine": 357,
466
+ "Ġsu": 358,
467
+ "Ġword": 359,
468
+ "Ġwith": 360,
469
+ "its": 361,
470
+ "Ġgiven": 362,
471
+ "be": 363,
472
+ "cri": 364,
473
+ "pe": 365,
474
+ "ist": 366,
475
+ "ify": 367,
476
+ "ew": 368,
477
+ "il": 369,
478
+ "ir": 370,
479
+ "ite": 371,
480
+ "ment": 372,
481
+ "od": 373,
482
+ "ple": 374,
483
+ "res": 375,
484
+ "Ġl": 376,
485
+ "Ġre": 377,
486
+ "Ġle": 378,
487
+ "Ġus": 379,
488
+ "Ġthree": 380,
489
+ "ers": 381,
490
+ "ive": 382,
491
+ "estion": 383,
492
+ "Ġstate": 384,
493
+ "pla": 385,
494
+ "cribe": 386,
495
+ "Write": 387,
496
+ "ak": 388,
497
+ "ed": 389,
498
+ "fer": 390,
499
+ "ge": 391,
500
+ "ou": 392,
501
+ "sw": 393,
502
+ "Ġ\"": 394,
503
+ "Ġu": 395,
504
+ "Ġv": 396,
505
+ "Ġbe": 397,
506
+ "Ġcomp": 398,
507
+ "Describe": 399,
508
+ "Ġquestion": 400,
509
+ "Ex": 401,
510
+ "Wh": 402,
511
+ "ay": 403,
512
+ "are": 404,
513
+ "ces": 405,
514
+ "las": 406,
515
+ "th": 407,
516
+ "to": 408,
517
+ "tic": 409,
518
+ "xt": 410,
519
+ "Ġ1": 411,
520
+ "Ġj": 412,
521
+ "Ġx": 413,
522
+ "Ġy": 414,
523
+ "Ġits": 415,
524
+ "Ġty": 416,
525
+ "Ġthis": 417,
526
+ "ory": 418,
527
+ "Ġansw": 419,
528
+ "Ġpo": 420,
529
+ "Ġpar": 421,
530
+ "Ġpro": 422,
531
+ "ome": 423,
532
+ "Ġstory": 424,
533
+ "ame": 425,
534
+ "dentify": 426,
535
+ "plain": 427,
536
+ "Explain": 428,
537
+ "What": 429,
538
+ "lass": 430,
539
+ "Given": 431,
540
+ "Identify": 432,
541
+ "List": 433,
542
+ "ad": 434,
543
+ "ach": 435,
544
+ "ci": 436,
545
+ "ect": 437,
546
+ "ms": 438,
547
+ "ovi": 439,
548
+ "ram": 440,
549
+ "ve": 441,
550
+ "we": 442,
551
+ "Ġis": 443,
552
+ "Ġte": 444,
553
+ "Ġap": 445,
554
+ "Ġar": 446,
555
+ "Ġat": 447,
556
+ "Ġare": 448,
557
+ "Ġtheir": 449,
558
+ "Ġfa": 450,
559
+ "Ġch": 451,
560
+ "Ġcon": 452,
561
+ "reate": 453,
562
+ "Ġwas": 454,
563
+ "ation": 455,
564
+ "Ġbet": 456,
565
+ "Ġbest": 457,
566
+ "Ġinto": 458,
567
+ "all": 459,
568
+ "Ġmovi": 460,
569
+ "Ġde": 461,
570
+ "Ġdif": 462,
571
+ "ust": 463,
572
+ "Ġex": 464,
573
+ "Ġhe": 465,
574
+ "Ġwho": 466,
575
+ "Ġwhat": 467,
576
+ "Desig": 468,
577
+ "Ġwords": 469,
578
+ "Ġstatement": 470,
579
+ "ake": 471,
580
+ "Ġup": 472,
581
+ "Ġquestions": 473,
582
+ "Ġtype": 474,
583
+ "Ġanswer": 475,
584
+ "Ġpart": 476,
585
+ "Ġmovie": 477,
586
+ "Ġdiffer": 478,
587
+ "Design": 479,
588
+ "\".": 480,
589
+ "'t": 481,
590
+ "Create": 482,
591
+ "Fin": 483,
592
+ "Name": 484,
593
+ "Out": 485,
594
+ "Re": 486,
595
+ "St": 487,
596
+ "Su": 488,
597
+ "ab": 489,
598
+ "age": 490,
599
+ "bs": 491,
600
+ "cc": 492,
601
+ "de": 493,
602
+ "dit": 494,
603
+ "em": 495,
604
+ "eo": 496,
605
+ "ff": 497,
606
+ "gg": 498,
607
+ "ges": 499,
608
+ "gan": 500,
609
+ "gree": 501,
610
+ "iz": 502,
611
+ "ident": 503,
612
+ "ks": 504,
613
+ "line": 505,
614
+ "mm": 506,
615
+ "ning": 507,
616
+ "ob": 508,
617
+ "oc": 509,
618
+ "ol": 510,
619
+ "ot": 511,
620
+ "ose": 512,
621
+ "por": 513,
622
+ "pose": 514,
623
+ "ry": 515,
624
+ "ue": 516,
625
+ "ul": 517,
626
+ "un": 518,
627
+ "ure": 519,
628
+ "âĢ": 520,
629
+ "Ġ3": 521,
630
+ "Ġ=": 522,
631
+ "ĠU": 523,
632
+ "Ġk": 524,
633
+ "Ġor": 525,
634
+ "Ġif": 526,
635
+ "Ġim": 527,
636
+ "Ġite": 528,
637
+ "Ġtit": 529,
638
+ "Ġas": 530,
639
+ "Ġall": 531,
640
+ "Ġacc": 532,
641
+ "ene": 533,
642
+ "Ġthem": 534,
643
+ "Ġsome": 535,
644
+ "Ġon": 536,
645
+ "Ġcor": 537,
646
+ "Ġcan": 538,
647
+ "Ġclass": 539,
648
+ "Ġwe": 540,
649
+ "lect": 541,
650
+ "Ġpres": 542,
651
+ "Ġpeo": 543,
652
+ "ative": 544,
653
+ "Ġinter": 545,
654
+ "als": 546,
655
+ "alth": 547,
656
+ "Ġmake": 548,
657
+ "ant": 549,
658
+ "Ġdon": 550,
659
+ "Ġgram": 551,
660
+ "eth": 552,
661
+ "Ġhel": 553,
662
+ "vice": 554,
663
+ "igh": 555,
664
+ "Ġref": 556,
665
+ "Ġused": 557,
666
+ "ticle": 558,
667
+ "Ġjob": 559,
668
+ "Ġyou": 560,
669
+ "Ġpoem": 561,
670
+ "ween": 562,
671
+ "Ġapp": 563,
672
+ "Ġarticle": 564,
673
+ "Ġbetween": 565,
674
+ "Ġhealth": 566,
675
+ "Find": 567,
676
+ "port": 568,
677
+ "Ġtitle": 569,
678
+ "Ġpresident": 570,
679
+ "Ġpeople": 571,
680
+ "Ġgramm": 572,
681
+ "'s": 573,
682
+ "Com": 574,
683
+ "Class": 575,
684
+ "Edit": 576,
685
+ "In": 577,
686
+ "Rew": 578,
687
+ "Se": 579,
688
+ "Th": 580,
689
+ "Tw": 581,
690
+ "cy": 582,
691
+ "di": 583,
692
+ "ech": 584,
693
+ "for": 585,
694
+ "fits": 586,
695
+ "gu": 587,
696
+ "gy": 588,
697
+ "hen": 589,
698
+ "hare": 590,
699
+ "ik": 591,
700
+ "ix": 592,
701
+ "ice": 593,
702
+ "ill": 594,
703
+ "ide": 595,
704
+ "ket": 596,
705
+ "lo": 597,
706
+ "mon": 598,
707
+ "mine": 599,
708
+ "ner": 600,
709
+ "now": 601,
710
+ "os": 602,
711
+ "our": 603,
712
+ "pt": 604,
713
+ "pon": 605,
714
+ "put": 606,
715
+ "rom": 607,
716
+ "ran": 608,
717
+ "ste": 609,
718
+ "ting": 610,
719
+ "uter": 611,
720
+ "uil": 612,
721
+ "ver": 613,
722
+ "ving": 614,
723
+ "vel": 615,
724
+ "vol": 616,
725
+ "Ġ-": 617,
726
+ "Ġ0": 618,
727
+ "Ġ4": 619,
728
+ "ĠA": 620,
729
+ "ĠC": 621,
730
+ "ĠE": 622,
731
+ "ĠG": 623,
732
+ "Ġro": 624,
733
+ "Ġres": 625,
734
+ "ĠSt": 626,
735
+ "ĠTw": 627,
736
+ "Ġtas": 628,
737
+ "Ġad": 629,
738
+ "Ġal": 630,
739
+ "Ġaut": 631,
740
+ "Ġact": 632,
741
+ "enges": 633,
742
+ "ines": 634,
743
+ "Ġsc": 635,
744
+ "Ġso": 636,
745
+ "Ġson": 637,
746
+ "Ġset": 638,
747
+ "Ġspe": 639,
748
+ "Ġsci": 640,
749
+ "Ġslo": 641,
750
+ "text": 642,
751
+ "orks": 643,
752
+ "Ġfig": 644,
753
+ "Ġfun": 645,
754
+ "erb": 646,
755
+ "ere": 647,
756
+ "ents": 648,
757
+ "entif": 649,
758
+ "one": 650,
759
+ "onents": 651,
760
+ "Ġcat": 652,
761
+ "Ġcar": 653,
762
+ "Ġcou": 654,
763
+ "rect": 655,
764
+ "redi": 656,
765
+ "itative": 657,
766
+ "Ġany": 658,
767
+ "lement": 659,
768
+ "Ġpri": 660,
769
+ "Ġpas": 661,
770
+ "atic": 662,
771
+ "ated": 663,
772
+ "Ġbl": 664,
773
+ "Ġby": 665,
774
+ "Ġbene": 666,
775
+ "Ġbuil": 667,
776
+ "ard": 668,
777
+ "arning": 669,
778
+ "arket": 670,
779
+ "Ġinvol": 671,
780
+ "Ġme": 672,
781
+ "Ġmod": 673,
782
+ "Ġmach": 674,
783
+ "Ġmarket": 675,
784
+ "ival": 676,
785
+ "ance": 677,
786
+ "angu": 678,
787
+ "Ġdo": 679,
788
+ "Ġdat": 680,
789
+ "astic": 681,
790
+ "Ġgo": 682,
791
+ "esting": 683,
792
+ "order": 684,
793
+ "ording": 685,
794
+ "Ġfood": 686,
795
+ "Ġform": 687,
796
+ "Ġeach": 688,
797
+ "Ġelement": 689,
798
+ "Ġha": 690,
799
+ "Ġhow": 691,
800
+ "ample": 692,
801
+ "Ġwhen": 693,
802
+ "view": 694,
803
+ "Ġne": 695,
804
+ "Ġnew": 696,
805
+ "termine": 697,
806
+ "els": 698,
807
+ "urr": 699,
808
+ "Ġsumm": 700,
809
+ "Ġlangu": 701,
810
+ "Ġrel": 702,
811
+ "Ġlearning": 703,
812
+ "Ġusing": 704,
813
+ "erson": 705,
814
+ "Ġun": 706,
815
+ "Ġval": 707,
816
+ "Ġverb": 708,
817
+ "Ġcomputer": 709,
818
+ "Ġcomponents": 710,
819
+ "ays": 711,
820
+ "cess": 712,
821
+ "Ġtext": 713,
822
+ "Ġfact": 714,
823
+ "Ġchall": 715,
824
+ "Ġcontext": 716,
825
+ "ally": 717,
826
+ "Ġexample": 718,
827
+ "Ġparts": 719,
828
+ "Ġdifference": 720,
829
+ "Output": 721,
830
+ "Sugg": 722,
831
+ "bsite": 723,
832
+ "ffect": 724,
833
+ "ize": 725,
834
+ "ular": 726,
835
+ "ĠUS": 727,
836
+ "Ġknow": 728,
837
+ "Ġimport": 729,
838
+ "Ġitems": 730,
839
+ "Ġaccording": 731,
840
+ "Ġcorrect": 732,
841
+ "Ġwebsite": 733,
842
+ "Ġinteresting": 734,
843
+ "Ġhelp": 735,
844
+ "ight": 736,
845
+ "Ġgrammatic": 737,
846
+ "Compose": 738,
847
+ "Classify": 739,
848
+ "Rewrite": 740,
849
+ "The": 741,
850
+ "form": 742,
851
+ "Ġtask": 743,
852
+ "Ġactive": 744,
853
+ "Ġsong": 745,
854
+ "Ġspeech": 746,
855
+ "Ġscientif": 747,
856
+ "Ġslogan": 748,
857
+ "redict": 749,
858
+ "Ġbenefits": 750,
859
+ "Ġinvolving": 751,
860
+ "Ġmodels": 752,
861
+ "Ġmachine": 753,
862
+ "Ġelements": 754,
863
+ "Ġsummer": 755,
864
+ "Ġlanguage": 756,
865
+ "Ġchallenges": 757,
866
+ "Suggest": 758,
867
+ "Ġgrammatical": 759,
868
+ "Ġscientific": 760
869
+ },
870
+ "merges": [
871
+ [
872
+ "Ġ",
873
+ "t"
874
+ ],
875
+ [
876
+ "Ġ",
877
+ "a"
878
+ ],
879
+ [
880
+ "Ġt",
881
+ "h"
882
+ ],
883
+ [
884
+ "e",
885
+ "n"
886
+ ],
887
+ [
888
+ "Ġth",
889
+ "e"
890
+ ],
891
+ [
892
+ "i",
893
+ "n"
894
+ ],
895
+ [
896
+ "Ġ",
897
+ "s"
898
+ ],
899
+ [
900
+ "t",
901
+ "e"
902
+ ],
903
+ [
904
+ "e",
905
+ "s"
906
+ ],
907
+ [
908
+ "o",
909
+ "r"
910
+ ],
911
+ [
912
+ "Ġ",
913
+ "f"
914
+ ],
915
+ [
916
+ "Ġ",
917
+ "o"
918
+ ],
919
+ [
920
+ "e",
921
+ "r"
922
+ ],
923
+ [
924
+ "en",
925
+ "t"
926
+ ],
927
+ [
928
+ "Ġo",
929
+ "f"
930
+ ],
931
+ [
932
+ "o",
933
+ "n"
934
+ ],
935
+ [
936
+ "Ġ",
937
+ "c"
938
+ ],
939
+ [
940
+ "r",
941
+ "e"
942
+ ],
943
+ [
944
+ "Ġ",
945
+ "w"
946
+ ],
947
+ [
948
+ "in",
949
+ "g"
950
+ ],
951
+ [
952
+ "i",
953
+ "t"
954
+ ],
955
+ [
956
+ "Ġa",
957
+ "n"
958
+ ],
959
+ [
960
+ "l",
961
+ "e"
962
+ ],
963
+ [
964
+ "Ġ",
965
+ "p"
966
+ ],
967
+ [
968
+ "c",
969
+ "e"
970
+ ],
971
+ [
972
+ "a",
973
+ "t"
974
+ ],
975
+ [
976
+ "a",
977
+ "te"
978
+ ],
979
+ [
980
+ "Ġ",
981
+ "b"
982
+ ],
983
+ [
984
+ "a",
985
+ "r"
986
+ ],
987
+ [
988
+ "Ġ",
989
+ "in"
990
+ ],
991
+ [
992
+ "a",
993
+ "l"
994
+ ],
995
+ [
996
+ "r",
997
+ "i"
998
+ ],
999
+ [
1000
+ "u",
1001
+ "t"
1002
+ ],
1003
+ [
1004
+ "Ġt",
1005
+ "o"
1006
+ ],
1007
+ [
1008
+ "Ġ",
1009
+ "m"
1010
+ ],
1011
+ [
1012
+ "i",
1013
+ "v"
1014
+ ],
1015
+ [
1016
+ "o",
1017
+ "m"
1018
+ ],
1019
+ [
1020
+ "a",
1021
+ "n"
1022
+ ],
1023
+ [
1024
+ "Ġ",
1025
+ "d"
1026
+ ],
1027
+ [
1028
+ "en",
1029
+ "ce"
1030
+ ],
1031
+ [
1032
+ "a",
1033
+ "s"
1034
+ ],
1035
+ [
1036
+ "i",
1037
+ "s"
1038
+ ],
1039
+ [
1040
+ "Ġ",
1041
+ "g"
1042
+ ],
1043
+ [
1044
+ "Ġs",
1045
+ "ent"
1046
+ ],
1047
+ [
1048
+ "Ġsent",
1049
+ "ence"
1050
+ ],
1051
+ [
1052
+ "e",
1053
+ "t"
1054
+ ],
1055
+ [
1056
+ "l",
1057
+ "l"
1058
+ ],
1059
+ [
1060
+ "o",
1061
+ "w"
1062
+ ],
1063
+ [
1064
+ "c",
1065
+ "t"
1066
+ ],
1067
+ [
1068
+ "i",
1069
+ "on"
1070
+ ],
1071
+ [
1072
+ "i",
1073
+ "f"
1074
+ ],
1075
+ [
1076
+ "es",
1077
+ "t"
1078
+ ],
1079
+ [
1080
+ "u",
1081
+ "s"
1082
+ ],
1083
+ [
1084
+ "Ġs",
1085
+ "t"
1086
+ ],
1087
+ [
1088
+ "or",
1089
+ "d"
1090
+ ],
1091
+ [
1092
+ "Ġf",
1093
+ "o"
1094
+ ],
1095
+ [
1096
+ "Ġf",
1097
+ "or"
1098
+ ],
1099
+ [
1100
+ "b",
1101
+ "o"
1102
+ ],
1103
+ [
1104
+ "Ġ",
1105
+ "e"
1106
+ ],
1107
+ [
1108
+ "Ġ",
1109
+ "h"
1110
+ ],
1111
+ [
1112
+ "Ġa",
1113
+ "bo"
1114
+ ],
1115
+ [
1116
+ "iv",
1117
+ "en"
1118
+ ],
1119
+ [
1120
+ "ll",
1121
+ "ow"
1122
+ ],
1123
+ [
1124
+ "Ġfo",
1125
+ "llow"
1126
+ ],
1127
+ [
1128
+ "Ġabo",
1129
+ "ut"
1130
+ ],
1131
+ [
1132
+ "Ġfollow",
1133
+ "ing"
1134
+ ],
1135
+ [
1136
+ "a",
1137
+ "m"
1138
+ ],
1139
+ [
1140
+ "c",
1141
+ "h"
1142
+ ],
1143
+ [
1144
+ "Ġw",
1145
+ "h"
1146
+ ],
1147
+ [
1148
+ "G",
1149
+ "en"
1150
+ ],
1151
+ [
1152
+ "i",
1153
+ "c"
1154
+ ],
1155
+ [
1156
+ "q",
1157
+ "u"
1158
+ ],
1159
+ [
1160
+ "v",
1161
+ "i"
1162
+ ],
1163
+ [
1164
+ "Ġ",
1165
+ "n"
1166
+ ],
1167
+ [
1168
+ "te",
1169
+ "r"
1170
+ ],
1171
+ [
1172
+ "er",
1173
+ "ate"
1174
+ ],
1175
+ [
1176
+ "Ġc",
1177
+ "om"
1178
+ ],
1179
+ [
1180
+ "Ġan",
1181
+ "d"
1182
+ ],
1183
+ [
1184
+ "Gen",
1185
+ "erate"
1186
+ ],
1187
+ [
1188
+ "D",
1189
+ "es"
1190
+ ],
1191
+ [
1192
+ "e",
1193
+ "l"
1194
+ ],
1195
+ [
1196
+ "i",
1197
+ "g"
1198
+ ],
1199
+ [
1200
+ "re",
1201
+ "e"
1202
+ ],
1203
+ [
1204
+ "it",
1205
+ "h"
1206
+ ],
1207
+ [
1208
+ "ri",
1209
+ "te"
1210
+ ],
1211
+ [
1212
+ "d",
1213
+ "ent"
1214
+ ],
1215
+ [
1216
+ "i",
1217
+ "m"
1218
+ ],
1219
+ [
1220
+ "p",
1221
+ "l"
1222
+ ],
1223
+ [
1224
+ "r",
1225
+ "o"
1226
+ ],
1227
+ [
1228
+ "s",
1229
+ "e"
1230
+ ],
1231
+ [
1232
+ "u",
1233
+ "r"
1234
+ ],
1235
+ [
1236
+ "Ġ",
1237
+ "qu"
1238
+ ],
1239
+ [
1240
+ "Ġth",
1241
+ "at"
1242
+ ],
1243
+ [
1244
+ "in",
1245
+ "e"
1246
+ ],
1247
+ [
1248
+ "Ġs",
1249
+ "u"
1250
+ ],
1251
+ [
1252
+ "Ġw",
1253
+ "ord"
1254
+ ],
1255
+ [
1256
+ "Ġw",
1257
+ "ith"
1258
+ ],
1259
+ [
1260
+ "it",
1261
+ "s"
1262
+ ],
1263
+ [
1264
+ "Ġg",
1265
+ "iven"
1266
+ ],
1267
+ [
1268
+ "b",
1269
+ "e"
1270
+ ],
1271
+ [
1272
+ "c",
1273
+ "ri"
1274
+ ],
1275
+ [
1276
+ "p",
1277
+ "e"
1278
+ ],
1279
+ [
1280
+ "is",
1281
+ "t"
1282
+ ],
1283
+ [
1284
+ "if",
1285
+ "y"
1286
+ ],
1287
+ [
1288
+ "e",
1289
+ "w"
1290
+ ],
1291
+ [
1292
+ "i",
1293
+ "l"
1294
+ ],
1295
+ [
1296
+ "i",
1297
+ "r"
1298
+ ],
1299
+ [
1300
+ "i",
1301
+ "te"
1302
+ ],
1303
+ [
1304
+ "m",
1305
+ "ent"
1306
+ ],
1307
+ [
1308
+ "o",
1309
+ "d"
1310
+ ],
1311
+ [
1312
+ "p",
1313
+ "le"
1314
+ ],
1315
+ [
1316
+ "r",
1317
+ "es"
1318
+ ],
1319
+ [
1320
+ "Ġ",
1321
+ "l"
1322
+ ],
1323
+ [
1324
+ "Ġ",
1325
+ "re"
1326
+ ],
1327
+ [
1328
+ "Ġ",
1329
+ "le"
1330
+ ],
1331
+ [
1332
+ "Ġ",
1333
+ "us"
1334
+ ],
1335
+ [
1336
+ "Ġth",
1337
+ "ree"
1338
+ ],
1339
+ [
1340
+ "er",
1341
+ "s"
1342
+ ],
1343
+ [
1344
+ "iv",
1345
+ "e"
1346
+ ],
1347
+ [
1348
+ "est",
1349
+ "ion"
1350
+ ],
1351
+ [
1352
+ "Ġst",
1353
+ "ate"
1354
+ ],
1355
+ [
1356
+ "pl",
1357
+ "a"
1358
+ ],
1359
+ [
1360
+ "cri",
1361
+ "be"
1362
+ ],
1363
+ [
1364
+ "W",
1365
+ "rite"
1366
+ ],
1367
+ [
1368
+ "a",
1369
+ "k"
1370
+ ],
1371
+ [
1372
+ "e",
1373
+ "d"
1374
+ ],
1375
+ [
1376
+ "f",
1377
+ "er"
1378
+ ],
1379
+ [
1380
+ "g",
1381
+ "e"
1382
+ ],
1383
+ [
1384
+ "o",
1385
+ "u"
1386
+ ],
1387
+ [
1388
+ "s",
1389
+ "w"
1390
+ ],
1391
+ [
1392
+ "Ġ",
1393
+ "\""
1394
+ ],
1395
+ [
1396
+ "Ġ",
1397
+ "u"
1398
+ ],
1399
+ [
1400
+ "Ġ",
1401
+ "v"
1402
+ ],
1403
+ [
1404
+ "Ġb",
1405
+ "e"
1406
+ ],
1407
+ [
1408
+ "Ġcom",
1409
+ "p"
1410
+ ],
1411
+ [
1412
+ "Des",
1413
+ "cribe"
1414
+ ],
1415
+ [
1416
+ "Ġqu",
1417
+ "estion"
1418
+ ],
1419
+ [
1420
+ "E",
1421
+ "x"
1422
+ ],
1423
+ [
1424
+ "W",
1425
+ "h"
1426
+ ],
1427
+ [
1428
+ "a",
1429
+ "y"
1430
+ ],
1431
+ [
1432
+ "a",
1433
+ "re"
1434
+ ],
1435
+ [
1436
+ "c",
1437
+ "es"
1438
+ ],
1439
+ [
1440
+ "l",
1441
+ "as"
1442
+ ],
1443
+ [
1444
+ "t",
1445
+ "h"
1446
+ ],
1447
+ [
1448
+ "t",
1449
+ "o"
1450
+ ],
1451
+ [
1452
+ "t",
1453
+ "ic"
1454
+ ],
1455
+ [
1456
+ "x",
1457
+ "t"
1458
+ ],
1459
+ [
1460
+ "Ġ",
1461
+ "1"
1462
+ ],
1463
+ [
1464
+ "Ġ",
1465
+ "j"
1466
+ ],
1467
+ [
1468
+ "Ġ",
1469
+ "x"
1470
+ ],
1471
+ [
1472
+ "Ġ",
1473
+ "y"
1474
+ ],
1475
+ [
1476
+ "Ġ",
1477
+ "its"
1478
+ ],
1479
+ [
1480
+ "Ġt",
1481
+ "y"
1482
+ ],
1483
+ [
1484
+ "Ġth",
1485
+ "is"
1486
+ ],
1487
+ [
1488
+ "or",
1489
+ "y"
1490
+ ],
1491
+ [
1492
+ "Ġan",
1493
+ "sw"
1494
+ ],
1495
+ [
1496
+ "Ġp",
1497
+ "o"
1498
+ ],
1499
+ [
1500
+ "Ġp",
1501
+ "ar"
1502
+ ],
1503
+ [
1504
+ "Ġp",
1505
+ "ro"
1506
+ ],
1507
+ [
1508
+ "om",
1509
+ "e"
1510
+ ],
1511
+ [
1512
+ "Ġst",
1513
+ "ory"
1514
+ ],
1515
+ [
1516
+ "am",
1517
+ "e"
1518
+ ],
1519
+ [
1520
+ "dent",
1521
+ "ify"
1522
+ ],
1523
+ [
1524
+ "pla",
1525
+ "in"
1526
+ ],
1527
+ [
1528
+ "Ex",
1529
+ "plain"
1530
+ ],
1531
+ [
1532
+ "Wh",
1533
+ "at"
1534
+ ],
1535
+ [
1536
+ "las",
1537
+ "s"
1538
+ ],
1539
+ [
1540
+ "G",
1541
+ "iven"
1542
+ ],
1543
+ [
1544
+ "I",
1545
+ "dentify"
1546
+ ],
1547
+ [
1548
+ "L",
1549
+ "ist"
1550
+ ],
1551
+ [
1552
+ "a",
1553
+ "d"
1554
+ ],
1555
+ [
1556
+ "a",
1557
+ "ch"
1558
+ ],
1559
+ [
1560
+ "c",
1561
+ "i"
1562
+ ],
1563
+ [
1564
+ "e",
1565
+ "ct"
1566
+ ],
1567
+ [
1568
+ "m",
1569
+ "s"
1570
+ ],
1571
+ [
1572
+ "o",
1573
+ "vi"
1574
+ ],
1575
+ [
1576
+ "r",
1577
+ "am"
1578
+ ],
1579
+ [
1580
+ "v",
1581
+ "e"
1582
+ ],
1583
+ [
1584
+ "w",
1585
+ "e"
1586
+ ],
1587
+ [
1588
+ "Ġ",
1589
+ "is"
1590
+ ],
1591
+ [
1592
+ "Ġt",
1593
+ "e"
1594
+ ],
1595
+ [
1596
+ "Ġa",
1597
+ "p"
1598
+ ],
1599
+ [
1600
+ "Ġa",
1601
+ "r"
1602
+ ],
1603
+ [
1604
+ "Ġa",
1605
+ "t"
1606
+ ],
1607
+ [
1608
+ "Ġa",
1609
+ "re"
1610
+ ],
1611
+ [
1612
+ "Ġthe",
1613
+ "ir"
1614
+ ],
1615
+ [
1616
+ "Ġf",
1617
+ "a"
1618
+ ],
1619
+ [
1620
+ "Ġc",
1621
+ "h"
1622
+ ],
1623
+ [
1624
+ "Ġc",
1625
+ "on"
1626
+ ],
1627
+ [
1628
+ "re",
1629
+ "ate"
1630
+ ],
1631
+ [
1632
+ "Ġw",
1633
+ "as"
1634
+ ],
1635
+ [
1636
+ "at",
1637
+ "ion"
1638
+ ],
1639
+ [
1640
+ "Ġb",
1641
+ "et"
1642
+ ],
1643
+ [
1644
+ "Ġb",
1645
+ "est"
1646
+ ],
1647
+ [
1648
+ "Ġin",
1649
+ "to"
1650
+ ],
1651
+ [
1652
+ "al",
1653
+ "l"
1654
+ ],
1655
+ [
1656
+ "Ġm",
1657
+ "ovi"
1658
+ ],
1659
+ [
1660
+ "Ġd",
1661
+ "e"
1662
+ ],
1663
+ [
1664
+ "Ġd",
1665
+ "if"
1666
+ ],
1667
+ [
1668
+ "us",
1669
+ "t"
1670
+ ],
1671
+ [
1672
+ "Ġe",
1673
+ "x"
1674
+ ],
1675
+ [
1676
+ "Ġh",
1677
+ "e"
1678
+ ],
1679
+ [
1680
+ "Ġwh",
1681
+ "o"
1682
+ ],
1683
+ [
1684
+ "Ġwh",
1685
+ "at"
1686
+ ],
1687
+ [
1688
+ "Des",
1689
+ "ig"
1690
+ ],
1691
+ [
1692
+ "Ġword",
1693
+ "s"
1694
+ ],
1695
+ [
1696
+ "Ġstate",
1697
+ "ment"
1698
+ ],
1699
+ [
1700
+ "ak",
1701
+ "e"
1702
+ ],
1703
+ [
1704
+ "Ġu",
1705
+ "p"
1706
+ ],
1707
+ [
1708
+ "Ġquestion",
1709
+ "s"
1710
+ ],
1711
+ [
1712
+ "Ġty",
1713
+ "pe"
1714
+ ],
1715
+ [
1716
+ "Ġansw",
1717
+ "er"
1718
+ ],
1719
+ [
1720
+ "Ġpar",
1721
+ "t"
1722
+ ],
1723
+ [
1724
+ "Ġmovi",
1725
+ "e"
1726
+ ],
1727
+ [
1728
+ "Ġdif",
1729
+ "fer"
1730
+ ],
1731
+ [
1732
+ "Desig",
1733
+ "n"
1734
+ ],
1735
+ [
1736
+ "\"",
1737
+ "."
1738
+ ],
1739
+ [
1740
+ "'",
1741
+ "t"
1742
+ ],
1743
+ [
1744
+ "C",
1745
+ "reate"
1746
+ ],
1747
+ [
1748
+ "F",
1749
+ "in"
1750
+ ],
1751
+ [
1752
+ "N",
1753
+ "ame"
1754
+ ],
1755
+ [
1756
+ "O",
1757
+ "ut"
1758
+ ],
1759
+ [
1760
+ "R",
1761
+ "e"
1762
+ ],
1763
+ [
1764
+ "S",
1765
+ "t"
1766
+ ],
1767
+ [
1768
+ "S",
1769
+ "u"
1770
+ ],
1771
+ [
1772
+ "a",
1773
+ "b"
1774
+ ],
1775
+ [
1776
+ "a",
1777
+ "ge"
1778
+ ],
1779
+ [
1780
+ "b",
1781
+ "s"
1782
+ ],
1783
+ [
1784
+ "c",
1785
+ "c"
1786
+ ],
1787
+ [
1788
+ "d",
1789
+ "e"
1790
+ ],
1791
+ [
1792
+ "d",
1793
+ "it"
1794
+ ],
1795
+ [
1796
+ "e",
1797
+ "m"
1798
+ ],
1799
+ [
1800
+ "e",
1801
+ "o"
1802
+ ],
1803
+ [
1804
+ "f",
1805
+ "f"
1806
+ ],
1807
+ [
1808
+ "g",
1809
+ "g"
1810
+ ],
1811
+ [
1812
+ "g",
1813
+ "es"
1814
+ ],
1815
+ [
1816
+ "g",
1817
+ "an"
1818
+ ],
1819
+ [
1820
+ "g",
1821
+ "ree"
1822
+ ],
1823
+ [
1824
+ "i",
1825
+ "z"
1826
+ ],
1827
+ [
1828
+ "i",
1829
+ "dent"
1830
+ ],
1831
+ [
1832
+ "k",
1833
+ "s"
1834
+ ],
1835
+ [
1836
+ "l",
1837
+ "ine"
1838
+ ],
1839
+ [
1840
+ "m",
1841
+ "m"
1842
+ ],
1843
+ [
1844
+ "n",
1845
+ "ing"
1846
+ ],
1847
+ [
1848
+ "o",
1849
+ "b"
1850
+ ],
1851
+ [
1852
+ "o",
1853
+ "c"
1854
+ ],
1855
+ [
1856
+ "o",
1857
+ "l"
1858
+ ],
1859
+ [
1860
+ "o",
1861
+ "t"
1862
+ ],
1863
+ [
1864
+ "o",
1865
+ "se"
1866
+ ],
1867
+ [
1868
+ "p",
1869
+ "or"
1870
+ ],
1871
+ [
1872
+ "p",
1873
+ "ose"
1874
+ ],
1875
+ [
1876
+ "r",
1877
+ "y"
1878
+ ],
1879
+ [
1880
+ "u",
1881
+ "e"
1882
+ ],
1883
+ [
1884
+ "u",
1885
+ "l"
1886
+ ],
1887
+ [
1888
+ "u",
1889
+ "n"
1890
+ ],
1891
+ [
1892
+ "u",
1893
+ "re"
1894
+ ],
1895
+ [
1896
+ "â",
1897
+ "Ģ"
1898
+ ],
1899
+ [
1900
+ "Ġ",
1901
+ "3"
1902
+ ],
1903
+ [
1904
+ "Ġ",
1905
+ "="
1906
+ ],
1907
+ [
1908
+ "Ġ",
1909
+ "U"
1910
+ ],
1911
+ [
1912
+ "Ġ",
1913
+ "k"
1914
+ ],
1915
+ [
1916
+ "Ġ",
1917
+ "or"
1918
+ ],
1919
+ [
1920
+ "Ġ",
1921
+ "if"
1922
+ ],
1923
+ [
1924
+ "Ġ",
1925
+ "im"
1926
+ ],
1927
+ [
1928
+ "Ġ",
1929
+ "ite"
1930
+ ],
1931
+ [
1932
+ "Ġt",
1933
+ "it"
1934
+ ],
1935
+ [
1936
+ "Ġa",
1937
+ "s"
1938
+ ],
1939
+ [
1940
+ "Ġa",
1941
+ "ll"
1942
+ ],
1943
+ [
1944
+ "Ġa",
1945
+ "cc"
1946
+ ],
1947
+ [
1948
+ "en",
1949
+ "e"
1950
+ ],
1951
+ [
1952
+ "Ġthe",
1953
+ "m"
1954
+ ],
1955
+ [
1956
+ "Ġs",
1957
+ "ome"
1958
+ ],
1959
+ [
1960
+ "Ġo",
1961
+ "n"
1962
+ ],
1963
+ [
1964
+ "Ġc",
1965
+ "or"
1966
+ ],
1967
+ [
1968
+ "Ġc",
1969
+ "an"
1970
+ ],
1971
+ [
1972
+ "Ġc",
1973
+ "lass"
1974
+ ],
1975
+ [
1976
+ "Ġw",
1977
+ "e"
1978
+ ],
1979
+ [
1980
+ "le",
1981
+ "ct"
1982
+ ],
1983
+ [
1984
+ "Ġp",
1985
+ "res"
1986
+ ],
1987
+ [
1988
+ "Ġp",
1989
+ "eo"
1990
+ ],
1991
+ [
1992
+ "at",
1993
+ "ive"
1994
+ ],
1995
+ [
1996
+ "Ġin",
1997
+ "ter"
1998
+ ],
1999
+ [
2000
+ "al",
2001
+ "s"
2002
+ ],
2003
+ [
2004
+ "al",
2005
+ "th"
2006
+ ],
2007
+ [
2008
+ "Ġm",
2009
+ "ake"
2010
+ ],
2011
+ [
2012
+ "an",
2013
+ "t"
2014
+ ],
2015
+ [
2016
+ "Ġd",
2017
+ "on"
2018
+ ],
2019
+ [
2020
+ "Ġg",
2021
+ "ram"
2022
+ ],
2023
+ [
2024
+ "et",
2025
+ "h"
2026
+ ],
2027
+ [
2028
+ "Ġh",
2029
+ "el"
2030
+ ],
2031
+ [
2032
+ "vi",
2033
+ "ce"
2034
+ ],
2035
+ [
2036
+ "ig",
2037
+ "h"
2038
+ ],
2039
+ [
2040
+ "Ġre",
2041
+ "f"
2042
+ ],
2043
+ [
2044
+ "Ġus",
2045
+ "ed"
2046
+ ],
2047
+ [
2048
+ "tic",
2049
+ "le"
2050
+ ],
2051
+ [
2052
+ "Ġj",
2053
+ "ob"
2054
+ ],
2055
+ [
2056
+ "Ġy",
2057
+ "ou"
2058
+ ],
2059
+ [
2060
+ "Ġpo",
2061
+ "em"
2062
+ ],
2063
+ [
2064
+ "we",
2065
+ "en"
2066
+ ],
2067
+ [
2068
+ "Ġap",
2069
+ "p"
2070
+ ],
2071
+ [
2072
+ "Ġar",
2073
+ "ticle"
2074
+ ],
2075
+ [
2076
+ "Ġbet",
2077
+ "ween"
2078
+ ],
2079
+ [
2080
+ "Ġhe",
2081
+ "alth"
2082
+ ],
2083
+ [
2084
+ "Fin",
2085
+ "d"
2086
+ ],
2087
+ [
2088
+ "por",
2089
+ "t"
2090
+ ],
2091
+ [
2092
+ "Ġtit",
2093
+ "le"
2094
+ ],
2095
+ [
2096
+ "Ġpres",
2097
+ "ident"
2098
+ ],
2099
+ [
2100
+ "Ġpeo",
2101
+ "ple"
2102
+ ],
2103
+ [
2104
+ "Ġgram",
2105
+ "m"
2106
+ ],
2107
+ [
2108
+ "'",
2109
+ "s"
2110
+ ],
2111
+ [
2112
+ "C",
2113
+ "om"
2114
+ ],
2115
+ [
2116
+ "C",
2117
+ "lass"
2118
+ ],
2119
+ [
2120
+ "E",
2121
+ "dit"
2122
+ ],
2123
+ [
2124
+ "I",
2125
+ "n"
2126
+ ],
2127
+ [
2128
+ "R",
2129
+ "ew"
2130
+ ],
2131
+ [
2132
+ "S",
2133
+ "e"
2134
+ ],
2135
+ [
2136
+ "T",
2137
+ "h"
2138
+ ],
2139
+ [
2140
+ "T",
2141
+ "w"
2142
+ ],
2143
+ [
2144
+ "c",
2145
+ "y"
2146
+ ],
2147
+ [
2148
+ "d",
2149
+ "i"
2150
+ ],
2151
+ [
2152
+ "e",
2153
+ "ch"
2154
+ ],
2155
+ [
2156
+ "f",
2157
+ "or"
2158
+ ],
2159
+ [
2160
+ "f",
2161
+ "its"
2162
+ ],
2163
+ [
2164
+ "g",
2165
+ "u"
2166
+ ],
2167
+ [
2168
+ "g",
2169
+ "y"
2170
+ ],
2171
+ [
2172
+ "h",
2173
+ "en"
2174
+ ],
2175
+ [
2176
+ "h",
2177
+ "are"
2178
+ ],
2179
+ [
2180
+ "i",
2181
+ "k"
2182
+ ],
2183
+ [
2184
+ "i",
2185
+ "x"
2186
+ ],
2187
+ [
2188
+ "i",
2189
+ "ce"
2190
+ ],
2191
+ [
2192
+ "i",
2193
+ "ll"
2194
+ ],
2195
+ [
2196
+ "i",
2197
+ "de"
2198
+ ],
2199
+ [
2200
+ "k",
2201
+ "et"
2202
+ ],
2203
+ [
2204
+ "l",
2205
+ "o"
2206
+ ],
2207
+ [
2208
+ "m",
2209
+ "on"
2210
+ ],
2211
+ [
2212
+ "m",
2213
+ "ine"
2214
+ ],
2215
+ [
2216
+ "n",
2217
+ "er"
2218
+ ],
2219
+ [
2220
+ "n",
2221
+ "ow"
2222
+ ],
2223
+ [
2224
+ "o",
2225
+ "s"
2226
+ ],
2227
+ [
2228
+ "o",
2229
+ "ur"
2230
+ ],
2231
+ [
2232
+ "p",
2233
+ "t"
2234
+ ],
2235
+ [
2236
+ "p",
2237
+ "on"
2238
+ ],
2239
+ [
2240
+ "p",
2241
+ "ut"
2242
+ ],
2243
+ [
2244
+ "r",
2245
+ "om"
2246
+ ],
2247
+ [
2248
+ "r",
2249
+ "an"
2250
+ ],
2251
+ [
2252
+ "s",
2253
+ "te"
2254
+ ],
2255
+ [
2256
+ "t",
2257
+ "ing"
2258
+ ],
2259
+ [
2260
+ "u",
2261
+ "ter"
2262
+ ],
2263
+ [
2264
+ "u",
2265
+ "il"
2266
+ ],
2267
+ [
2268
+ "v",
2269
+ "er"
2270
+ ],
2271
+ [
2272
+ "v",
2273
+ "ing"
2274
+ ],
2275
+ [
2276
+ "v",
2277
+ "el"
2278
+ ],
2279
+ [
2280
+ "v",
2281
+ "ol"
2282
+ ],
2283
+ [
2284
+ "Ġ",
2285
+ "-"
2286
+ ],
2287
+ [
2288
+ "Ġ",
2289
+ "0"
2290
+ ],
2291
+ [
2292
+ "Ġ",
2293
+ "4"
2294
+ ],
2295
+ [
2296
+ "Ġ",
2297
+ "A"
2298
+ ],
2299
+ [
2300
+ "Ġ",
2301
+ "C"
2302
+ ],
2303
+ [
2304
+ "Ġ",
2305
+ "E"
2306
+ ],
2307
+ [
2308
+ "Ġ",
2309
+ "G"
2310
+ ],
2311
+ [
2312
+ "Ġ",
2313
+ "ro"
2314
+ ],
2315
+ [
2316
+ "Ġ",
2317
+ "res"
2318
+ ],
2319
+ [
2320
+ "Ġ",
2321
+ "St"
2322
+ ],
2323
+ [
2324
+ "Ġ",
2325
+ "Tw"
2326
+ ],
2327
+ [
2328
+ "Ġt",
2329
+ "as"
2330
+ ],
2331
+ [
2332
+ "Ġa",
2333
+ "d"
2334
+ ],
2335
+ [
2336
+ "Ġa",
2337
+ "l"
2338
+ ],
2339
+ [
2340
+ "Ġa",
2341
+ "ut"
2342
+ ],
2343
+ [
2344
+ "Ġa",
2345
+ "ct"
2346
+ ],
2347
+ [
2348
+ "en",
2349
+ "ges"
2350
+ ],
2351
+ [
2352
+ "in",
2353
+ "es"
2354
+ ],
2355
+ [
2356
+ "Ġs",
2357
+ "c"
2358
+ ],
2359
+ [
2360
+ "Ġs",
2361
+ "o"
2362
+ ],
2363
+ [
2364
+ "Ġs",
2365
+ "on"
2366
+ ],
2367
+ [
2368
+ "Ġs",
2369
+ "et"
2370
+ ],
2371
+ [
2372
+ "Ġs",
2373
+ "pe"
2374
+ ],
2375
+ [
2376
+ "Ġs",
2377
+ "ci"
2378
+ ],
2379
+ [
2380
+ "Ġs",
2381
+ "lo"
2382
+ ],
2383
+ [
2384
+ "te",
2385
+ "xt"
2386
+ ],
2387
+ [
2388
+ "or",
2389
+ "ks"
2390
+ ],
2391
+ [
2392
+ "Ġf",
2393
+ "ig"
2394
+ ],
2395
+ [
2396
+ "Ġf",
2397
+ "un"
2398
+ ],
2399
+ [
2400
+ "er",
2401
+ "b"
2402
+ ],
2403
+ [
2404
+ "er",
2405
+ "e"
2406
+ ],
2407
+ [
2408
+ "ent",
2409
+ "s"
2410
+ ],
2411
+ [
2412
+ "ent",
2413
+ "if"
2414
+ ],
2415
+ [
2416
+ "on",
2417
+ "e"
2418
+ ],
2419
+ [
2420
+ "on",
2421
+ "ents"
2422
+ ],
2423
+ [
2424
+ "Ġc",
2425
+ "at"
2426
+ ],
2427
+ [
2428
+ "Ġc",
2429
+ "ar"
2430
+ ],
2431
+ [
2432
+ "Ġc",
2433
+ "ou"
2434
+ ],
2435
+ [
2436
+ "re",
2437
+ "ct"
2438
+ ],
2439
+ [
2440
+ "re",
2441
+ "di"
2442
+ ],
2443
+ [
2444
+ "it",
2445
+ "ative"
2446
+ ],
2447
+ [
2448
+ "Ġan",
2449
+ "y"
2450
+ ],
2451
+ [
2452
+ "le",
2453
+ "ment"
2454
+ ],
2455
+ [
2456
+ "Ġp",
2457
+ "ri"
2458
+ ],
2459
+ [
2460
+ "Ġp",
2461
+ "as"
2462
+ ],
2463
+ [
2464
+ "at",
2465
+ "ic"
2466
+ ],
2467
+ [
2468
+ "ate",
2469
+ "d"
2470
+ ],
2471
+ [
2472
+ "Ġb",
2473
+ "l"
2474
+ ],
2475
+ [
2476
+ "Ġb",
2477
+ "y"
2478
+ ],
2479
+ [
2480
+ "Ġb",
2481
+ "ene"
2482
+ ],
2483
+ [
2484
+ "Ġb",
2485
+ "uil"
2486
+ ],
2487
+ [
2488
+ "ar",
2489
+ "d"
2490
+ ],
2491
+ [
2492
+ "ar",
2493
+ "ning"
2494
+ ],
2495
+ [
2496
+ "ar",
2497
+ "ket"
2498
+ ],
2499
+ [
2500
+ "Ġin",
2501
+ "vol"
2502
+ ],
2503
+ [
2504
+ "Ġm",
2505
+ "e"
2506
+ ],
2507
+ [
2508
+ "Ġm",
2509
+ "od"
2510
+ ],
2511
+ [
2512
+ "Ġm",
2513
+ "ach"
2514
+ ],
2515
+ [
2516
+ "Ġm",
2517
+ "arket"
2518
+ ],
2519
+ [
2520
+ "iv",
2521
+ "al"
2522
+ ],
2523
+ [
2524
+ "an",
2525
+ "ce"
2526
+ ],
2527
+ [
2528
+ "an",
2529
+ "gu"
2530
+ ],
2531
+ [
2532
+ "Ġd",
2533
+ "o"
2534
+ ],
2535
+ [
2536
+ "Ġd",
2537
+ "at"
2538
+ ],
2539
+ [
2540
+ "as",
2541
+ "tic"
2542
+ ],
2543
+ [
2544
+ "Ġg",
2545
+ "o"
2546
+ ],
2547
+ [
2548
+ "est",
2549
+ "ing"
2550
+ ],
2551
+ [
2552
+ "ord",
2553
+ "er"
2554
+ ],
2555
+ [
2556
+ "ord",
2557
+ "ing"
2558
+ ],
2559
+ [
2560
+ "Ġfo",
2561
+ "od"
2562
+ ],
2563
+ [
2564
+ "Ġfor",
2565
+ "m"
2566
+ ],
2567
+ [
2568
+ "Ġe",
2569
+ "ach"
2570
+ ],
2571
+ [
2572
+ "Ġe",
2573
+ "lement"
2574
+ ],
2575
+ [
2576
+ "Ġh",
2577
+ "a"
2578
+ ],
2579
+ [
2580
+ "Ġh",
2581
+ "ow"
2582
+ ],
2583
+ [
2584
+ "am",
2585
+ "ple"
2586
+ ],
2587
+ [
2588
+ "Ġwh",
2589
+ "en"
2590
+ ],
2591
+ [
2592
+ "vi",
2593
+ "ew"
2594
+ ],
2595
+ [
2596
+ "Ġn",
2597
+ "e"
2598
+ ],
2599
+ [
2600
+ "Ġn",
2601
+ "ew"
2602
+ ],
2603
+ [
2604
+ "ter",
2605
+ "mine"
2606
+ ],
2607
+ [
2608
+ "el",
2609
+ "s"
2610
+ ],
2611
+ [
2612
+ "ur",
2613
+ "r"
2614
+ ],
2615
+ [
2616
+ "Ġsu",
2617
+ "mm"
2618
+ ],
2619
+ [
2620
+ "Ġl",
2621
+ "angu"
2622
+ ],
2623
+ [
2624
+ "Ġre",
2625
+ "l"
2626
+ ],
2627
+ [
2628
+ "Ġle",
2629
+ "arning"
2630
+ ],
2631
+ [
2632
+ "Ġus",
2633
+ "ing"
2634
+ ],
2635
+ [
2636
+ "ers",
2637
+ "on"
2638
+ ],
2639
+ [
2640
+ "Ġu",
2641
+ "n"
2642
+ ],
2643
+ [
2644
+ "Ġv",
2645
+ "al"
2646
+ ],
2647
+ [
2648
+ "Ġv",
2649
+ "erb"
2650
+ ],
2651
+ [
2652
+ "Ġcomp",
2653
+ "uter"
2654
+ ],
2655
+ [
2656
+ "Ġcomp",
2657
+ "onents"
2658
+ ],
2659
+ [
2660
+ "ay",
2661
+ "s"
2662
+ ],
2663
+ [
2664
+ "ces",
2665
+ "s"
2666
+ ],
2667
+ [
2668
+ "Ġte",
2669
+ "xt"
2670
+ ],
2671
+ [
2672
+ "Ġfa",
2673
+ "ct"
2674
+ ],
2675
+ [
2676
+ "Ġch",
2677
+ "all"
2678
+ ],
2679
+ [
2680
+ "Ġcon",
2681
+ "text"
2682
+ ],
2683
+ [
2684
+ "all",
2685
+ "y"
2686
+ ],
2687
+ [
2688
+ "Ġex",
2689
+ "ample"
2690
+ ],
2691
+ [
2692
+ "Ġpart",
2693
+ "s"
2694
+ ],
2695
+ [
2696
+ "Ġdiffer",
2697
+ "ence"
2698
+ ],
2699
+ [
2700
+ "Out",
2701
+ "put"
2702
+ ],
2703
+ [
2704
+ "Su",
2705
+ "gg"
2706
+ ],
2707
+ [
2708
+ "bs",
2709
+ "ite"
2710
+ ],
2711
+ [
2712
+ "ff",
2713
+ "ect"
2714
+ ],
2715
+ [
2716
+ "iz",
2717
+ "e"
2718
+ ],
2719
+ [
2720
+ "ul",
2721
+ "ar"
2722
+ ],
2723
+ [
2724
+ "ĠU",
2725
+ "S"
2726
+ ],
2727
+ [
2728
+ "Ġk",
2729
+ "now"
2730
+ ],
2731
+ [
2732
+ "Ġim",
2733
+ "port"
2734
+ ],
2735
+ [
2736
+ "Ġite",
2737
+ "ms"
2738
+ ],
2739
+ [
2740
+ "Ġacc",
2741
+ "ording"
2742
+ ],
2743
+ [
2744
+ "Ġcor",
2745
+ "rect"
2746
+ ],
2747
+ [
2748
+ "Ġwe",
2749
+ "bsite"
2750
+ ],
2751
+ [
2752
+ "Ġinter",
2753
+ "esting"
2754
+ ],
2755
+ [
2756
+ "Ġhel",
2757
+ "p"
2758
+ ],
2759
+ [
2760
+ "igh",
2761
+ "t"
2762
+ ],
2763
+ [
2764
+ "Ġgramm",
2765
+ "atic"
2766
+ ],
2767
+ [
2768
+ "Com",
2769
+ "pose"
2770
+ ],
2771
+ [
2772
+ "Class",
2773
+ "ify"
2774
+ ],
2775
+ [
2776
+ "Rew",
2777
+ "rite"
2778
+ ],
2779
+ [
2780
+ "Th",
2781
+ "e"
2782
+ ],
2783
+ [
2784
+ "for",
2785
+ "m"
2786
+ ],
2787
+ [
2788
+ "Ġtas",
2789
+ "k"
2790
+ ],
2791
+ [
2792
+ "Ġact",
2793
+ "ive"
2794
+ ],
2795
+ [
2796
+ "Ġson",
2797
+ "g"
2798
+ ],
2799
+ [
2800
+ "Ġspe",
2801
+ "ech"
2802
+ ],
2803
+ [
2804
+ "Ġsci",
2805
+ "entif"
2806
+ ],
2807
+ [
2808
+ "Ġslo",
2809
+ "gan"
2810
+ ],
2811
+ [
2812
+ "redi",
2813
+ "ct"
2814
+ ],
2815
+ [
2816
+ "Ġbene",
2817
+ "fits"
2818
+ ],
2819
+ [
2820
+ "Ġinvol",
2821
+ "ving"
2822
+ ],
2823
+ [
2824
+ "Ġmod",
2825
+ "els"
2826
+ ],
2827
+ [
2828
+ "Ġmach",
2829
+ "ine"
2830
+ ],
2831
+ [
2832
+ "Ġelement",
2833
+ "s"
2834
+ ],
2835
+ [
2836
+ "Ġsumm",
2837
+ "er"
2838
+ ],
2839
+ [
2840
+ "Ġlangu",
2841
+ "age"
2842
+ ],
2843
+ [
2844
+ "Ġchall",
2845
+ "enges"
2846
+ ],
2847
+ [
2848
+ "Sugg",
2849
+ "est"
2850
+ ],
2851
+ [
2852
+ "Ġgrammatic",
2853
+ "al"
2854
+ ],
2855
+ [
2856
+ "Ġscientif",
2857
+ "ic"
2858
+ ]
2859
+ ]
2860
+ }
2861
+ }
tokenizer_config.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "backend": "tokenizers",
3
+ "bos_token": "<s>",
4
+ "eos_token": "</s>",
5
+ "extra_special_tokens": [
6
+ "<|user|>",
7
+ "<|bot|>",
8
+ "<|end|>"
9
+ ],
10
+ "mask_token": "<mask>",
11
+ "model_max_length": 1000000000000000019884624838656,
12
+ "pad_token": "<pad>",
13
+ "tokenizer_class": "TokenizersBackend",
14
+ "unk_token": "<unk>"
15
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afde10076c965ae0b6510c01e669607fe10be70da8b4661ee97a0bcf71ca0547
3
+ size 5585