kenkwon committed on
Commit
52de6a4
·
verified ·
1 Parent(s): e802563

Update spaCy pipeline

Browse files
.gitattributes CHANGED
@@ -33,3 +33,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ ner/model filter=lfs diff=lfs merge=lfs -text
37
+ tok2vec/model filter=lfs diff=lfs merge=lfs -text
38
+ vi_task_ner-any-py3-none-any.whl filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - spacy
4
+ - token-classification
5
+ language:
6
+ - vi
7
+ model-index:
8
+ - name: vi_task_ner
9
+ results:
10
+ - task:
11
+ name: NER
12
+ type: token-classification
13
+ metrics:
14
+ - name: NER Precision
15
+ type: precision
16
+ value: 0.8979591837
17
+ - name: NER Recall
18
+ type: recall
19
+ value: 0.8979591837
20
+ - name: NER F Score
21
+ type: f_score
22
+ value: 0.8979591837
23
+ ---
24
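+ This is a Vietnamese named-entity recognition (NER) model for tasks. It labels `DATE`, `LOCATION`, `PERSON`, `TASK`, and `TIME` entities.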
25
+
26
+ | Feature | Description |
27
+ | --- | --- |
28
+ | **Name** | `vi_task_ner` |
29
+ | **Version** | `0.0.0` |
30
+ | **spaCy** | `>=3.7.5,<3.8.0` |
31
+ | **Default Pipeline** | `tok2vec`, `ner` |
32
+ | **Components** | `tok2vec`, `ner` |
33
+ | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
34
+ | **Sources** | n/a |
35
+ | **License** | n/a |
36
+ | **Author** | Chánh Hỷ |
37
+
38
+ ### Label Scheme
39
+
40
+ <details>
41
+
42
+ <summary>View label scheme (5 labels for 1 component)</summary>
43
+
44
+ | Component | Labels |
45
+ | --- | --- |
46
+ | **`ner`** | `DATE`, `LOCATION`, `PERSON`, `TASK`, `TIME` |
47
+
48
+ </details>
49
+
50
+ ### Accuracy
51
+
52
+ | Type | Score |
53
+ | --- | --- |
54
+ | `ENTS_F` | 89.80 |
55
+ | `ENTS_P` | 89.80 |
56
+ | `ENTS_R` | 89.80 |
57
+ | `TOK2VEC_LOSS` | 196.58 |
58
+ | `NER_LOSS` | 122.22 |
config.cfg ADDED
@@ -0,0 +1,145 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [paths]
2
+ train = "train.spacy"
3
+ dev = "dev.spacy"
4
+ vectors = null
5
+ init_tok2vec = null
6
+
7
+ [system]
8
+ gpu_allocator = null
9
+ seed = 0
10
+
11
+ [nlp]
12
+ lang = "xx"
13
+ pipeline = ["tok2vec","ner"]
14
+ batch_size = 1000
15
+ disabled = []
16
+ before_creation = null
17
+ after_creation = null
18
+ after_pipeline_creation = null
19
+ tokenizer = {"@tokenizers":"spacy.Tokenizer.v1"}
20
+ vectors = {"@vectors":"spacy.Vectors.v1"}
21
+
22
+ [components]
23
+
24
+ [components.ner]
25
+ factory = "ner"
26
+ incorrect_spans_key = null
27
+ moves = null
28
+ scorer = {"@scorers":"spacy.ner_scorer.v1"}
29
+ update_with_oracle_cut_size = 100
30
+
31
+ [components.ner.model]
32
+ @architectures = "spacy.TransitionBasedParser.v2"
33
+ state_type = "ner"
34
+ extra_state_tokens = false
35
+ hidden_width = 64
36
+ maxout_pieces = 2
37
+ use_upper = true
38
+ nO = null
39
+
40
+ [components.ner.model.tok2vec]
41
+ @architectures = "spacy.Tok2VecListener.v1"
42
+ width = ${components.tok2vec.model.encode.width}
43
+ upstream = "*"
44
+
45
+ [components.tok2vec]
46
+ factory = "tok2vec"
47
+
48
+ [components.tok2vec.model]
49
+ @architectures = "spacy.Tok2Vec.v2"
50
+
51
+ [components.tok2vec.model.embed]
52
+ @architectures = "spacy.MultiHashEmbed.v2"
53
+ width = ${components.tok2vec.model.encode.width}
54
+ attrs = ["NORM","PREFIX","SUFFIX","SHAPE"]
55
+ rows = [5000,1000,2500,2500]
56
+ include_static_vectors = false
57
+
58
+ [components.tok2vec.model.encode]
59
+ @architectures = "spacy.MaxoutWindowEncoder.v2"
60
+ width = 96
61
+ depth = 4
62
+ window_size = 1
63
+ maxout_pieces = 3
64
+
65
+ [corpora]
66
+
67
+ [corpora.dev]
68
+ @readers = "spacy.Corpus.v1"
69
+ path = ${paths.dev}
70
+ max_length = 0
71
+ gold_preproc = false
72
+ limit = 0
73
+ augmenter = null
74
+
75
+ [corpora.train]
76
+ @readers = "spacy.Corpus.v1"
77
+ path = ${paths.train}
78
+ max_length = 0
79
+ gold_preproc = false
80
+ limit = 0
81
+ augmenter = null
82
+
83
+ [training]
84
+ dev_corpus = "corpora.dev"
85
+ train_corpus = "corpora.train"
86
+ seed = ${system.seed}
87
+ gpu_allocator = ${system.gpu_allocator}
88
+ dropout = 0.1
89
+ accumulate_gradient = 1
90
+ patience = 1600
91
+ max_epochs = 0
92
+ max_steps = 20000
93
+ eval_frequency = 200
94
+ frozen_components = []
95
+ annotating_components = []
96
+ before_to_disk = null
97
+ before_update = null
98
+
99
+ [training.batcher]
100
+ @batchers = "spacy.batch_by_words.v1"
101
+ discard_oversize = false
102
+ tolerance = 0.2
103
+ get_length = null
104
+
105
+ [training.batcher.size]
106
+ @schedules = "compounding.v1"
107
+ start = 100
108
+ stop = 1000
109
+ compound = 1.001
110
+ t = 0.0
111
+
112
+ [training.logger]
113
+ @loggers = "spacy.ConsoleLogger.v1"
114
+ progress_bar = false
115
+
116
+ [training.optimizer]
117
+ @optimizers = "Adam.v1"
118
+ beta1 = 0.9
119
+ beta2 = 0.999
120
+ L2_is_weight_decay = true
121
+ L2 = 0.01
122
+ grad_clip = 1.0
123
+ use_averages = false
124
+ eps = 0.00000001
125
+ learn_rate = 0.001
126
+
127
+ [training.score_weights]
128
+ ents_f = 1.0
129
+ ents_p = 0.0
130
+ ents_r = 0.0
131
+ ents_per_type = null
132
+
133
+ [pretraining]
134
+
135
+ [initialize]
136
+ vectors = ${paths.vectors}
137
+ init_tok2vec = ${paths.init_tok2vec}
138
+ vocab_data = null
139
+ lookups = null
140
+ before_init = null
141
+ after_init = null
142
+
143
+ [initialize.components]
144
+
145
+ [initialize.tokenizer]
meta.json ADDED
@@ -0,0 +1,73 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "lang":"vi",
3
+ "name":"task_ner",
4
+ "version":"0.0.0",
5
+ "description":"This is ner model for task",
6
+ "author":"Ch\u00e1nh H\u1ef7",
7
+ "email":"hlchy11997@gmail.com",
8
+ "url":"",
9
+ "license":"",
10
+ "spacy_version":">=3.7.5,<3.8.0",
11
+ "spacy_git_version":"a6d0fc360",
12
+ "vectors":{
13
+ "width":0,
14
+ "vectors":0,
15
+ "keys":0,
16
+ "name":null
17
+ },
18
+ "labels":{
19
+ "tok2vec":[
20
+
21
+ ],
22
+ "ner":[
23
+ "DATE",
24
+ "LOCATION",
25
+ "PERSON",
26
+ "TASK",
27
+ "TIME"
28
+ ]
29
+ },
30
+ "pipeline":[
31
+ "tok2vec",
32
+ "ner"
33
+ ],
34
+ "components":[
35
+ "tok2vec",
36
+ "ner"
37
+ ],
38
+ "disabled":[
39
+
40
+ ],
41
+ "performance":{
42
+ "ents_f":0.8979591837,
43
+ "ents_p":0.8979591837,
44
+ "ents_r":0.8979591837,
45
+ "ents_per_type":{
46
+ "TIME":{
47
+ "p":0.9473684211,
48
+ "r":0.9473684211,
49
+ "f":0.9473684211
50
+ },
51
+ "DATE":{
52
+ "p":0.8723404255,
53
+ "r":0.9111111111,
54
+ "f":0.8913043478
55
+ },
56
+ "TASK":{
57
+ "p":0.875,
58
+ "r":0.875,
59
+ "f":0.875
60
+ },
61
+ "PERSON":{
62
+ "p":0.9285714286,
63
+ "r":0.8125,
64
+ "f":0.8666666667
65
+ }
66
+ },
67
+ "tok2vec_loss":196.5795554539,
68
+ "ner_loss":122.2195483109
69
+ },
70
+ "requirements":[
71
+
72
+ ]
73
+ }
ner/cfg ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "moves":null,
3
+ "update_with_oracle_cut_size":100,
4
+ "multitasks":[
5
+
6
+ ],
7
+ "min_action_freq":1,
8
+ "learn_tokens":false,
9
+ "beam_width":1,
10
+ "beam_density":0.0,
11
+ "beam_update_prob":0.0,
12
+ "incorrect_spans_key":null
13
+ }
ner/model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5abe06e35b2210f36e1084f11de0734821dd7bb78c13836a85ac79ee0f1a4774
3
+ size 131668
ner/moves ADDED
@@ -0,0 +1 @@
 
 
1
+ ��moves� {"0":{},"1":{"TASK":1998,"DATE":631,"TIME":445,"PERSON":253,"LOCATION":2},"2":{"TASK":1998,"DATE":631,"TIME":445,"PERSON":253,"LOCATION":2},"3":{"TASK":1998,"DATE":631,"TIME":445,"PERSON":253,"LOCATION":2},"4":{"TASK":1998,"DATE":631,"TIME":445,"PERSON":253,"LOCATION":2,"":1},"5":{"":1}}�cfg��neg_key�
tok2vec/cfg ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+
3
+ }
tok2vec/model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6802a1aa6560ae4366b5ddba351841800646048fbcac81236a72e4636a455f6
3
+ size 6009091
tokenizer ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ ��prefix_search� �^§|^%|^=|^—|^–|^\+(?![0-9])|^…|^……|^,|^:|^;|^\!|^\?|^¿|^؟|^¡|^\(|^\)|^\[|^\]|^\{|^\}|^<|^>|^_|^#|^\*|^&|^。|^?|^!|^,|^、|^;|^:|^~|^·|^।|^،|^۔|^؛|^٪|^\.\.+|^…|^\'|^"|^”|^“|^`|^‘|^´|^’|^‚|^,|^„|^»|^«|^「|^」|^『|^』|^(|^)|^〔|^〕|^【|^】|^《|^》|^〈|^〉|^〈|^〉|^⟦|^⟧|^\$|^£|^€|^¥|^฿|^US\$|^C\$|^A\$|^₽|^﷼|^₴|^₠|^₡|^₢|^₣|^₤|^₥|^₦|^₧|^₨|^₩|^₪|^₫|^€|^₭|^₮|^₯|^₰|^₱|^₲|^₳|^₴|^₵|^₶|^₷|^₸|^₹|^₺|^₻|^₼|^₽|^₾|^₿|^[\u00A6\u00A9\u00AE\u00B0\u0482\u058D\u058E\u060E\u060F\u06DE\u06E9\u06FD\u06FE\u07F6\u09FA\u0B70\u0BF3-\u0BF8\u0BFA\u0C7F\u0D4F\u0D79\u0F01-\u0F03\u0F13\u0F15-\u0F17\u0F1A-\u0F1F\u0F34\u0F36\u0F38\u0FBE-\u0FC5\u0FC7-\u0FCC\u0FCE\u0FCF\u0FD5-\u0FD8\u109E\u109F\u1390-\u1399\u1940\u19DE-\u19FF\u1B61-\u1B6A\u1B74-\u1B7C\u2100\u2101\u2103-\u2106\u2108\u2109\u2114\u2116\u2117\u211E-\u2123\u2125\u2127\u2129\u212E\u213A\u213B\u214A\u214C\u214D\u214F\u218A\u218B\u2195-\u2199\u219C-\u219F\u21A1\u21A2\u21A4\u21A5\u21A7-\u21AD\u21AF-\u21CD\u21D0\u21D1\u21D3\u21D5-\u21F3\u2300-\u2307\u230C-\u231F\u2322-\u2328\u232B-\u237B\u237D-\u239A\u23B4-\u23DB\u23E2-\u2426\u2440-\u244A\u249C-\u24E9\u2500-\u25B6\u25B8-\u25C0\u25C2-\u25F7\u2600-\u266E\u2670-\u2767\u2794-\u27BF\u2800-\u28FF\u2B00-\u2B2F\u2B45\u2B46\u2B4D-\u2B73\u2B76-\u2B95\u2B98-\u2BC8\u2BCA-\u2BFE\u2CE5-\u2CEA\u2E80-\u2E99\u2E9B-\u2EF3\u2F00-\u2FD5\u2FF0-\u2FFB\u3004\u3012\u3013\u3020\u3036\u3037\u303E\u303F\u3190\u3191\u3196-\u319F\u31C0-\u31E3\u3200-\u321E\u322A-\u3247\u3250\u3260-\u327F\u328A-\u32B0\u32C0-\u32FE\u3300-\u33FF\u4DC0-\u4DFF\uA490-\uA4C6\uA828-\uA82B\uA836\uA837\uA839\uAA77-\uAA79\uFDFD\uFFE4\uFFE8\uFFED\uFFEE\uFFFC\uFFFD\U00010137-\U0001013F\U00010179-\U00010189\U0001018C-\U0001018E\U00010190-\U0001019B\U000101A0\U000101D0-\U000101FC\U00010877\U00010878\U00010AC8\U0001173F\U00016B3C-\U00016B3F\U00016B45\U0001BC9C\U0001D000-\U0001D0F5\U0001D100-\U0001D126\U0001D129-\U0001D164\U0001D16A-\U0001D16C\U0001D183\U0001D184\U0001D18C-\U0001D1A9\U0001D1AE-\U0001D1E8\U0001D200-\U0001D241\U0001D245\U0001D300-\U0001D356\
U0001D800-\U0001D9FF\U0001DA37-\U0001DA3A\U0001DA6D-\U0001DA74\U0001DA76-\U0001DA83\U0001DA85\U0001DA86\U0001ECAC\U0001F000-\U0001F02B\U0001F030-\U0001F093\U0001F0A0-\U0001F0AE\U0001F0B1-\U0001F0BF\U0001F0C1-\U0001F0CF\U0001F0D1-\U0001F0F5\U0001F110-\U0001F16B\U0001F170-\U0001F1AC\U0001F1E6-\U0001F202\U0001F210-\U0001F23B\U0001F240-\U0001F248\U0001F250\U0001F251\U0001F260-\U0001F265\U0001F300-\U0001F3FA\U0001F400-\U0001F6D4\U0001F6E0-\U0001F6EC\U0001F6F0-\U0001F6F9\U0001F700-\U0001F773\U0001F780-\U0001F7D8\U0001F800-\U0001F80B\U0001F810-\U0001F847\U0001F850-\U0001F859\U0001F860-\U0001F887\U0001F890-\U0001F8AD\U0001F900-\U0001F90B\U0001F910-\U0001F93E\U0001F940-\U0001F970\U0001F973-\U0001F976\U0001F97A\U0001F97C-\U0001F9A2\U0001F9B0-\U0001F9B9\U0001F9C0-\U0001F9C2\U0001F9D0-\U0001F9FF\U0001FA60-\U0001FA6D]�suffix_search�2�…$|……$|,$|:$|;$|\!$|\?$|¿$|؟$|¡$|\($|\)$|\[$|\]$|\{$|\}$|<$|>$|_$|#$|\*$|&$|。$|?$|!$|,$|、$|;$|:$|~$|·$|।$|،$|۔$|؛$|٪$|\.\.+$|…$|\'$|"$|”$|“$|`$|‘$|´$|’$|‚$|,$|„$|»$|«$|「$|」$|『$|』$|($|)$|〔$|〕$|【$|】$|《$|》$|〈$|〉$|〈$|〉$|⟦$|⟧$|[\u00A6\u00A9\u00AE\u00B0\u0482\u058D\u058E\u060E\u060F\u06DE\u06E9\u06FD\u06FE\u07F6\u09FA\u0B70\u0BF3-\u0BF8\u0BFA\u0C7F\u0D4F\u0D79\u0F01-\u0F03\u0F13\u0F15-\u0F17\u0F1A-\u0F1F\u0F34\u0F36\u0F38\u0FBE-\u0FC5\u0FC7-\u0FCC\u0FCE\u0FCF\u0FD5-\u0FD8\u109E\u109F\u1390-\u1399\u1940\u19DE-\u19FF\u1B61-\u1B6A\u1B74-\u1B7C\u2100\u2101\u2103-\u2106\u2108\u2109\u2114\u2116\u2117\u211E-\u2123\u2125\u2127\u2129\u212E\u213A\u213B\u214A\u214C\u214D\u214F\u218A\u218B\u2195-\u2199\u219C-\u219F\u21A1\u21A2\u21A4\u21A5\u21A7-\u21AD\u21AF-\u21CD\u21D0\u21D1\u21D3\u21D5-\u21F3\u2300-\u2307\u230C-\u231F\u2322-\u2328\u232B-\u237B\u237D-\u239A\u23B4-\u23DB\u23E2-\u2426\u2440-\u244A\u249C-\u24E9\u2500-\u25B6\u25B8-\u25C0\u25C2-\u25F7\u2600-\u266E\u2670-\u2767\u2794-\u27BF\u2800-\u28FF\u2B00-\u2B2F\u2B45\u2B46\u2B4D-\u2B73\u2B76-\u2B95\u2B98-\u2BC8\u2BCA-\u2BFE\u2CE5-\u2CEA\u2E80-\u2E99\u2E9B-\u2EF3\u2F00-\u2FD5\u2FF0-\u2FFB\u3004\u3012\u3013\u3020\u3036
\u3037\u303E\u303F\u3190\u3191\u3196-\u319F\u31C0-\u31E3\u3200-\u321E\u322A-\u3247\u3250\u3260-\u327F\u328A-\u32B0\u32C0-\u32FE\u3300-\u33FF\u4DC0-\u4DFF\uA490-\uA4C6\uA828-\uA82B\uA836\uA837\uA839\uAA77-\uAA79\uFDFD\uFFE4\uFFE8\uFFED\uFFEE\uFFFC\uFFFD\U00010137-\U0001013F\U00010179-\U00010189\U0001018C-\U0001018E\U00010190-\U0001019B\U000101A0\U000101D0-\U000101FC\U00010877\U00010878\U00010AC8\U0001173F\U00016B3C-\U00016B3F\U00016B45\U0001BC9C\U0001D000-\U0001D0F5\U0001D100-\U0001D126\U0001D129-\U0001D164\U0001D16A-\U0001D16C\U0001D183\U0001D184\U0001D18C-\U0001D1A9\U0001D1AE-\U0001D1E8\U0001D200-\U0001D241\U0001D245\U0001D300-\U0001D356\U0001D800-\U0001D9FF\U0001DA37-\U0001DA3A\U0001DA6D-\U0001DA74\U0001DA76-\U0001DA83\U0001DA85\U0001DA86\U0001ECAC\U0001F000-\U0001F02B\U0001F030-\U0001F093\U0001F0A0-\U0001F0AE\U0001F0B1-\U0001F0BF\U0001F0C1-\U0001F0CF\U0001F0D1-\U0001F0F5\U0001F110-\U0001F16B\U0001F170-\U0001F1AC\U0001F1E6-\U0001F202\U0001F210-\U0001F23B\U0001F240-\U0001F248\U0001F250\U0001F251\U0001F260-\U0001F265\U0001F300-\U0001F3FA\U0001F400-\U0001F6D4\U0001F6E0-\U0001F6EC\U0001F6F0-\U0001F6F9\U0001F700-\U0001F773\U0001F780-\U0001F7D8\U0001F800-\U0001F80B\U0001F810-\U0001F847\U0001F850-\U0001F859\U0001F860-\U0001F887\U0001F890-\U0001F8AD\U0001F900-\U0001F90B\U0001F910-\U0001F93E\U0001F940-\U0001F970\U0001F973-\U0001F976\U0001F97A\U0001F97C-\U0001F9A2\U0001F9B0-\U0001F9B9\U0001F9C0-\U0001F9C2\U0001F9D0-\U0001F9FF\U0001FA60-\U0001FA6D]$|'s$|'S$|’s$|’S$|—$|–$|(?<=[0-9])\+$|(?<=°[FfCcKk])\.$|(?<=[0-9])(?:\$|£|€|¥|฿|US\$|C\$|A\$|₽|﷼|₴|₠|₡|₢|₣|₤|₥|₦|₧|₨|₩|₪|₫|€|₭|₮|₯|₰|₱|₲|₳|₴|₵|₶|₷|₸|₹|₺|₻|₼|₽|₾|₿)$|(?<=[0-9])(?:km|km²|km³|m|m²|m³|dm|dm²|dm³|cm|cm²|cm³|mm|mm²|mm³|ha|µm|nm|yd|in|ft|kg|g|mg|µg|t|lb|oz|m/s|km/h|kmh|mph|hPa|Pa|mbar|mb|MB|kb|KB|gb|GB|tb|TB|T|G|M|K|%|км|км²|км³|м|м²|м³|дм|дм²|дм³|см|см²|см³|мм|мм²|мм³|нм|кг|г|мг|м/с|км/ч|кПа|Па|мбар|Кб|КБ|кб|Мб|МБ|мб|Гб|ГБ|гб|Тб|ТБ|тбكم|كم²|كم³|م|م²|م³|سم|سم²|سم³|مم|مم²|مم³|كم|غرام|جرام|جم|كغ|ملغ|كوب|اكواب)$|(?<=[0-9a-z\
uFF41-\uFF5A\u00DF-\u00F6\u00F8-\u00FF\u0101\u0103\u0105\u0107\u0109\u010B\u010D\u010F\u0111\u0113\u0115\u0117\u0119\u011B\u011D\u011F\u0121\u0123\u0125\u0127\u0129\u012B\u012D\u012F\u0131\u0133\u0135\u0137\u0138\u013A\u013C\u013E\u0140\u0142\u0144\u0146\u0148\u0149\u014B\u014D\u014F\u0151\u0153\u0155\u0157\u0159\u015B\u015D\u015F\u0161\u0163\u0165\u0167\u0169\u016B\u016D\u016F\u0171\u0173\u0175\u0177\u017A\u017C\u017E\u017F\u0180\u0183\u0185\u0188\u018C\u018D\u0192\u0195\u0199-\u019B\u019E\u01A1\u01A3\u01A5\u01A8\u01AA\u01AB\u01AD\u01B0\u01B4\u01B6\u01B9\u01BA\u01BD-\u01BF\u01C6\u01C9\u01CC\u01CE\u01D0\u01D2\u01D4\u01D6\u01D8\u01DA\u01DC\u01DD\u01DF\u01E1\u01E3\u01E5\u01E7\u01E9\u01EB\u01ED\u01EF\u01F0\u01F3\u01F5\u01F9\u01FB\u01FD\u01FF\u0201\u0203\u0205\u0207\u0209\u020B\u020D\u020F\u0211\u0213\u0215\u0217\u0219\u021B\u021D\u021F\u0221\u0223\u0225\u0227\u0229\u022B\u022D\u022F\u0231\u0233-\u0239\u023C\u023F\u0240\u0242\u0247\u0249\u024B\u024D\u024F\u2C61\u2C65\u2C66\u2C68\u2C6A\u2C6C\u2C71\u2C73\u2C74\u2C76-\u2C7B\uA723\uA725\uA727\uA729\uA72B\uA72D\uA72F-\uA731\uA733\uA735\uA737\uA739\uA73B\uA73D\uA73F\uA741\uA743\uA745\uA747\uA749\uA74B\uA74D\uA74F\uA751\uA753\uA755\uA757\uA759\uA75B\uA75D\uA75F\uA761\uA763\uA765\uA767\uA769\uA76B\uA76D\uA76F\uA771-\uA778\uA77A\uA77C\uA77F\uA781\uA783\uA785\uA787\uA78C\uA78E\uA791\uA793-\uA795\uA797\uA799\uA79B\uA79D\uA79F\uA7A1\uA7A3\uA7A5\uA7A7\uA7A9\uA7AF\uA7B5\uA7B7\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E01\u1E03\u1E05\u1E07\u1E09\u1E0B\u1E0D\u1E0F\u1E11\u1E13\u1E15\u1E17\u1E19\u1E1B\u1E1D\u1E1F\u1E21\u1E23\u1E25\u1E27\u1E29\u1E2B\u1E2D\u1E2F\u1E31\u1E33\u1E35\u1E37\u1E39\u1E3B\u1E3D\u1E3F\u1E41\u1E43\u1E45\u1E47\u1E49\u1E4B\u1E4D\u1E4F\u1E51\u1E53\u1E55\u1E57\u1E59\u1E5B\u1E5D\u1E5F\u1E61\u1E63\u1E65\u1E67\u1E69\u1E6B\u1E6D\u1E6F\u1E71\u1E73\u1E75\u1E77\u1E79\u1E7B\u1E7D\u1E7F\u1E81\u1E83\u1E85\u1E87\u1E89\u1E8B\u1E8D\u1E8F\u1E91\u1E93\u1E95-\u1E9D\u1E9F\u1EA1\u1EA3\u1E
A5\u1EA7\u1EA9\u1EAB\u1EAD\u1EAF\u1EB1\u1EB3\u1EB5\u1EB7\u1EB9\u1EBB\u1EBD\u1EBF\u1EC1\u1EC3\u1EC5\u1EC7\u1EC9\u1ECB\u1ECD\u1ECF\u1ED1\u1ED3\u1ED5\u1ED7\u1ED9\u1EDB\u1EDD\u1EDF\u1EE1\u1EE3\u1EE5\u1EE7\u1EE9\u1EEB\u1EED\u1EEF\u1EF1\u1EF3\u1EF5\u1EF7\u1EF9\u1EFB\u1EFD\u1EFFёа-яәөүҗңһα-ωάέίόώήύа-щюяіїєґѓѕјљњќѐѝ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F%²\-\+…|……|,|:|;|\!|\?|¿|؟|¡|\(|\)|\[|\]|\{|\}|<|>|_|#|\*|&|。|?|!|,|、|;|:|~|·|।|،|۔|؛|٪(?:\'"”“`‘´’‚,„»«「」『』()〔〕【】《》〈〉〈〉⟦⟧)])\.$|(?<=[A-Z\uFF21-\uFF3A\u00C0-\u00D6\u00D8-\u00DE\u0100\u0102\u0104\u0106\u0108\u010A\u010C\u010E\u0110\u0112\u0114\u0116\u0118\u011A\u011C\u011E\u0120\u0122\u0124\u0126\u0128\u012A\u012C\u012E\u0130\u0132\u0134\u0136\u0139\u013B\u013D\u013F\u0141\u0143\u0145\u0147\u014A\u014C\u014E\u0150\u0152\u0154\u0156\u0158\u015A\u015C\u015E\u0160\u0162\u0164\u0166\u0168\u016A\u016C\u016E\u0170\u0172\u0174\u0176\u0178\u0179\u017B\u017D\u0181\u0182\u0184\u0186\u0187\u0189-\u018B\u018E-\u0191\u0193\u0194\u0196-\u0198\u019C\u019D\u019F\u01A0\u01A2\u01A4\u01A6\u01A7\u01A9\u01AC\u01AE\u01AF\u01B1-\u01B3\u01B5\u01B7\u01B8\u01BC\u01C4\u01C7\u01CA\u01CD\u01CF\u01D1\u01D3\u01D5\u01D7\u01D9\u01DB\u01DE\u01E0\u01E2\u01E4\u01E6\u01E8\u01EA\u01EC\u01EE\u01F1\u01F4\u01F6-\u01F8\u01FA\u01FC\u01FE\u0200\u
0202\u0204\u0206\u0208\u020A\u020C\u020E\u0210\u0212\u0214\u0216\u0218\u021A\u021C\u021E\u0220\u0222\u0224\u0226\u0228\u022A\u022C\u022E\u0230\u0232\u023A\u023B\u023D\u023E\u0241\u0243-\u0246\u0248\u024A\u024C\u024E\u2C60\u2C62-\u2C64\u2C67\u2C69\u2C6B\u2C6D-\u2C70\u2C72\u2C75\u2C7E\u2C7F\uA722\uA724\uA726\uA728\uA72A\uA72C\uA72E\uA732\uA734\uA736\uA738\uA73A\uA73C\uA73E\uA740\uA742\uA744\uA746\uA748\uA74A\uA74C\uA74E\uA750\uA752\uA754\uA756\uA758\uA75A\uA75C\uA75E\uA760\uA762\uA764\uA766\uA768\uA76A\uA76C\uA76E\uA779\uA77B\uA77D\uA77E\uA780\uA782\uA784\uA786\uA78B\uA78D\uA790\uA792\uA796\uA798\uA79A\uA79C\uA79E\uA7A0\uA7A2\uA7A4\uA7A6\uA7A8\uA7AA-\uA7AE\uA7B0-\uA7B4\uA7B6\uA7B8\u1E00\u1E02\u1E04\u1E06\u1E08\u1E0A\u1E0C\u1E0E\u1E10\u1E12\u1E14\u1E16\u1E18\u1E1A\u1E1C\u1E1E\u1E20\u1E22\u1E24\u1E26\u1E28\u1E2A\u1E2C\u1E2E\u1E30\u1E32\u1E34\u1E36\u1E38\u1E3A\u1E3C\u1E3E\u1E40\u1E42\u1E44\u1E46\u1E48\u1E4A\u1E4C\u1E4E\u1E50\u1E52\u1E54\u1E56\u1E58\u1E5A\u1E5C\u1E5E\u1E60\u1E62\u1E64\u1E66\u1E68\u1E6A\u1E6C\u1E6E\u1E70\u1E72\u1E74\u1E76\u1E78\u1E7A\u1E7C\u1E7E\u1E80\u1E82\u1E84\u1E86\u1E88\u1E8A\u1E8C\u1E8E\u1E90\u1E92\u1E94\u1E9E\u1EA0\u1EA2\u1EA4\u1EA6\u1EA8\u1EAA\u1EAC\u1EAE\u1EB0\u1EB2\u1EB4\u1EB6\u1EB8\u1EBA\u1EBC\u1EBE\u1EC0\u1EC2\u1EC4\u1EC6\u1EC8\u1ECA\u1ECC\u1ECE\u1ED0\u1ED2\u1ED4\u1ED6\u1ED8\u1EDA\u1EDC\u1EDE\u1EE0\u1EE2\u1EE4\u1EE6\u1EE8\u1EEA\u1EEC\u1EEE\u1EF0\u1EF2\u1EF4\u1EF6\u1EF8\u1EFA\u1EFC\u1EFEЁА-ЯӘӨҮҖҢҺΑ-ΩΆΈΊΌΏΉΎА-ЩЮЯІЇЄҐЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6D
F\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F][A-Z\uFF21-\uFF3A\u00C0-\u00D6\u00D8-\u00DE\u0100\u0102\u0104\u0106\u0108\u010A\u010C\u010E\u0110\u0112\u0114\u0116\u0118\u011A\u011C\u011E\u0120\u0122\u0124\u0126\u0128\u012A\u012C\u012E\u0130\u0132\u0134\u0136\u0139\u013B\u013D\u013F\u0141\u0143\u0145\u0147\u014A\u014C\u014E\u0150\u0152\u0154\u0156\u0158\u015A\u015C\u015E\u0160\u0162\u0164\u0166\u0168\u016A\u016C\u016E\u0170\u0172\u0174\u0176\u0178\u0179\u017B\u017D\u0181\u0182\u0184\u0186\u0187\u0189-\u018B\u018E-\u0191\u0193\u0194\u0196-\u0198\u019C\u019D\u019F\u01A0\u01A2\u01A4\u01A6\u01A7\u01A9\u01AC\u01AE\u01AF\u01B1-\u01B3\u01B5\u01B7\u01B8\u01BC\u01C4\u01C7\u01CA\u01CD\u01CF\u01D1\u01D3\u01D5\u01D7\u01D9\u01DB\u01DE\u01E0\u01E2\u01E4\u01E6\u01E8\u01EA\u01EC\u01EE\u01F1\u01F4\u01F6-\u01F8\u01FA\u01FC\u01FE\u0200\u0202\u0204\u0206\u0208\u020A\u020C\u020E\u0210\u0212\u0214\u0216\u0218\u021A\u021C\u021E\u0220\u0222\u0224\u0226\u0228\u022A\u022C\u022E\u0230\u0232\u023A\u023B\u023D\u023E\u0241\u0243-\u0246\u0248\u024A\u024C\u024E\u2C60\u2C62-\u2C64\u2C67\u2C69\u2C6B\u2C6D-\u2C70\u2C72\u2C75\u2C7E\u2C7F\uA722\uA724\uA726\uA728\uA72A\uA72C\uA72E\uA732\uA734\uA736\uA738\uA73A\uA73C\uA73E\uA740\uA742\uA744\uA746\uA748\uA74A\uA74C\uA74E\uA750\uA752\uA754\uA756\uA758\uA75A\uA75C\uA75E\uA760\uA762\uA764\uA766\uA768\uA76A\uA76C\uA76E\uA779\uA77B\uA77D\uA77E\uA780\uA782\uA784\uA786\uA78B\uA78D\uA790\uA792\uA796\uA798\uA79A\uA79C\uA79E\uA7A0\uA7A2\uA7A4\uA7A6\uA7A8\uA7AA-\uA7AE\uA7B0-\uA7B4\uA7B6\uA7B8\u1E00\u1E02\u1E04\u1E06\u1E08\u1E0A\u1E0C\u1E0E\u1E10\u1E12\u1E14\u1E16\u1E18\u1E1A\u1E1C\u1E1E\u1E20\u1E22\u1E24\u1E26\u1E28\u1E2A\u1E2C\u1E2E\u1E30\u1E32\u1E34\u1E36\u1E38\u1E3A\u1E3C\u1E3E\u1E40\u1E42\u1E44\u1E46\u1E48\u1E4A\u1E4C\u1E4E\u1E50\u1E52\u1E54\u1E56\u1E58\u1E5A\u1E5C\u1E
5E\u1E60\u1E62\u1E64\u1E66\u1E68\u1E6A\u1E6C\u1E6E\u1E70\u1E72\u1E74\u1E76\u1E78\u1E7A\u1E7C\u1E7E\u1E80\u1E82\u1E84\u1E86\u1E88\u1E8A\u1E8C\u1E8E\u1E90\u1E92\u1E94\u1E9E\u1EA0\u1EA2\u1EA4\u1EA6\u1EA8\u1EAA\u1EAC\u1EAE\u1EB0\u1EB2\u1EB4\u1EB6\u1EB8\u1EBA\u1EBC\u1EBE\u1EC0\u1EC2\u1EC4\u1EC6\u1EC8\u1ECA\u1ECC\u1ECE\u1ED0\u1ED2\u1ED4\u1ED6\u1ED8\u1EDA\u1EDC\u1EDE\u1EE0\u1EE2\u1EE4\u1EE6\u1EE8\u1EEA\u1EEC\u1EEE\u1EF0\u1EF2\u1EF4\u1EF6\u1EF8\u1EFA\u1EFC\u1EFEЁА-ЯӘӨҮҖҢҺΑ-ΩΆΈΊΌΏΉΎА-ЩЮЯІЇЄҐЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F])\.$�infix_finditer�>�\.\.+|…|[\u00A6\u00A9\u00AE\u00B0\u0482\u058D\u058E\u060E\u060F\u06DE\u06E9\u06FD\u06FE\u07F6\u09FA\u0B70\u0BF3-\u0BF8\u0BFA\u0C7F\u0D4F\u0D79\u0F01-\u0F03\u0F13\u0F15-\u0F17\u0F1A-\u0F1F\u0F34\u0F36\u0F38\u0FBE-\u0FC5\u0FC7-\u0FCC\u0FCE\u0FCF\u0FD5-\u0FD8\u109E\u109F\u1390-\u1399\u1940\u19DE-\u19FF\u1B61-\u1B6A\u1B74-\u1B7C\u2100\u2101\u2103-\u2106\u2108\u2109\u2114\u2116\u2117\u211E-\u2123\u2125\u2127\u2129\u212E\u213A\u213B\u214A\u214C\u214D\u214F\u218A\u218B\u2195-\u2199\u219C-\u219F\u21A1\u21A2\u21A4\u21A5\u21A7-\u21AD\u21AF-\u21CD\u21D0\u21D1\u21D3\u21D5-\u21F3\u2300-\u2307\u230C-\u231F\u2322-\u2328\u232B-\u237B\u237D-\u239A\u23B4-\u23DB\u23E2-\u2426\u2440-\u244A\u249C-\u24E9\u2500-\u25B6\u2
5B8-\u25C0\u25C2-\u25F7\u2600-\u266E\u2670-\u2767\u2794-\u27BF\u2800-\u28FF\u2B00-\u2B2F\u2B45\u2B46\u2B4D-\u2B73\u2B76-\u2B95\u2B98-\u2BC8\u2BCA-\u2BFE\u2CE5-\u2CEA\u2E80-\u2E99\u2E9B-\u2EF3\u2F00-\u2FD5\u2FF0-\u2FFB\u3004\u3012\u3013\u3020\u3036\u3037\u303E\u303F\u3190\u3191\u3196-\u319F\u31C0-\u31E3\u3200-\u321E\u322A-\u3247\u3250\u3260-\u327F\u328A-\u32B0\u32C0-\u32FE\u3300-\u33FF\u4DC0-\u4DFF\uA490-\uA4C6\uA828-\uA82B\uA836\uA837\uA839\uAA77-\uAA79\uFDFD\uFFE4\uFFE8\uFFED\uFFEE\uFFFC\uFFFD\U00010137-\U0001013F\U00010179-\U00010189\U0001018C-\U0001018E\U00010190-\U0001019B\U000101A0\U000101D0-\U000101FC\U00010877\U00010878\U00010AC8\U0001173F\U00016B3C-\U00016B3F\U00016B45\U0001BC9C\U0001D000-\U0001D0F5\U0001D100-\U0001D126\U0001D129-\U0001D164\U0001D16A-\U0001D16C\U0001D183\U0001D184\U0001D18C-\U0001D1A9\U0001D1AE-\U0001D1E8\U0001D200-\U0001D241\U0001D245\U0001D300-\U0001D356\U0001D800-\U0001D9FF\U0001DA37-\U0001DA3A\U0001DA6D-\U0001DA74\U0001DA76-\U0001DA83\U0001DA85\U0001DA86\U0001ECAC\U0001F000-\U0001F02B\U0001F030-\U0001F093\U0001F0A0-\U0001F0AE\U0001F0B1-\U0001F0BF\U0001F0C1-\U0001F0CF\U0001F0D1-\U0001F0F5\U0001F110-\U0001F16B\U0001F170-\U0001F1AC\U0001F1E6-\U0001F202\U0001F210-\U0001F23B\U0001F240-\U0001F248\U0001F250\U0001F251\U0001F260-\U0001F265\U0001F300-\U0001F3FA\U0001F400-\U0001F6D4\U0001F6E0-\U0001F6EC\U0001F6F0-\U0001F6F9\U0001F700-\U0001F773\U0001F780-\U0001F7D8\U0001F800-\U0001F80B\U0001F810-\U0001F847\U0001F850-\U0001F859\U0001F860-\U0001F887\U0001F890-\U0001F8AD\U0001F900-\U0001F90B\U0001F910-\U0001F93E\U0001F940-\U0001F970\U0001F973-\U0001F976\U0001F97A\U0001F97C-\U0001F9A2\U0001F9B0-\U0001F9B9\U0001F9C0-\U0001F9C2\U0001F9D0-\U0001F9FF\U0001FA60-\U0001FA6D]|(?<=[0-9])[+\-\*^](?=[0-9-])|(?<=[a-z\uFF41-\uFF5A\u00DF-\u00F6\u00F8-\u00FF\u0101\u0103\u0105\u0107\u0109\u010B\u010D\u010F\u0111\u0113\u0115\u0117\u0119\u011B\u011D\u011F\u0121\u0123\u0125\u0127\u0129\u012B\u012D\u012F\u0131\u0133\u0135\u0137\u0138\u013A\u013C\u013E\u0140\u0142\u0144\u0
146\u0148\u0149\u014B\u014D\u014F\u0151\u0153\u0155\u0157\u0159\u015B\u015D\u015F\u0161\u0163\u0165\u0167\u0169\u016B\u016D\u016F\u0171\u0173\u0175\u0177\u017A\u017C\u017E\u017F\u0180\u0183\u0185\u0188\u018C\u018D\u0192\u0195\u0199-\u019B\u019E\u01A1\u01A3\u01A5\u01A8\u01AA\u01AB\u01AD\u01B0\u01B4\u01B6\u01B9\u01BA\u01BD-\u01BF\u01C6\u01C9\u01CC\u01CE\u01D0\u01D2\u01D4\u01D6\u01D8\u01DA\u01DC\u01DD\u01DF\u01E1\u01E3\u01E5\u01E7\u01E9\u01EB\u01ED\u01EF\u01F0\u01F3\u01F5\u01F9\u01FB\u01FD\u01FF\u0201\u0203\u0205\u0207\u0209\u020B\u020D\u020F\u0211\u0213\u0215\u0217\u0219\u021B\u021D\u021F\u0221\u0223\u0225\u0227\u0229\u022B\u022D\u022F\u0231\u0233-\u0239\u023C\u023F\u0240\u0242\u0247\u0249\u024B\u024D\u024F\u2C61\u2C65\u2C66\u2C68\u2C6A\u2C6C\u2C71\u2C73\u2C74\u2C76-\u2C7B\uA723\uA725\uA727\uA729\uA72B\uA72D\uA72F-\uA731\uA733\uA735\uA737\uA739\uA73B\uA73D\uA73F\uA741\uA743\uA745\uA747\uA749\uA74B\uA74D\uA74F\uA751\uA753\uA755\uA757\uA759\uA75B\uA75D\uA75F\uA761\uA763\uA765\uA767\uA769\uA76B\uA76D\uA76F\uA771-\uA778\uA77A\uA77C\uA77F\uA781\uA783\uA785\uA787\uA78C\uA78E\uA791\uA793-\uA795\uA797\uA799\uA79B\uA79D\uA79F\uA7A1\uA7A3\uA7A5\uA7A7\uA7A9\uA7AF\uA7B5\uA7B7\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E01\u1E03\u1E05\u1E07\u1E09\u1E0B\u1E0D\u1E0F\u1E11\u1E13\u1E15\u1E17\u1E19\u1E1B\u1E1D\u1E1F\u1E21\u1E23\u1E25\u1E27\u1E29\u1E2B\u1E2D\u1E2F\u1E31\u1E33\u1E35\u1E37\u1E39\u1E3B\u1E3D\u1E3F\u1E41\u1E43\u1E45\u1E47\u1E49\u1E4B\u1E4D\u1E4F\u1E51\u1E53\u1E55\u1E57\u1E59\u1E5B\u1E5D\u1E5F\u1E61\u1E63\u1E65\u1E67\u1E69\u1E6B\u1E6D\u1E6F\u1E71\u1E73\u1E75\u1E77\u1E79\u1E7B\u1E7D\u1E7F\u1E81\u1E83\u1E85\u1E87\u1E89\u1E8B\u1E8D\u1E8F\u1E91\u1E93\u1E95-\u1E9D\u1E9F\u1EA1\u1EA3\u1EA5\u1EA7\u1EA9\u1EAB\u1EAD\u1EAF\u1EB1\u1EB3\u1EB5\u1EB7\u1EB9\u1EBB\u1EBD\u1EBF\u1EC1\u1EC3\u1EC5\u1EC7\u1EC9\u1ECB\u1ECD\u1ECF\u1ED1\u1ED3\u1ED5\u1ED7\u1ED9\u1EDB\u1EDD\u1EDF\u1EE1\u1EE3\u1EE5\u1EE7\u1EE9\u1EEB\u1EED\u1EEF\u1EF1\u1EF3\u1EF5\u1EF7\u1
EF9\u1EFB\u1EFD\u1EFFёа-яәөүҗңһα-ωάέίόώήύа-щюяіїєґѓѕјљњќѐѝ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F\'"”“`‘´’‚,„»«「」『』()〔〕【】《》〈〉〈〉⟦⟧])\.(?=[A-Z\uFF21-\uFF3A\u00C0-\u00D6\u00D8-\u00DE\u0100\u0102\u0104\u0106\u0108\u010A\u010C\u010E\u0110\u0112\u0114\u0116\u0118\u011A\u011C\u011E\u0120\u0122\u0124\u0126\u0128\u012A\u012C\u012E\u0130\u0132\u0134\u0136\u0139\u013B\u013D\u013F\u0141\u0143\u0145\u0147\u014A\u014C\u014E\u0150\u0152\u0154\u0156\u0158\u015A\u015C\u015E\u0160\u0162\u0164\u0166\u0168\u016A\u016C\u016E\u0170\u0172\u0174\u0176\u0178\u0179\u017B\u017D\u0181\u0182\u0184\u0186\u0187\u0189-\u018B\u018E-\u0191\u0193\u0194\u0196-\u0198\u019C\u019D\u019F\u01A0\u01A2\u01A4\u01A6\u01A7\u01A9\u01AC\u01AE\u01AF\u01B1-\u01B3\u01B5\u01B7\u01B8\u01BC\u01C4\u01C7\u01CA\u01CD\u01CF\u01D1\u01D3\u01D5\u01D7\u01D9\u01DB\u01DE\u01E0\u01E2\u01E4\u01E6\u01E8\u01EA\u01EC\u01EE\u01F1\u01F4\u01F6-\u01F8\u01FA\u01FC\u01FE\u0200\u0202\u0204\u0206\u0208\u020A\u020C\u020E\u0210\u0212\u0214\u0216\u0218\u021A\u021C\u021E\u0220\u0222\u0224\u0226\u0228\u022A\u022C\u022E\u0230\u0232\u023A\u023B\u023D\u023E\u0241\u0243-\u0246\u0248\u024A\u024C\u024E\u2C60\u2C62-\u2C64\u2C67\u2C69\u2C6B\u2C6D-\u2C70\u2C72\u2C75\u2C7E\u2C7F\uA722\uA724\uA726\uA728\uA72A\uA72C\uA72E\uA732\uA734\u
A736\uA738\uA73A\uA73C\uA73E\uA740\uA742\uA744\uA746\uA748\uA74A\uA74C\uA74E\uA750\uA752\uA754\uA756\uA758\uA75A\uA75C\uA75E\uA760\uA762\uA764\uA766\uA768\uA76A\uA76C\uA76E\uA779\uA77B\uA77D\uA77E\uA780\uA782\uA784\uA786\uA78B\uA78D\uA790\uA792\uA796\uA798\uA79A\uA79C\uA79E\uA7A0\uA7A2\uA7A4\uA7A6\uA7A8\uA7AA-\uA7AE\uA7B0-\uA7B4\uA7B6\uA7B8\u1E00\u1E02\u1E04\u1E06\u1E08\u1E0A\u1E0C\u1E0E\u1E10\u1E12\u1E14\u1E16\u1E18\u1E1A\u1E1C\u1E1E\u1E20\u1E22\u1E24\u1E26\u1E28\u1E2A\u1E2C\u1E2E\u1E30\u1E32\u1E34\u1E36\u1E38\u1E3A\u1E3C\u1E3E\u1E40\u1E42\u1E44\u1E46\u1E48\u1E4A\u1E4C\u1E4E\u1E50\u1E52\u1E54\u1E56\u1E58\u1E5A\u1E5C\u1E5E\u1E60\u1E62\u1E64\u1E66\u1E68\u1E6A\u1E6C\u1E6E\u1E70\u1E72\u1E74\u1E76\u1E78\u1E7A\u1E7C\u1E7E\u1E80\u1E82\u1E84\u1E86\u1E88\u1E8A\u1E8C\u1E8E\u1E90\u1E92\u1E94\u1E9E\u1EA0\u1EA2\u1EA4\u1EA6\u1EA8\u1EAA\u1EAC\u1EAE\u1EB0\u1EB2\u1EB4\u1EB6\u1EB8\u1EBA\u1EBC\u1EBE\u1EC0\u1EC2\u1EC4\u1EC6\u1EC8\u1ECA\u1ECC\u1ECE\u1ED0\u1ED2\u1ED4\u1ED6\u1ED8\u1EDA\u1EDC\u1EDE\u1EE0\u1EE2\u1EE4\u1EE6\u1EE8\u1EEA\u1EEC\u1EEE\u1EF0\u1EF2\u1EF4\u1EF6\u1EF8\u1EFA\u1EFC\u1EFEЁА-ЯӘӨҮҖҢҺΑ-ΩΆΈΊΌΏΉΎА-ЩЮЯІЇЄҐЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F\'"”“`‘´’‚,„»«「」『』()〔〕【】《》〈〉〈〉⟦⟧])|(?<=[A-Za-z\uFF21-\uFF3A\uFF41-\uFF5A\u00C0-\u00D6\u00D8-\u00F6\u0
0F8-\u00FF\u0100-\u017F\u0180-\u01BF\u01C4-\u024F\u2C60-\u2C7B\u2C7E\u2C7F\uA722-\uA76F\uA771-\uA787\uA78B-\uA78E\uA790-\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E00-\u1EFFёа-яЁА-ЯәөүҗңһӘӨҮҖҢҺα-ωάέίόώήύΑ-ΩΆΈΊΌΏΉΎа-щюяіїєґА-ЩЮЯІЇЄҐѓѕјљњќѐѝЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F]),(?=[A-Za-z\uFF21-\uFF3A\uFF41-\uFF5A\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u00FF\u0100-\u017F\u0180-\u01BF\u01C4-\u024F\u2C60-\u2C7B\u2C7E\u2C7F\uA722-\uA76F\uA771-\uA787\uA78B-\uA78E\uA790-\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E00-\u1EFFёа-яЁА-ЯәөүҗңһӘӨҮҖҢҺα-ωάέίόώήύΑ-ΩΆΈΊΌΏΉΎа-щюяіїєґА-ЩЮЯІЇЄҐѓѕјљњќѐѝЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B7
40-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F])|(?<=[A-Za-z\uFF21-\uFF3A\uFF41-\uFF5A\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u00FF\u0100-\u017F\u0180-\u01BF\u01C4-\u024F\u2C60-\u2C7B\u2C7E\u2C7F\uA722-\uA76F\uA771-\uA787\uA78B-\uA78E\uA790-\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E00-\u1EFFёа-яЁА-ЯәөүҗңһӘӨҮҖҢҺα-ωάέίόώήύΑ-ΩΆΈΊΌΏΉΎа-щюяіїєґА-ЩЮЯІЇЄҐѓѕјљњќѐѝЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F])(?:-|–|—|--|---|——|~)(?=[A-Za-z\uFF21-\uFF3A\uFF41-\uFF5A\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u00FF\u0100-\u017F\u0180-\u01BF\u01C4-\u024F\u2C60-\u2C7B\u2C7E\u2C7F\uA722-\uA76F\uA771-\uA787\uA78B-\uA78E\uA790-\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E00-\u1EFFёа-яЁА-ЯәөүҗңһӘӨҮҖҢҺα-ωάέίόώήύΑ-ΩΆΈΊΌΏΉΎа-щюяіїєґА-ЩЮЯІЇЄҐѓѕјљњќѐѝЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C
00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F])|(?<=[A-Za-z\uFF21-\uFF3A\uFF41-\uFF5A\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u00FF\u0100-\u017F\u0180-\u01BF\u01C4-\u024F\u2C60-\u2C7B\u2C7E\u2C7F\uA722-\uA76F\uA771-\uA787\uA78B-\uA78E\uA790-\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E00-\u1EFFёа-яЁА-ЯәөүҗңһӘӨҮҖҢҺα-ωάέίόώήύΑ-ΩΆΈΊΌΏΉΎа-щюяіїєґА-ЩЮЯІЇЄҐѓѕјљњќѐѝЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F0-9])[:<>=/](?=[A-Za-z\uFF21-\uFF3A\uFF41-\uFF5A\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u00FF\u0100-\u017F\u0180-\u01BF\u01C4-\u024F\u2C60-\u2C7B\u2C7E\u2C7F\uA722-\uA76F\uA771-\uA787\uA78B-\uA78E\uA790-\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E00-\u1EFFёа-яЁА-ЯәөүҗңһӘӨҮҖҢҺα-ωάέίόώήύΑ-ΩΆΈΊΌΏΉΎа
-щюяіїєґА-ЩЮЯІЇЄҐѓѕјљњќѐѝЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F])�token_match��url_match�
2
+ ��A�
3
+ � ��A� �'��A�'�''��A�''�(*_*)��A�(*_*)�(-8��A�(-8�(-:��A�(-:�(-;��A�(-;�(-_-)��A�(-_-)�(._.)��A�(._.)�(:��A�(:�(;��A�(;�(=��A�(=�(>_<)��A�(>_<)�(^_^)��A�(^_^)�(o:��A�(o:�(¬_¬)��A�(¬_¬)�(ಠ_ಠ)��A�(ಠ_ಠ)�(╯°□°)╯︵┻━┻��A�(╯°□°)╯︵┻━┻�)-:��A�)-:�):��A�):�-_-��A�-_-�-__-��A�-__-�._.��A�._.�0.0��A�0.0�0.o��A�0.o�0_0��A�0_0�0_o��A�0_o�8)��A�8)�8-)��A�8-)�8-D��A�8-D�8D��A�8D�:'(��A�:'(�:')��A�:')�:'-(��A�:'-(�:'-)��A�:'-)�:(��A�:(�:((��A�:((�:(((��A�:(((�:()��A�:()�:)��A�:)�:))��A�:))�:)))��A�:)))�:*��A�:*�:-(��A�:-(�:-((��A�:-((�:-(((��A�:-(((�:-)��A�:-)�:-))��A�:-))�:-)))��A�:-)))�:-*��A�:-*�:-/��A�:-/�:-0��A�:-0�:-3��A�:-3�:->��A�:->�:-D��A�:-D�:-O��A�:-O�:-P��A�:-P�:-X��A�:-X�:-]��A�:-]�:-o��A�:-o�:-p��A�:-p�:-x��A�:-x�:-|��A�:-|�:-}��A�:-}�:/��A�:/�:0��A�:0�:1��A�:1�:3��A�:3�:>��A�:>�:D��A�:D�:O��A�:O�:P��A�:P�:X��A�:X�:]��A�:]�:o��A�:o�:o)��A�:o)�:p��A�:p�:x��A�:x�:|��A�:|�:}��A�:}�;)��A�;)�;-)��A�;-)�;-D��A�;-D�;D��A�;D�;_;��A�;_;�<.<��A�<.<�</3��A�</3�<3��A�<3�<33��A�<33�<333��A�<333�<space>��A�<space>�=(��A�=(�=)��A�=)�=/��A�=/�=3��A�=3�=D��A�=D�=[��A�=[�=]��A�=]�=|��A�=|�>.<��A�>.<�>.>��A�>.>�>:(��A�>:(�>:o��A�>:o�><(((*>��A�><(((*>�@_@��A�@_@�C++��A�C++�O.O��A�O.O�O.o��A�O.o�O_O��A�O_O�O_o��A�O_o�V.V��A�V.V�V_V��A�V_V�XD��A�XD�XDD��A�XDD�[-:��A�[-:�[:��A�[:�[=��A�[=�\")��A�\")�\n��A�\n�\t��A�\t�]=��A�]=�^_^��A�^_^�^__^��A�^__^�^___^��A�^___^�a.��A�a.�b.��A�b.�c.��A�c.�d.��A�d.�e.��A�e.�f.��A�f.�g.��A�g.�h.��A�h.�i.��A�i.�j.��A�j.�k.��A�k.�l.��A�l.�m.��A�m.�n.��A�n.�o.��A�o.�o.0��A�o.0�o.O��A�o.O�o.o��A�o.o�o_0��A�o_0�o_O��A�o_O�o_o��A�o_o�p.��A�p.�q.��A�q.�r.��A�r.�s.��A�s.�t.��A�t.�u.��A�u.�v.��A�v.�v.v��A�v.v�v_v��A�v_v�w.��A�w.�x.��A�x.�xD��A�xD�xDD��A�xDD�y.��A�y.�z.��A�z.� ��A� C� �¯\(ツ)/¯��A�¯\(ツ)/¯�°C.��A�°�A�C�A�.�°F.��A�°�A�F�A�.�°K.��A�°�A�K�A�.�°c.��A�°�A�c�A�.�°f.��A�°�A�f�A�.�°k.��A�°�A�k�A�.�ä.��A�ä.�ö.��A�ö.�ü.��A�ü.�ಠ_ಠ��A�ಠ_ಠ�ಠ︵ಠ��A�ಠ︵ಠ�—��A�—�faster_heuristics�
vi_task_ner-any-py3-none-any.whl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f92c313af6e8f6fc608b32e4a549d0ff3df66eaa5896bd382055cdf881f52339
3
+ size 5667925
vocab/key2row ADDED
@@ -0,0 +1 @@
 
 
1
+
vocab/lookups.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76be8b528d0075f7aae98d6fa57a6d3c83ae480a8469e668d7b0af968995ac71
3
+ size 1
vocab/strings.json ADDED
@@ -0,0 +1,1242 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ "\t",
3
+ "\n",
4
+ " ",
5
+ " ",
6
+ "\"",
7
+ "'",
8
+ "''",
9
+ "'-(",
10
+ "'-)",
11
+ "(",
12
+ "(((",
13
+ "(*>",
14
+ "(*_*)",
15
+ "(-8",
16
+ "(-:",
17
+ "(-;",
18
+ "(-_-)",
19
+ "(-d",
20
+ "(._.)",
21
+ "(:",
22
+ "(;",
23
+ "(=",
24
+ "(>_<)",
25
+ "(^_^)",
26
+ "(o:",
27
+ "(x:",
28
+ "(x_x)",
29
+ "(\u00ac_\u00ac)",
30
+ "(\u0ca0_\u0ca0)",
31
+ "(\u256f\u00b0\u25a1\u00b0\uff09\u256f\ufe35\u253b\u2501\u253b",
32
+ ")",
33
+ ")))",
34
+ ")-:",
35
+ ")/\u00af",
36
+ "):",
37
+ "*",
38
+ "-",
39
+ "-((",
40
+ "-))",
41
+ "-/",
42
+ "-0",
43
+ "-3",
44
+ "-8",
45
+ "-D",
46
+ "-O",
47
+ "-P",
48
+ "-X",
49
+ "-_-",
50
+ "-__-",
51
+ "-d",
52
+ "-o",
53
+ "-p",
54
+ "-x",
55
+ "-|",
56
+ ".",
57
+ "._.",
58
+ "/",
59
+ "/10",
60
+ "/11",
61
+ "/12",
62
+ "/3",
63
+ "/d",
64
+ "0",
65
+ "0.0",
66
+ "0.o",
67
+ "0/1",
68
+ "0/9",
69
+ "0_0",
70
+ "0_o",
71
+ "1",
72
+ "1/10",
73
+ "1/12",
74
+ "10",
75
+ "10/10",
76
+ "10/11",
77
+ "10h",
78
+ "10h00",
79
+ "11",
80
+ "11h30",
81
+ "12",
82
+ "12/10",
83
+ "12h",
84
+ "12h00",
85
+ "13h15",
86
+ "14",
87
+ "14:00",
88
+ "14:30",
89
+ "14h",
90
+ "14h30",
91
+ "15",
92
+ "15/10",
93
+ "15/11",
94
+ "15h",
95
+ "15h00",
96
+ "16h45",
97
+ "17",
98
+ "17/10",
99
+ "17:30",
100
+ "17h",
101
+ "17h30",
102
+ "18:00",
103
+ "18h",
104
+ "18h20",
105
+ "19h00",
106
+ "19h30",
107
+ "19h50",
108
+ "1h",
109
+ "2",
110
+ "2/1",
111
+ "2/10",
112
+ "20/1",
113
+ "20/10",
114
+ "20/11",
115
+ "20/12",
116
+ "20h",
117
+ "20h00",
118
+ "21h",
119
+ "21h00",
120
+ "22h00",
121
+ "23/12",
122
+ "23h59",
123
+ "25/10",
124
+ "25/11",
125
+ "3",
126
+ "3/10",
127
+ "30",
128
+ "30/10",
129
+ "30/11",
130
+ "30/12",
131
+ "30/9",
132
+ "33",
133
+ "333",
134
+ "3h",
135
+ "4",
136
+ "4h",
137
+ "5",
138
+ "5h",
139
+ "6",
140
+ "6h",
141
+ "6h00",
142
+ "6h30",
143
+ "7",
144
+ "7h",
145
+ "7h45",
146
+ "8",
147
+ "8)",
148
+ "8-",
149
+ "8-)",
150
+ "8-D",
151
+ "8-d",
152
+ "8D",
153
+ "8d",
154
+ "8h",
155
+ "8h00",
156
+ "8h10",
157
+ "9",
158
+ "9h",
159
+ "9h15",
160
+ "9h30",
161
+ ":",
162
+ ":'(",
163
+ ":')",
164
+ ":'-(",
165
+ ":'-)",
166
+ ":(",
167
+ ":((",
168
+ ":(((",
169
+ ":()",
170
+ ":)",
171
+ ":))",
172
+ ":)))",
173
+ ":*",
174
+ ":-(",
175
+ ":-((",
176
+ ":-(((",
177
+ ":-)",
178
+ ":-))",
179
+ ":-)))",
180
+ ":-*",
181
+ ":-/",
182
+ ":-0",
183
+ ":-3",
184
+ ":->",
185
+ ":-D",
186
+ ":-O",
187
+ ":-P",
188
+ ":-X",
189
+ ":-]",
190
+ ":-d",
191
+ ":-o",
192
+ ":-p",
193
+ ":-x",
194
+ ":-|",
195
+ ":-}",
196
+ ":/",
197
+ ":0",
198
+ ":00",
199
+ ":1",
200
+ ":3",
201
+ ":30",
202
+ ":>",
203
+ ":D",
204
+ ":O",
205
+ ":P",
206
+ ":X",
207
+ ":]",
208
+ ":d",
209
+ ":o",
210
+ ":o)",
211
+ ":p",
212
+ ":x",
213
+ ":x)",
214
+ ":|",
215
+ ":}",
216
+ ";",
217
+ ";)",
218
+ ";-)",
219
+ ";-D",
220
+ ";-X",
221
+ ";-d",
222
+ ";D",
223
+ ";X",
224
+ ";_;",
225
+ ";d",
226
+ "<",
227
+ "<.<",
228
+ "</3",
229
+ "</d",
230
+ "<3",
231
+ "<33",
232
+ "<333",
233
+ "<d",
234
+ "<dd",
235
+ "<ddd",
236
+ "<space>",
237
+ "<xxxx>",
238
+ "=",
239
+ "=(",
240
+ "=)",
241
+ "=/",
242
+ "=3",
243
+ "=D",
244
+ "=X",
245
+ "=[",
246
+ "=]",
247
+ "=d",
248
+ "=|",
249
+ ">",
250
+ ">.<",
251
+ ">.>",
252
+ ">:(",
253
+ ">:o",
254
+ ">:x",
255
+ "><(((*>",
256
+ "@",
257
+ "@_@",
258
+ "A",
259
+ "ABC",
260
+ "AI",
261
+ "ASK",
262
+ "ATE",
263
+ "An",
264
+ "Anh",
265
+ "B",
266
+ "Ba",
267
+ "Backend",
268
+ "B\u00e1ch",
269
+ "B\u00ecnh",
270
+ "B\u1ea3y",
271
+ "B\u1ec7nh",
272
+ "C",
273
+ "C++",
274
+ "C.",
275
+ "CGV",
276
+ "CNTT",
277
+ "Chi\u1ec1u",
278
+ "Ch\u00fang",
279
+ "Ch\u01a1i",
280
+ "Ch\u1ecb",
281
+ "Ch\u1ee7",
282
+ "Cu\u1ed1i",
283
+ "C\u01b0\u1eddng",
284
+ "C\u1ea3",
285
+ "D",
286
+ "Data",
287
+ "Design",
288
+ "Dev",
289
+ "DevOps",
290
+ "Dung",
291
+ "D\u0169ng",
292
+ "D\u1ecdn",
293
+ "EIC",
294
+ "F",
295
+ "F.",
296
+ "FPT",
297
+ "Facebook",
298
+ "Frontend",
299
+ "G",
300
+ "G\u00f2n",
301
+ "H",
302
+ "Hai",
303
+ "Hoa",
304
+ "Ho\u00e0n",
305
+ "Ho\u00e0ng",
306
+ "Ho\u00e1",
307
+ "Huy",
308
+ "H\u00e0",
309
+ "H\u00f2a",
310
+ "H\u00f3a",
311
+ "H\u00f4m",
312
+ "H\u00f9ng",
313
+ "H\u01b0ng",
314
+ "H\u01b0\u01a1ng",
315
+ "H\u1ea1",
316
+ "H\u1ea1nh",
317
+ "H\u1ea3i",
318
+ "H\u1eb1ng",
319
+ "H\u1ecdc",
320
+ "IME",
321
+ "ION",
322
+ "K",
323
+ "K.",
324
+ "Khoa",
325
+ "Khuya",
326
+ "Kh\u1ea3i",
327
+ "L",
328
+ "LOCATION",
329
+ "Lan",
330
+ "Linh",
331
+ "L\u00e0m",
332
+ "L\u00e2m",
333
+ "L\u1ea1t",
334
+ "L\u1ecbch",
335
+ "M",
336
+ "Mai",
337
+ "Marketing",
338
+ "Minh",
339
+ "Mobile",
340
+ "M\u00f9ng",
341
+ "M\u1ed1t",
342
+ "N",
343
+ "NTT",
344
+ "Nam",
345
+ "Netflix",
346
+ "Nghe",
347
+ "Ng\u00e0y",
348
+ "Ng\u1ecdc",
349
+ "Ng\u1eef",
350
+ "Nh\u00f3m",
351
+ "Nh\u1eadt",
352
+ "N\u0103m",
353
+ "N\u1ea5u",
354
+ "N\u1eb5ng",
355
+ "N\u1ed9i",
356
+ "O",
357
+ "O.O",
358
+ "O.o",
359
+ "O_O",
360
+ "O_o",
361
+ "Ops",
362
+ "P",
363
+ "Ph\u00e1p",
364
+ "Ph\u00f2ng",
365
+ "Ph\u00fac",
366
+ "Ph\u01b0\u01a1ng",
367
+ "Ph\u01b0\u1edbc",
368
+ "Product",
369
+ "Python",
370
+ "Q",
371
+ "QA",
372
+ "Quang",
373
+ "Qu\u00e2n",
374
+ "R",
375
+ "ROOT",
376
+ "React",
377
+ "ReactJS",
378
+ "S",
379
+ "SON",
380
+ "Sinh",
381
+ "S\u00e0i",
382
+ "S\u00e1ng",
383
+ "S\u00e1u",
384
+ "S\u1eafp",
385
+ "S\u1ebfp",
386
+ "T",
387
+ "TASK",
388
+ "TOEIC",
389
+ "Team",
390
+ "Th\u00e1ng",
391
+ "Th\u1ea3o",
392
+ "Th\u1eafng",
393
+ "Th\u1ee7",
394
+ "Th\u1ee9",
395
+ "Tin",
396
+ "Ti\u1ebfng",
397
+ "To\u00e1n",
398
+ "Tr\u00e2m",
399
+ "Tr\u01b0a",
400
+ "Tu\u1ea5n",
401
+ "Tu\u1ea7n",
402
+ "T\u00e0u",
403
+ "T\u00f4i",
404
+ "T\u01b0",
405
+ "T\u1eadp",
406
+ "T\u1ed1i",
407
+ "V",
408
+ "V.V",
409
+ "V_V",
410
+ "Vi\u1ebft",
411
+ "Vi\u1ec7t",
412
+ "V\u0103n",
413
+ "V\u0169ng",
414
+ "V\u1eadt",
415
+ "X++",
416
+ "X.",
417
+ "X.X",
418
+ "X.x",
419
+ "XD",
420
+ "XDD",
421
+ "XX",
422
+ "XXX",
423
+ "XXXX",
424
+ "X_X",
425
+ "X_x",
426
+ "Xem",
427
+ "Xx",
428
+ "Xxx",
429
+ "XxxXxx",
430
+ "Xxxx",
431
+ "Xxxxx",
432
+ "XxxxxXX",
433
+ "Z",
434
+ "Zoom",
435
+ "[",
436
+ "[-:",
437
+ "[:",
438
+ "[=",
439
+ "\\",
440
+ "\\\")",
441
+ "\\n",
442
+ "\\t",
443
+ "\\x",
444
+ "]",
445
+ "]=",
446
+ "^",
447
+ "^_^",
448
+ "^__^",
449
+ "^___^",
450
+ "_*)",
451
+ "_-)",
452
+ "_.)",
453
+ "_<)",
454
+ "_^)",
455
+ "__-",
456
+ "__^",
457
+ "_\u00ac)",
458
+ "_\u0ca0)",
459
+ "a",
460
+ "a.",
461
+ "abc",
462
+ "ace",
463
+ "act",
464
+ "ai",
465
+ "ail",
466
+ "all",
467
+ "ame",
468
+ "an",
469
+ "ang",
470
+ "anh",
471
+ "ano",
472
+ "app",
473
+ "ase",
474
+ "ask",
475
+ "assignment",
476
+ "ata",
477
+ "auth",
478
+ "b",
479
+ "b.",
480
+ "ba",
481
+ "backend",
482
+ "ban",
483
+ "banh",
484
+ "bi\u1ec3n",
485
+ "buffet",
486
+ "bug",
487
+ "bu\u1ed5i",
488
+ "b\u00e0i",
489
+ "b\u00e0n",
490
+ "b\u00e1c",
491
+ "b\u00e1ch",
492
+ "b\u00e1n",
493
+ "b\u00e1nh",
494
+ "b\u00e1o",
495
+ "b\u00e1t",
496
+ "b\u00e8",
497
+ "b\u00e9",
498
+ "b\u00ecnh",
499
+ "b\u00f3ng",
500
+ "b\u01a1i",
501
+ "b\u1ea1n",
502
+ "b\u1ea3n",
503
+ "b\u1ea3o",
504
+ "b\u1ea3y",
505
+ "b\u1eaft",
506
+ "b\u1ec7nh",
507
+ "b\u1ecb",
508
+ "b\u1ed1",
509
+ "b\u1ed9",
510
+ "b\u1ee5i",
511
+ "c",
512
+ "c++",
513
+ "c.",
514
+ "ca",
515
+ "call",
516
+ "cao",
517
+ "ce>",
518
+ "cgv",
519
+ "chi\u1ec1u",
520
+ "cho",
521
+ "chung",
522
+ "chuy\u1ebfn",
523
+ "chuy\u1ec1n",
524
+ "chu\u1ea9n",
525
+ "ch\u00e1u",
526
+ "ch\u00ednh",
527
+ "ch\u00f3",
528
+ "ch\u00fang",
529
+ "ch\u01a1i",
530
+ "ch\u01b0\u01a1ng",
531
+ "ch\u1ea1y",
532
+ "ch\u1ecb",
533
+ "ch\u1ed1t",
534
+ "ch\u1ee3",
535
+ "ch\u1ee7",
536
+ "ch\u1ee9c",
537
+ "cntt",
538
+ "code",
539
+ "con",
540
+ "concert",
541
+ "cu\u1ed1i",
542
+ "cu\u1ed9c",
543
+ "c\u00e0",
544
+ "c\u00e0y",
545
+ "c\u00e1",
546
+ "c\u00e1c",
547
+ "c\u00e1o",
548
+ "c\u00e2y",
549
+ "c\u00f3",
550
+ "c\u00f4",
551
+ "c\u00f4ng",
552
+ "c\u00f9ng",
553
+ "c\u0103ng",
554
+ "c\u0169",
555
+ "c\u01a1m",
556
+ "c\u01b0\u1edbi",
557
+ "c\u01b0\u1eddng",
558
+ "c\u1ea3",
559
+ "c\u1ea7n",
560
+ "c\u1ea7u",
561
+ "c\u1eadp",
562
+ "c\u1ee7",
563
+ "c\u1ee7a",
564
+ "c\u1eeda",
565
+ "d",
566
+ "d)",
567
+ "d-",
568
+ "d-)",
569
+ "d-X",
570
+ "d.",
571
+ "d.d",
572
+ "d.x",
573
+ "d/d",
574
+ "d/dd",
575
+ "dX",
576
+ "d_d",
577
+ "d_x",
578
+ "data",
579
+ "database",
580
+ "date",
581
+ "dd",
582
+ "dd/d",
583
+ "dd/dd",
584
+ "dd:dd",
585
+ "ddd",
586
+ "ddx",
587
+ "ddxdd",
588
+ "deo",
589
+ "deploy",
590
+ "design",
591
+ "dev",
592
+ "devops",
593
+ "du",
594
+ "dung",
595
+ "dx",
596
+ "dxdd",
597
+ "d\u00e3",
598
+ "d\u0169ng",
599
+ "d\u01b0\u1ee1ng",
600
+ "d\u1ea1o",
601
+ "d\u1ea1y",
602
+ "d\u1ea7u",
603
+ "d\u1eabn",
604
+ "d\u1eady",
605
+ "d\u1eaft",
606
+ "d\u1eb9p",
607
+ "d\u1ecdn",
608
+ "d\u1ee5c",
609
+ "d\u1ee5ng",
610
+ "d\u1ef1",
611
+ "e",
612
+ "e.",
613
+ "eam",
614
+ "eic",
615
+ "em",
616
+ "email",
617
+ "end",
618
+ "ent",
619
+ "ert",
620
+ "est",
621
+ "f",
622
+ "f.",
623
+ "facebook",
624
+ "fet",
625
+ "fix",
626
+ "fpt",
627
+ "frontend",
628
+ "g",
629
+ "g.",
630
+ "game",
631
+ "ghe",
632
+ "gia",
633
+ "giao",
634
+ "gi\u00e1o",
635
+ "gi\u00e3n",
636
+ "gi\u1ea3ng",
637
+ "gi\u1eb7t",
638
+ "gi\u1edd",
639
+ "guitar",
640
+ "gym",
641
+ "g\u00e0y",
642
+ "g\u00e2n",
643
+ "g\u00f2n",
644
+ "g\u1eb7p",
645
+ "g\u1ecdc",
646
+ "g\u1ecdi",
647
+ "g\u1eedi",
648
+ "h",
649
+ "h.",
650
+ "h00",
651
+ "h10",
652
+ "h15",
653
+ "h20",
654
+ "h30",
655
+ "h45",
656
+ "h50",
657
+ "h59",
658
+ "hai",
659
+ "ham",
660
+ "hay",
661
+ "him",
662
+ "hip",
663
+ "hi\u1ec7u",
664
+ "hoa",
665
+ "hoan",
666
+ "hon",
667
+ "hop",
668
+ "ho\u00e0n",
669
+ "ho\u00e0ng",
670
+ "ho\u00e1",
671
+ "ho\u1ea1ch",
672
+ "ho\u1ea1t",
673
+ "huy",
674
+ "h\u00e0",
675
+ "h\u00e0ng",
676
+ "h\u00e1m",
677
+ "h\u00e1p",
678
+ "h\u00e1t",
679
+ "h\u00e1u",
680
+ "h\u00e2n",
681
+ "h\u00eam",
682
+ "h\u00ecnh",
683
+ "h\u00f2a",
684
+ "h\u00f3a",
685
+ "h\u00f3m",
686
+ "h\u00f4m",
687
+ "h\u00f9ng",
688
+ "h\u00fac",
689
+ "h\u00fat",
690
+ "h\u01a1i",
691
+ "h\u01b0ng",
692
+ "h\u01b0\u01a1ng",
693
+ "h\u01b0\u1edbng",
694
+ "h\u1ea1",
695
+ "h\u1ea1c",
696
+ "h\u1ea1n",
697
+ "h\u1ea1nh",
698
+ "h\u1ea1y",
699
+ "h\u1ea3i",
700
+ "h\u1ea3n",
701
+ "h\u1ea3o",
702
+ "h\u1ea7u",
703
+ "h\u1ea7y",
704
+ "h\u1ea9m",
705
+ "h\u1eadn",
706
+ "h\u1eadt",
707
+ "h\u1eafn",
708
+ "h\u1eb1ng",
709
+ "h\u1eb9n",
710
+ "h\u1ebft",
711
+ "h\u1ec7",
712
+ "h\u1ecdc",
713
+ "h\u1ecdp",
714
+ "h\u1ecfe",
715
+ "h\u1ed1t",
716
+ "h\u1ed3",
717
+ "h\u1ed9p",
718
+ "h\u1ee9c",
719
+ "h\u1ef1c",
720
+ "i",
721
+ "i.",
722
+ "iao",
723
+ "ide",
724
+ "iew",
725
+ "ign",
726
+ "ile",
727
+ "ine",
728
+ "ing",
729
+ "inh",
730
+ "int",
731
+ "ive",
732
+ "i\u00e1o",
733
+ "i\u00e3n",
734
+ "i\u00ean",
735
+ "i\u00eau",
736
+ "i\u1eb7t",
737
+ "i\u1ebft",
738
+ "i\u1ec1n",
739
+ "i\u1ec1u",
740
+ "i\u1ec3m",
741
+ "i\u1ec3n",
742
+ "i\u1ec3u",
743
+ "i\u1ec7c",
744
+ "i\u1ec7m",
745
+ "i\u1ec7n",
746
+ "i\u1ec7p",
747
+ "i\u1ec7t",
748
+ "i\u1ec7u",
749
+ "j",
750
+ "j.",
751
+ "k",
752
+ "k.",
753
+ "karaoke",
754
+ "khai",
755
+ "khi",
756
+ "khoa",
757
+ "khu",
758
+ "khuya",
759
+ "kh\u00e1ch",
760
+ "kh\u00e1m",
761
+ "kh\u00f3a",
762
+ "kh\u1ea3i",
763
+ "kh\u1ea3o",
764
+ "kh\u1ecfe",
765
+ "kia",
766
+ "ki\u1ec3m",
767
+ "km",
768
+ "k\u00e8m",
769
+ "k\u00fd",
770
+ "k\u1ebf",
771
+ "k\u1ef9",
772
+ "l",
773
+ "l.",
774
+ "lan",
775
+ "lax",
776
+ "lin",
777
+ "linh",
778
+ "live",
779
+ "livestream",
780
+ "lix",
781
+ "li\u00ean",
782
+ "li\u1ec7u",
783
+ "location",
784
+ "loy",
785
+ "luy\u1ec7n",
786
+ "lu\u1eadn",
787
+ "l\u00e0m",
788
+ "l\u00e2m",
789
+ "l\u00f4ng",
790
+ "l\u00fac",
791
+ "l\u00fd",
792
+ "l\u1ea1i",
793
+ "l\u1ea1t",
794
+ "l\u1ea9u",
795
+ "l\u1eadp",
796
+ "l\u1ecbch",
797
+ "l\u1ed7i",
798
+ "l\u1edbp",
799
+ "l\u1eddi",
800
+ "m",
801
+ "m.",
802
+ "mai",
803
+ "mail",
804
+ "marketing",
805
+ "minh",
806
+ "mobile",
807
+ "module",
808
+ "mua",
809
+ "mu\u1ed1n",
810
+ "mu\u1ed9n",
811
+ "m\u00e1y",
812
+ "m\u00ec",
813
+ "m\u00f4n",
814
+ "m\u00f9ng",
815
+ "m\u1ea5t",
816
+ "m\u1eb9",
817
+ "m\u1ec1m",
818
+ "m\u1ed1t",
819
+ "m\u1ed7i",
820
+ "m\u1edbi",
821
+ "n",
822
+ "n.",
823
+ "nam",
824
+ "nay",
825
+ "netflix",
826
+ "nghe",
827
+ "nghi\u1ec7m",
828
+ "nghi\u1ec7p",
829
+ "ngo\u00e0i",
830
+ "ngo\u1ea1i",
831
+ "ng\u00e0y",
832
+ "ng\u00e2n",
833
+ "ng\u01b0\u1eddi",
834
+ "ng\u1ecdc",
835
+ "ng\u1ee7",
836
+ "ng\u1eef",
837
+ "nha",
838
+ "nhanh",
839
+ "nh\u00e0",
840
+ "nh\u00e2n",
841
+ "nh\u00f3m",
842
+ "nh\u1ea1c",
843
+ "nh\u1eadn",
844
+ "nh\u1eadt",
845
+ "nh\u1eafn",
846
+ "nh\u1edb",
847
+ "nic",
848
+ "nit",
849
+ "ntt",
850
+ "n\u00e0y",
851
+ "n\u00e2ng",
852
+ "n\u0103m",
853
+ "n\u0103ng",
854
+ "n\u01b0\u1edbc",
855
+ "n\u1ea5u",
856
+ "n\u1eb5ng",
857
+ "n\u1ed9i",
858
+ "n\u1ed9p",
859
+ "n\u1eefa",
860
+ "o",
861
+ "o.",
862
+ "o.0",
863
+ "o.O",
864
+ "o.o",
865
+ "o_0",
866
+ "o_O",
867
+ "o_o",
868
+ "oan",
869
+ "ode",
870
+ "offline",
871
+ "oga",
872
+ "oke",
873
+ "ong",
874
+ "online",
875
+ "ook",
876
+ "oom",
877
+ "ops",
878
+ "o\u00e0i",
879
+ "o\u00e0n",
880
+ "o\u00e1n",
881
+ "o\u1ea1i",
882
+ "o\u1ea1n",
883
+ "o\u1ea1t",
884
+ "p",
885
+ "p.",
886
+ "person",
887
+ "pha",
888
+ "phim",
889
+ "phi\u00ean",
890
+ "ph\u00e1p",
891
+ "ph\u00ea",
892
+ "ph\u00f2ng",
893
+ "ph\u00fac",
894
+ "ph\u00fat",
895
+ "ph\u01b0\u01a1ng",
896
+ "ph\u01b0\u1edbc",
897
+ "ph\u1ea3i",
898
+ "ph\u1ea3n",
899
+ "ph\u1ea9m",
900
+ "ph\u1ecfng",
901
+ "ph\u1ed1",
902
+ "ph\u1edf",
903
+ "piano",
904
+ "picnic",
905
+ "product",
906
+ "pull",
907
+ "python",
908
+ "q",
909
+ "q.",
910
+ "qa",
911
+ "qua",
912
+ "quang",
913
+ "quanh",
914
+ "quen",
915
+ "qu\u00e1n",
916
+ "qu\u00e2n",
917
+ "qu\u00ean",
918
+ "qu\u00fd",
919
+ "qu\u1ea7n",
920
+ "qu\u1ed1c",
921
+ "r",
922
+ "r.",
923
+ "ra",
924
+ "rau",
925
+ "react",
926
+ "reactjs",
927
+ "relax",
928
+ "release",
929
+ "request",
930
+ "review",
931
+ "r\u00e1c",
932
+ "r\u00e2m",
933
+ "r\u00ean",
934
+ "r\u0103ng",
935
+ "r\u01b0a",
936
+ "r\u1ed3i",
937
+ "r\u1ed5",
938
+ "r\u1eeda",
939
+ "r\u1ef1c",
940
+ "s",
941
+ "s.",
942
+ "sau",
943
+ "server",
944
+ "ship",
945
+ "sinh",
946
+ "si\u00eau",
947
+ "slide",
948
+ "so\u1ea1n",
949
+ "space",
950
+ "sprint",
951
+ "stream",
952
+ "s\u00e0i",
953
+ "s\u00e1ch",
954
+ "s\u00e1ng",
955
+ "s\u00e1u",
956
+ "s\u00e2n",
957
+ "s\u01a1",
958
+ "s\u1eafp",
959
+ "s\u1ebd",
960
+ "s\u1ebfp",
961
+ "s\u1edbm",
962
+ "s\u1ee9c",
963
+ "s\u1eed",
964
+ "s\u1eeda",
965
+ "s\u1eefa",
966
+ "t",
967
+ "t.",
968
+ "tJS",
969
+ "tar",
970
+ "task",
971
+ "team",
972
+ "test",
973
+ "tham",
974
+ "thanh",
975
+ "thay",
976
+ "thi",
977
+ "tho\u1ea1i",
978
+ "thu",
979
+ "thuy\u1ebft",
980
+ "thu\u1ed1c",
981
+ "th\u00e0nh",
982
+ "th\u00e1ng",
983
+ "th\u00eam",
984
+ "th\u00ed",
985
+ "th\u01b0",
986
+ "th\u1ea3o",
987
+ "th\u1ea7u",
988
+ "th\u1ea7y",
989
+ "th\u1eafng",
990
+ "th\u1ec3",
991
+ "th\u1ecb",
992
+ "th\u1ed1ng",
993
+ "th\u1ee7",
994
+ "th\u1ee9",
995
+ "th\u1ef1c",
996
+ "time",
997
+ "tin",
998
+ "ti\u1ebfng",
999
+ "ti\u1ec1n",
1000
+ "ti\u1ec3u",
1001
+ "ti\u1ec7c",
1002
+ "tjs",
1003
+ "toeic",
1004
+ "to\u00e1n",
1005
+ "tra",
1006
+ "training",
1007
+ "tri\u1ec3n",
1008
+ "trong",
1009
+ "trung",
1010
+ "truy\u1ec1n",
1011
+ "tr\u00e0",
1012
+ "tr\u00e2m",
1013
+ "tr\u00ean",
1014
+ "tr\u00ecnh",
1015
+ "tr\u01b0a",
1016
+ "tr\u01b0\u1edbc",
1017
+ "tr\u01b0\u1eddng",
1018
+ "tr\u1ea3",
1019
+ "tr\u1ef1c",
1020
+ "tuy\u1ebfn",
1021
+ "tu\u1ea5n",
1022
+ "tu\u1ea7n",
1023
+ "ty",
1024
+ "t\u00e0i",
1025
+ "t\u00e0u",
1026
+ "t\u00e1c",
1027
+ "t\u00e2m",
1028
+ "t\u00f4i",
1029
+ "t\u01b0",
1030
+ "t\u01b0\u1edbi",
1031
+ "t\u1ea1i",
1032
+ "t\u1eadp",
1033
+ "t\u1eb7ng",
1034
+ "t\u1ebf",
1035
+ "t\u1ed1i",
1036
+ "t\u1ed5",
1037
+ "t\u1edbi",
1038
+ "t\u1ee5",
1039
+ "t\u1ee7",
1040
+ "t\u1ee9c",
1041
+ "t\u1eeb",
1042
+ "u",
1043
+ "u.",
1044
+ "uct",
1045
+ "uen",
1046
+ "ule",
1047
+ "ull",
1048
+ "ung",
1049
+ "unit",
1050
+ "uth",
1051
+ "uya",
1052
+ "u\u00e1n",
1053
+ "u\u00e2n",
1054
+ "u\u00ean",
1055
+ "u\u1ea5n",
1056
+ "u\u1ea7n",
1057
+ "u\u1ea9n",
1058
+ "u\u1eadn",
1059
+ "u\u1ed1c",
1060
+ "u\u1ed1i",
1061
+ "u\u1ed1n",
1062
+ "u\u1ed1ng",
1063
+ "u\u1ed5i",
1064
+ "u\u1ed9c",
1065
+ "u\u1ed9n",
1066
+ "v",
1067
+ "v.",
1068
+ "v.v",
1069
+ "v_v",
1070
+ "ver",
1071
+ "video",
1072
+ "violin",
1073
+ "vi\u00ean",
1074
+ "vi\u1ebft",
1075
+ "vi\u1ec7c",
1076
+ "vi\u1ec7n",
1077
+ "vi\u1ec7t",
1078
+ "v\u00e0",
1079
+ "v\u00e0o",
1080
+ "v\u0103n",
1081
+ "v\u0169ng",
1082
+ "v\u01b0\u1eddn",
1083
+ "v\u1ea5n",
1084
+ "v\u1eadt",
1085
+ "v\u1ebd",
1086
+ "v\u1ec1",
1087
+ "v\u1edbi",
1088
+ "w",
1089
+ "w.",
1090
+ "workshop",
1091
+ "x",
1092
+ "x.",
1093
+ "x.X",
1094
+ "x.d",
1095
+ "x.x",
1096
+ "xD",
1097
+ "xDD",
1098
+ "xX",
1099
+ "xXX",
1100
+ "x_X",
1101
+ "x_d",
1102
+ "x_x",
1103
+ "xd",
1104
+ "xdd",
1105
+ "xe",
1106
+ "xem",
1107
+ "xin",
1108
+ "xx",
1109
+ "xxx",
1110
+ "xxxx",
1111
+ "x\u00e1c",
1112
+ "x\u1ea1",
1113
+ "x\u1ebfp",
1114
+ "x\ufe35x",
1115
+ "y",
1116
+ "y.",
1117
+ "yoga",
1118
+ "y\u00eau",
1119
+ "y\u1ebfn",
1120
+ "y\u1ebft",
1121
+ "y\u1ec1n",
1122
+ "y\u1ec7n",
1123
+ "z",
1124
+ "z.",
1125
+ "zoom",
1126
+ "|",
1127
+ "}",
1128
+ "\u00a0",
1129
+ "\u00ac",
1130
+ "\u00ac_\u00ac",
1131
+ "\u00af",
1132
+ "\u00af\\(x)/\u00af",
1133
+ "\u00af\\(\u30c4)/\u00af",
1134
+ "\u00b0",
1135
+ "\u00b0C.",
1136
+ "\u00b0F.",
1137
+ "\u00b0K.",
1138
+ "\u00b0X.",
1139
+ "\u00b0c.",
1140
+ "\u00b0f.",
1141
+ "\u00b0k.",
1142
+ "\u00b0x.",
1143
+ "\u00d4",
1144
+ "\u00d4n",
1145
+ "\u00e0ng",
1146
+ "\u00e0nh",
1147
+ "\u00e1",
1148
+ "\u00e1ch",
1149
+ "\u00e1n",
1150
+ "\u00e1ng",
1151
+ "\u00e1nh",
1152
+ "\u00e1o",
1153
+ "\u00e2ng",
1154
+ "\u00e4",
1155
+ "\u00e4.",
1156
+ "\u00ecnh",
1157
+ "\u00ednh",
1158
+ "\u00f2ng",
1159
+ "\u00f3ng",
1160
+ "\u00f4",
1161
+ "\u00f4n",
1162
+ "\u00f4ng",
1163
+ "\u00f6",
1164
+ "\u00f6.",
1165
+ "\u00f9ng",
1166
+ "\u00fang",
1167
+ "\u00fc",
1168
+ "\u00fc.",
1169
+ "\u0103",
1170
+ "\u0103n",
1171
+ "\u0103ng",
1172
+ "\u0110",
1173
+ "\u0110i",
1174
+ "\u0110\u00e0",
1175
+ "\u0110\u1ecba",
1176
+ "\u0110\u1ecdc",
1177
+ "\u0110\u1ee9c",
1178
+ "\u0111",
1179
+ "\u0111a",
1180
+ "\u0111em",
1181
+ "\u0111i",
1182
+ "\u0111i\u1ec7n",
1183
+ "\u0111\u00e0",
1184
+ "\u0111\u00e0n",
1185
+ "\u0111\u00e1",
1186
+ "\u0111\u00ecnh",
1187
+ "\u0111\u00f3n",
1188
+ "\u0111\u00f3ng",
1189
+ "\u0111\u01a1n",
1190
+ "\u0111\u01b0a",
1191
+ "\u0111\u1ea7u",
1192
+ "\u0111\u1eb7t",
1193
+ "\u0111\u1ebfn",
1194
+ "\u0111\u1ec1",
1195
+ "\u0111\u1ec3",
1196
+ "\u0111\u1ecba",
1197
+ "\u0111\u1ecdc",
1198
+ "\u0111\u1ed1i",
1199
+ "\u0111\u1ed3",
1200
+ "\u0111\u1ed3ng",
1201
+ "\u0111\u1ed5",
1202
+ "\u0111\u1ed9i",
1203
+ "\u0111\u1ee9c",
1204
+ "\u0169ng",
1205
+ "\u01a1ng",
1206
+ "\u01b0ng",
1207
+ "\u01b0\u1edbc",
1208
+ "\u01b0\u1edbi",
1209
+ "\u01b0\u1eddi",
1210
+ "\u01b0\u1eddn",
1211
+ "\u0ca0",
1212
+ "\u0ca0_\u0ca0",
1213
+ "\u0ca0\ufe35\u0ca0",
1214
+ "\u1ea1ch",
1215
+ "\u1ea1nh",
1216
+ "\u1ea3ng",
1217
+ "\u1eafng",
1218
+ "\u1eb1ng",
1219
+ "\u1eb5ng",
1220
+ "\u1eb7ng",
1221
+ "\u1ebfng",
1222
+ "\u1ec7nh",
1223
+ "\u1ecbch",
1224
+ "\u1ecfng",
1225
+ "\u1ed1ng",
1226
+ "\u1ed3ng",
1227
+ "\u1edbng",
1228
+ "\u1eddng",
1229
+ "\u1edf",
1230
+ "\u1ee1ng",
1231
+ "\u1ee5ng",
1232
+ "\u1ee9",
1233
+ "\u1ee9ng",
1234
+ "\u2014",
1235
+ "\u2501",
1236
+ "\u253b",
1237
+ "\u253b\u2501\u253b",
1238
+ "\u256f",
1239
+ "\u25a1",
1240
+ "\ufe35",
1241
+ "\uff09"
1242
+ ]
vocab/vectors ADDED
Binary file (128 Bytes). View file
 
vocab/vectors.cfg ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "mode":"default"
3
+ }