diff --git "a/data/Niger-Congo.json" "b/data/Niger-Congo.json" --- "a/data/Niger-Congo.json" +++ "b/data/Niger-Congo.json" @@ -53,18 +53,7 @@ "name": "Bijago", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"wo\")", - "original_lang_name": "wolof", - "original_lang_code": "wol", - "scripts": [ - "Latn" - ], - "class_name": "StanzaTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bijag\u00f3", @@ -119,18 +108,7 @@ "name": "Balant-Ganja", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"wo\")", - "original_lang_name": "wolof", - "original_lang_code": "wol", - "scripts": [ - "Latn" - ], - "class_name": "StanzaTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Balanta-Ganja", @@ -178,18 +156,7 @@ "name": "Bayot", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"wo\")", - "original_lang_name": "wolof", - "original_lang_code": "wol", - "scripts": [ - "Latn" - ], - "class_name": "StanzaTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bayot", @@ -299,18 +266,7 @@ "name": "Her-Ejamat", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"wo\")", - "original_lang_name": "wolof", - "original_lang_code": "wol", - "scripts": [ - "Latn" - ], - "class_name": "StanzaTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Jola-Felupe", @@ -718,18 +674,7 @@ "name": "Banyun", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"wo\")", - "original_lang_name": "wolof", - "original_lang_code": "wol", - "scripts": [ - "Latn" - ], - "class_name": "StanzaTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bainouk-Gunyu\u00f1o", @@ -770,18 +715,7 @@ "name": "Nun", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"wo\")", - "original_lang_name": "wolof", - "original_lang_code": "wol", - "scripts": [ - "Latn" - ], - "class_name": "StanzaTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kasanga", @@ -928,18 +862,7 @@ "name": "Mbulungish-Nalu", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"wo\")", - "original_lang_name": "wolof", - "original_lang_code": "wol", - "scripts": [ - "Latn" - ], - "class_name": "StanzaTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mbulungish", @@ -1259,18 +1182,7 @@ "name": "Western", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"wo\")", - "original_lang_name": "wolof", - "original_lang_code": "wol", - "scripts": [ - "Latn" - ], - "class_name": "StanzaTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Pulaar", @@ -1517,35 +1429,13 @@ "name": "Bullom", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"wo\")", - "original_lang_name": "wolof", - "original_lang_code": "wol", - "scripts": [ - "Latn" - ], - "class_name": "StanzaTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Northern", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"wo\")", - "original_lang_name": "wolof", - "original_lang_code": "wol", - "scripts": [ - "Latn" - ], - "class_name": "StanzaTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bom-Kim", @@ -1576,18 +1466,7 @@ "name": "Southern", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"wo\")", - "original_lang_name": "wolof", - "original_lang_code": "wol", - "scripts": [ - "Latn" - ], - "class_name": "StanzaTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Sherbro", @@ -1686,18 +1565,7 @@ "name": "Gola", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"wo\")", - "original_lang_name": "wolof", - "original_lang_code": "wol", - "scripts": [ - "Latn" - ], - "class_name": "StanzaTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Gola", @@ -1895,18 +1763,7 @@ "name": "Sua", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"wo\")", - "original_lang_name": "wolof", - "original_lang_code": "wol", - "scripts": [ - "Latn" - ], - "class_name": "StanzaTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mansoanka", @@ -1937,35 +1794,13 @@ "name": "Ijoid", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Defaka", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Defaka", @@ -1986,35 +1821,13 @@ "name": "Ijo", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "East", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ijo, Southeast", @@ -2035,35 +1848,13 @@ "name": "Eastern", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Northeastern", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Nkoroo", @@ -2079,18 +1870,7 @@ "name": "Eastern", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ibani", @@ -2141,35 +1921,13 @@ "name": "West", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Inland Ijo", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Biseni", @@ -2215,18 +1973,7 @@ "name": "West Ijo", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Izon", @@ -2291,18 +2038,7 @@ "name": "Akpes", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Akpes", @@ -2357,18 +2093,7 @@ "name": "Dakoid", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Samba Daka", @@ -2429,18 +2154,7 @@ "name": "Fam", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Fam", @@ -2495,18 +2209,7 @@ "name": "Konja", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kwanja", @@ -2537,18 +2240,7 @@ "name": "Magu-Kamkam-Kila", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mbongno", @@ -2667,18 +2359,7 @@ "name": "Njerup", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Njerep", @@ -2704,18 +2385,7 @@ "name": "Ndoro", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ndoola", @@ -2753,18 +2423,7 @@ "name": "Suga", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Nizaa", @@ -3157,35 +2816,13 @@ "name": "Jarawan", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Cameroon", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Nagumi", @@ -3216,18 +2853,7 @@ "name": "Nigerian", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mbat", @@ -3451,18 +3077,7 @@ "name": "Mbe", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mbe", @@ -3534,18 +3149,7 @@ "name": "Bembe-Buyi (D.54)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bembe", @@ -3566,18 +3170,7 @@ "name": "Bembe-Buyi (D.55)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Buyu", @@ -3598,18 +3191,7 @@ "name": "Bira-Nyali (D.301)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kari", @@ -3630,18 +3212,7 @@ "name": "Bira-Nyali (D.302)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Boguru", @@ -3662,18 +3233,7 @@ "name": "Bira-Nyali (D.303)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ngbinda", @@ -3694,18 +3254,7 @@ "name": "Bira-Nyali (D.304)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Homa", @@ -3726,18 +3275,7 @@ "name": "Bira-Nyali (D.305)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Nyanga-li", @@ -3758,18 +3296,7 @@ "name": "Bira-Nyali (D.307)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mayeka", @@ -3790,18 +3317,7 @@ "name": "Bira-Nyali (D.308)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bodo", @@ -3822,18 +3338,7 @@ "name": "Bira-Nyali (D.31)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bhele", @@ -3854,18 +3359,7 @@ "name": "Bira-Nyali (D.311)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bila", @@ -3886,18 +3380,7 @@ "name": "Bira-Nyali (D.312)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kaiku", @@ -3918,18 +3401,7 @@ "name": "Bira-Nyali (D.32)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bira", @@ -3950,18 +3422,7 @@ "name": "Bira-Nyali (D.33)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Nyali", @@ -3982,18 +3443,7 @@ "name": "Bira-Nyali (D.331)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Vanuma", @@ -4014,18 +3464,7 @@ "name": "Bira-Nyali (D.332)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Budu", @@ -4046,18 +3485,7 @@ "name": "Bira-Nyali (D.333)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ndaka", @@ -4078,18 +3506,7 @@ "name": "Bira-Nyali (D.334)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mbo", @@ -4110,18 +3527,7 @@ "name": "Bira-Nyali (D.335)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Beeke", @@ -4142,18 +3548,7 @@ "name": "Bira-Nyali (D.336)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ngbee", @@ -4174,18 +3569,7 @@ "name": "Lega-Holoholo (D.201)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Lika", @@ -4206,18 +3590,7 @@ "name": "Lega-Holoholo (D.21)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bali", @@ -4238,18 +3611,7 @@ "name": "Lega-Holoholo (D.211)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kango", @@ -4270,18 +3632,7 @@ "name": "Lega-Holoholo (D.22)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Amba", @@ -4302,18 +3653,7 @@ "name": "Lega-Holoholo (D.23)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Komo", @@ -4334,18 +3674,7 @@ "name": "Lega-Holoholo (D.24)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Songoora", @@ -4456,18 +3785,7 @@ "name": "Lega-Holoholo (D.251)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kanu", @@ -4498,18 +3816,7 @@ "name": "Lega-Holoholo (D.26)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Zimba", @@ -4530,18 +3837,7 @@ "name": "Lega-Holoholo (D.27)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bangubangu", @@ -4562,18 +3858,7 @@ "name": "Lega-Holoholo (D.28)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Holoholo", @@ -4594,18 +3879,7 @@ "name": "Mbole-Enya (D.11)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mbole", @@ -4626,18 +3900,7 @@ "name": "Mbole-Enya (D.12)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Lengola", @@ -4658,18 +3921,7 @@ "name": "Mbole-Enya (D.13)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mituku", @@ -4690,18 +3942,7 @@ "name": "Mbole-Enya (D.14)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Enya", @@ -4722,18 +3963,7 @@ "name": "Mbolle-Enya (D.141)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Zula", @@ -4754,18 +3984,7 @@ "name": "Nyanga (D.43)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Nyanga", @@ -4931,18 +4150,7 @@ "name": "Chaga (E.623)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Rombo", @@ -4963,18 +4171,7 @@ "name": "Chaga (E.64)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kahe", @@ -4995,18 +4192,7 @@ "name": "Chaga (E.65)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Gweno", @@ -5072,18 +4258,7 @@ "name": "Kikuyu-Kamba (E.52)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kiembu", @@ -5149,18 +4324,7 @@ "name": "Kikuyu-Kamba (E.531)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mwimbi-Muthambi", @@ -5226,18 +4390,7 @@ "name": "Kikuyu-Kamba (E.541)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Gichuka", @@ -5303,18 +4456,7 @@ "name": "Kikuyu-Kamba (E.56)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Dhaiso", @@ -5335,18 +4477,7 @@ "name": "Nyika-Taita (E.701)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kiwilwana", @@ -5535,18 +4666,7 @@ "name": "Nyika-Taita (E.731)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Segeju", @@ -5567,18 +4687,7 @@ "name": "Nyika-Taita (E.74)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Dawida", @@ -5609,18 +4718,7 @@ "name": "Nyika-Taita (E.741)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Sagalla", @@ -5641,18 +4739,7 @@ "name": "Temi (E.46)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Temi", @@ -5805,18 +4892,7 @@ "name": "Nilamba-Rangi (F.33)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Rangi", @@ -5837,18 +4913,7 @@ "name": "Nilamba-Rangi (F.34)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mbugwe", @@ -5914,18 +4979,7 @@ "name": "Sukuma-Nyamwezi (F.22)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Konongo", @@ -5956,18 +5010,7 @@ "name": "Sukuma-Nyamwezi (F.23)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Sumbwa", @@ -5988,18 +5031,7 @@ "name": "Sukuma-Nyamwezi (F.24)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kimbu", @@ -6020,18 +5052,7 @@ "name": "Sukuma-Nyamwezi (F.25)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bungu", @@ -6052,18 +5073,7 @@ "name": "Tongwe-Bende (F.11)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Tongwe", @@ -6084,18 +5094,7 @@ "name": "Tongwe-Bende (F.12)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bende", @@ -6138,18 +5137,7 @@ "name": "Bena-Kinga (G.61)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Sangu", @@ -6215,18 +5203,7 @@ "name": "Bena-Kinga (G.63)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bena", @@ -6257,18 +5234,7 @@ "name": "Bena-Kinga (G.64)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Pangwa", @@ -6289,18 +5255,7 @@ "name": "Bena-Kinga (G.65)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kinga", @@ -6321,18 +5276,7 @@ "name": "Bena-Kinga (G.651)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Magoma", @@ -6353,18 +5297,7 @@ "name": "Bena-Kinga (G.66)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Vwanji", @@ -6385,18 +5318,7 @@ "name": "Bena-Kinga (G.67)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kisi", @@ -6597,18 +5519,7 @@ "name": "Shambala (G.22)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Asu", @@ -6674,18 +5585,7 @@ "name": "Shambala (G.24)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bondei", @@ -6751,18 +5651,7 @@ "name": "Swahili (G.402)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Makwe", @@ -6961,18 +5850,7 @@ "name": "Zigula-Zaramo (G.301)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Doe", @@ -7038,18 +5916,7 @@ "name": "Zigula-Zaramo (G.311)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mushungulu", @@ -7115,18 +5982,7 @@ "name": "Zigula-Zaramo (G.33)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Zaramo", @@ -7237,18 +6093,7 @@ "name": "Zigula-Zaramo (G.36)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kami", @@ -7359,18 +6204,7 @@ "name": "Zigula-Zaramo (G.39)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Sagala", @@ -7458,18 +6292,7 @@ "name": "Kikongo (H.112)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Doondo", @@ -7500,18 +6323,7 @@ "name": "Kikongo (H.12)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Vili", @@ -7532,18 +6344,7 @@ "name": "Kikongo (H.13)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kunyi", @@ -7564,18 +6365,7 @@ "name": "Kikongo (H.131)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Suundi", @@ -7765,18 +6555,7 @@ "name": "Kimbundu (H.23)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kibala", @@ -7797,18 +6576,7 @@ "name": "Kimbundu (H.24)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Songo", @@ -7829,18 +6597,7 @@ "name": "Mbala-Hunganna (H.41)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mbala", @@ -7861,18 +6618,7 @@ "name": "Mbala-Hunganna (H.42)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Hungana", @@ -7893,18 +6639,7 @@ "name": "Yaka (H.31)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Lonzo", @@ -7945,18 +6680,7 @@ "name": "Yaka (H.32)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Hungu", @@ -7987,18 +6711,7 @@ "name": "Yaka (H.321)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Sonde", @@ -8019,18 +6732,7 @@ "name": "Yaka (H.34)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mbangala", @@ -8073,18 +6775,7 @@ "name": "Haya-Jita (E.20)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Subi", @@ -8105,18 +6796,7 @@ "name": "Haya-Jita (E.21)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Nyambo", @@ -8182,18 +6862,7 @@ "name": "Haya-Jita (E.23)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Zinza", @@ -8214,18 +6883,7 @@ "name": "Haya-Jita (E.24)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kerewe", @@ -8246,18 +6904,7 @@ "name": "Haya-Jita (E.25)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Jita", @@ -8278,18 +6925,7 @@ "name": "Haya-Jita (E.251)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kwaya", @@ -8310,18 +6946,7 @@ "name": "Haya-Jita (E.252)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kara", @@ -8342,18 +6967,7 @@ "name": "Konzo-Ndandi (D.40)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kobo", @@ -8464,18 +7078,7 @@ "name": "Logooli-Kuria (E.401)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ngoreme", @@ -8496,18 +7099,7 @@ "name": "Logooli-Kuria (E.402)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ikizu", @@ -8573,18 +7165,7 @@ "name": "Logooli-Kuria (E.405)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kabwa", @@ -8605,18 +7186,7 @@ "name": "Logooli-Kuria (E.406)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Singa", @@ -8637,18 +7207,7 @@ "name": "Logooli-Kuria (E.41)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Lulogooli", @@ -8669,18 +7228,7 @@ "name": "Logooli-Kuria (E.411)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Luidakho-Luisukha-Lutirichi", @@ -8791,18 +7339,7 @@ "name": "Logooli-Kuria (E.431)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Suba-Simbiti", @@ -8823,18 +7360,7 @@ "name": "Logooli-Kuria (E.44)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Zanaki", @@ -8855,18 +7381,7 @@ "name": "Logooli-Kuria (E.45)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ikoma-Nata-Isenye", @@ -9047,18 +7562,7 @@ "name": "Masaba-Luhya (E.33)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Olunyole", @@ -9124,18 +7628,7 @@ "name": "Masaba-Luhya (E.341)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Olukhayo", @@ -9156,18 +7649,7 @@ "name": "Masaba-Luhya (E.342)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Olumarachi", @@ -9323,18 +7805,7 @@ "name": "Nyoro-Ganda (E.103)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ruruuli-Runyala", @@ -9445,18 +7916,7 @@ "name": "Nyoro-Ganda (E.121)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Hema", @@ -9802,18 +8262,7 @@ "name": "Ruanda-Rundi (D.63)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Fuliiru", @@ -9834,18 +8283,7 @@ "name": "Ruanda-Rundi (D.631)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kiviila", @@ -9866,18 +8304,7 @@ "name": "Ruanda-Rundi (D.64)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Shubi", @@ -9898,18 +8325,7 @@ "name": "Ruanda-Rundi (D.65)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Hangaza", @@ -9930,18 +8346,7 @@ "name": "Ruanda-Rundi (D.66)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ha", @@ -9983,18 +8388,7 @@ "name": "Shi-Hunde (D.501)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Nyindu", @@ -10015,18 +8409,7 @@ "name": "Shi-Hunde (D.51)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Hunde", @@ -10137,18 +8520,7 @@ "name": "Shi-Hunde (D.531)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Tembo", @@ -10169,18 +8541,7 @@ "name": "Shi-Hunde (D.56)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"lg\")", - "original_lang_name": "ganda", - "original_lang_code": "lug", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kabwari", @@ -10323,18 +8684,7 @@ "name": "Ciokwe-Luchazi (K.13)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Luchazi", @@ -10445,18 +8795,7 @@ "name": "Ciokwe-Luchazi (K.16)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Nyengo", @@ -10487,18 +8826,7 @@ "name": "Ciokwe-Luchazi (K.17)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mbwela", @@ -10519,18 +8847,7 @@ "name": "Ciokwe-Luchazi (K.18)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Nkangala", @@ -10596,18 +8913,7 @@ "name": "Luyana (K.31)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Luyana", @@ -10628,18 +8934,7 @@ "name": "Luyana (K.32)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mbowe", @@ -10795,18 +9090,7 @@ "name": "Luyana (K.34)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mashi", @@ -10827,18 +9111,7 @@ "name": "Luyana (K.35)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Simaa", @@ -10859,18 +9132,7 @@ "name": "Subiya-Totela (K.402)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Fwe", @@ -10891,18 +9153,7 @@ "name": "Subiya-Totela (K.41)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Totela", @@ -11170,18 +9421,7 @@ "name": "Luba (L.34)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Hemba", @@ -11202,18 +9442,7 @@ "name": "Luba (L.35)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Sanga", @@ -11234,18 +9463,7 @@ "name": "Lunda (L.51)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Salampasu", @@ -11356,18 +9574,7 @@ "name": "Nkoya (L.60)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Nkoya", @@ -11433,18 +9640,7 @@ "name": "Pende (L.12)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Holu", @@ -11475,18 +9671,7 @@ "name": "Pende (L.13)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kwese", @@ -11507,18 +9692,7 @@ "name": "Songe (L.21)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kete", @@ -11539,18 +9713,7 @@ "name": "Songe (L.221)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Lwalu", @@ -11616,18 +9779,7 @@ "name": "Songe (L.231)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bindji", @@ -11648,18 +9800,7 @@ "name": "Songe (L.24)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Luna", @@ -11702,18 +9843,7 @@ "name": "Bemba (M.401)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bwile", @@ -11734,18 +9864,7 @@ "name": "Bemba (M.402)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Aushi", @@ -11856,18 +9975,7 @@ "name": "Fipa-Mambwe (M.11)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Pimbwe", @@ -11888,18 +9996,7 @@ "name": "Fipa-Mambwe (M.12)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Rungwa", @@ -11920,18 +10017,7 @@ "name": "Fipa-Mambwe (M.13)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Fipa", @@ -11997,18 +10083,7 @@ "name": "Lala-Bisa-Lamba (M.51)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Lala-Bisa", @@ -12074,18 +10149,7 @@ "name": "Lala-Bisa-Lamba (M.55)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Seba", @@ -12241,18 +10305,7 @@ "name": "Lenje-Tonga (M.631)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Sala", @@ -12463,18 +10516,7 @@ "name": "Nyiha-Safwa (M.21)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Wanda", @@ -12540,18 +10582,7 @@ "name": "Nyiha-Safwa (M.23)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Nyiha, Tanzania", @@ -12602,18 +10633,7 @@ "name": "Nyiha-Safwa (M.24)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Malila", @@ -12634,18 +10654,7 @@ "name": "Nyiha-Safwa (M.25)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Safwa", @@ -12733,18 +10742,7 @@ "name": "Manda (N.101)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ndendeule", @@ -12775,18 +10773,7 @@ "name": "Manda (N.102)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Nindi", @@ -12807,18 +10794,7 @@ "name": "Manda (N.11)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Manda", @@ -12839,18 +10815,7 @@ "name": "Manda (N.12)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Chingoni", @@ -12881,18 +10846,7 @@ "name": "Manda (N.13)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Matengo", @@ -12913,18 +10867,7 @@ "name": "Manda (N.14)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mpoto", @@ -13058,18 +11001,7 @@ "name": "Senga-Sena (N.42)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kunda", @@ -13235,18 +11167,7 @@ "name": "Tumbuka (N.201)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mwera", @@ -13592,18 +11513,7 @@ "name": "Makhuwa (P.312)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Nathembo", @@ -13669,18 +11579,7 @@ "name": "Makhuwa (P.331)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Lomwe, Malawi", @@ -13756,18 +11655,7 @@ "name": "Makhuwa (P.341)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Makhuwa-Moniga", @@ -13788,18 +11676,7 @@ "name": "Matuumbi (P.11)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ndengereko", @@ -13820,18 +11697,7 @@ "name": "Matuumbi (P.12)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Rufiji", @@ -13852,18 +11718,7 @@ "name": "Matuumbi (P.13)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Matumbi", @@ -13929,18 +11784,7 @@ "name": "Matuumbi (P.15)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mbunga", @@ -14006,18 +11850,7 @@ "name": "Yao (P.22)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mwera", @@ -14103,18 +11936,7 @@ "name": "Yao (P.24)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ndonde Hamba", @@ -14247,18 +12069,7 @@ "name": "Umbundu (R.101)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ngendelengo", @@ -14334,18 +12145,7 @@ "name": "Umbundu (R.12)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ndombe", @@ -14421,18 +12221,7 @@ "name": "Umbundu (R.14)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Nkumbi", @@ -14498,18 +12287,7 @@ "name": "Wambo (R.214)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mbalanhu", @@ -14575,18 +12353,7 @@ "name": "Wambo (R.23)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kwambi", @@ -14607,18 +12374,7 @@ "name": "Wambo (R.24)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ngandjera", @@ -14639,18 +12395,7 @@ "name": "Yeyi (R.41)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Yeyi", @@ -15063,18 +12808,7 @@ "name": "Shona (S.11)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Tawara", @@ -15295,18 +13029,7 @@ "name": "Sotho-Tswana (S.311)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kgalagadi", @@ -15661,18 +13384,7 @@ "name": "Bafia (A.501)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Hijuk", @@ -15693,18 +13405,7 @@ "name": "Bafia (A.51)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Lefa", @@ -15725,18 +13426,7 @@ "name": "Bafia (A.52)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Dimbong", @@ -15802,18 +13492,7 @@ "name": "Bafia (A.54)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Tibea", @@ -15834,18 +13513,7 @@ "name": "Basaa (A.41)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Barombi", @@ -15866,18 +13534,7 @@ "name": "Basaa (A.42)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bankon", @@ -15953,18 +13610,7 @@ "name": "Basaa (A.44)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Tunen", @@ -15985,18 +13631,7 @@ "name": "Basaa (A.45)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Nyokon", @@ -16062,18 +13697,7 @@ "name": "Basaa (A.461)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Tuotomb", @@ -16139,18 +13763,7 @@ "name": "Bubi-Benga (A.31)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bubia", @@ -16181,18 +13794,7 @@ "name": "Bubi-Benga (A.32)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Batanga", @@ -16213,18 +13815,7 @@ "name": "Bubi-Benga (A.33)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kombe", @@ -16255,18 +13846,7 @@ "name": "Bubi-Benga (A.34)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Benga", @@ -16287,18 +13867,7 @@ "name": "Duala (A.21)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Wumboko", @@ -16319,18 +13888,7 @@ "name": "Duala (A.22)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mokpwe", @@ -16351,18 +13909,7 @@ "name": "Duala (A.23)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Isubu", @@ -16383,18 +13930,7 @@ "name": "Duala (A.231)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bakole", @@ -16460,18 +13996,7 @@ "name": "Duala (A.27)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mulimba", @@ -16592,18 +14117,7 @@ "name": "Ewondo-Fang (A.73)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bebele", @@ -16724,18 +14238,7 @@ "name": "Kaka (A.91)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kwakum", @@ -16756,18 +14259,7 @@ "name": "Kaka (A.92)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Pol", @@ -16833,18 +14325,7 @@ "name": "Lundu-Balong (A.11)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Oroko", @@ -16865,18 +14346,7 @@ "name": "Lundu-Balong (A.13)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bafaw-Balong", @@ -16897,18 +14367,7 @@ "name": "Lundu-Balong (A.14)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bonkeng", @@ -16929,18 +14388,7 @@ "name": "Lundu-Balong (A.15)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mbo", @@ -16961,18 +14409,7 @@ "name": "Lundu-Balong (A.151)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Nkongho", @@ -16993,18 +14430,7 @@ "name": "Lundu-Balong (A.15B)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bassossi", @@ -17080,18 +14506,7 @@ "name": "Makaa-Njem (A.801)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Gyele", @@ -17112,18 +14527,7 @@ "name": "Makaa-Njem (A.802)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ukhwejo", @@ -17144,18 +14548,7 @@ "name": "Makaa-Njem (A.81)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kwasio", @@ -17176,18 +14569,7 @@ "name": "Makaa-Njem (A.82)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Swo", @@ -17253,18 +14635,7 @@ "name": "Makaa-Njem (A.831)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Byep", @@ -17285,18 +14656,7 @@ "name": "Makaa-Njem (A.832)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kol", @@ -17317,18 +14677,7 @@ "name": "Makaa-Njem (A.84)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Njyem", @@ -17394,18 +14743,7 @@ "name": "Makaa-Njem (A.85)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bekwel", @@ -17426,18 +14764,7 @@ "name": "Makaa-Njem (A.86)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mpiemo", @@ -17468,18 +14795,7 @@ "name": "Makaa-Njem (A.87)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bomwali", @@ -17500,18 +14816,7 @@ "name": "Sanaga (A.601)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Tuki", @@ -17542,18 +14847,7 @@ "name": "Sanaga (A.62)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Nulibie", @@ -17594,18 +14888,7 @@ "name": "Sanaga (A.621)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Nubaca", @@ -17671,18 +14954,7 @@ "name": "Sanaga (A.623)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mbule", @@ -17703,18 +14975,7 @@ "name": "Sanaga (A.65)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bati", @@ -17740,35 +15001,13 @@ "name": "B", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kele (B.201)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ndasa", @@ -17789,18 +15028,7 @@ "name": "Kele (B.202)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Sighu", @@ -17821,18 +15049,7 @@ "name": "Kele (B.203)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Samay", @@ -17853,18 +15070,7 @@ "name": "Kele (B.204)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ndambomo", @@ -17885,18 +15091,7 @@ "name": "Kele (B.21)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Seki", @@ -17917,18 +15112,7 @@ "name": "Kele (B.211)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Molengue", @@ -17949,18 +15133,7 @@ "name": "Kele (B.22)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "K\u00e9l\u00e9", @@ -17991,18 +15164,7 @@ "name": "Kele (B.23)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mbangwe", @@ -18023,18 +15185,7 @@ "name": "Kele (B.24)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Wumbvu", @@ -18055,18 +15206,7 @@ "name": "Kele (B.25)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kota", @@ -18087,18 +15227,7 @@ "name": "Kele (B.251)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Sake", @@ -18119,18 +15248,7 @@ "name": "Kele (B.252)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mahongwe", @@ -18151,18 +15269,7 @@ "name": "Mbete (B.602)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kaningi", @@ -18183,18 +15290,7 @@ "name": "Mbete (B.61)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mbere", @@ -18215,18 +15311,7 @@ "name": "Mbete (B.62)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ombamba", @@ -18247,18 +15332,7 @@ "name": "Mbete (B.63)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ndumu", @@ -18279,18 +15353,7 @@ "name": "Myene (B.11)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Myene", @@ -18311,18 +15374,7 @@ "name": "Nzebi (B.501)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Wandji", @@ -18343,18 +15395,7 @@ "name": "Nzebi (B.51)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Duma", @@ -18375,18 +15416,7 @@ "name": "Nzebi (B.52)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Njebi", @@ -18407,18 +15437,7 @@ "name": "Nzebi (B.53)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Tsaangi", @@ -18439,18 +15458,7 @@ "name": "Shira-Punu (B.401)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bwisi", @@ -18471,18 +15479,7 @@ "name": "Shira-Punu (B.402)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Barama", @@ -18503,18 +15500,7 @@ "name": "Shira-Punu (B.403)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Vumbu", @@ -18535,18 +15521,7 @@ "name": "Shira-Punu (B.41)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Sira", @@ -18567,18 +15542,7 @@ "name": "Shira-Punu (B.42)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Sangu", @@ -18599,18 +15563,7 @@ "name": "Shira-Punu (B.43)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Punu", @@ -18631,18 +15584,7 @@ "name": "Shira-Punu (B.44)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Lumbu", @@ -18663,18 +15605,7 @@ "name": "Teke (B.701)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Tchitchege", @@ -18695,18 +15626,7 @@ "name": "Teke (B.71)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Teke-Tege", @@ -18727,18 +15647,7 @@ "name": "Teke (B.72)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ngungwel", @@ -18759,18 +15668,7 @@ "name": "Teke (B.73)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Yaka", @@ -18821,18 +15719,7 @@ "name": "Teke (B.74)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Teke-Eboo", @@ -18863,18 +15750,7 @@ "name": "Teke (B.75)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Teke, Ibali", @@ -18895,18 +15771,7 @@ "name": "Teke (B.77)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Teke-Wuumu", @@ -18937,18 +15802,7 @@ "name": "Tiene-Yanzi (B.81)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Tiene", @@ -18969,18 +15823,7 @@ "name": "Tiene-Yanzi (B.82)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Boma", @@ -19001,18 +15844,7 @@ "name": "Tiene-Yanzi (B.83)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mfinu", @@ -19033,18 +15865,7 @@ "name": "Tiene-Yanzi (B.84)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mbuun", @@ -19065,18 +15886,7 @@ "name": "Tiene-Yanzi (B.85)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Songo", @@ -19107,18 +15917,7 @@ "name": "Tiene-Yanzi (B.86)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ding", @@ -19139,18 +15938,7 @@ "name": "Tiene-Yanzi (B.861)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ngwii", @@ -19171,18 +15959,7 @@ "name": "Tiene-Yanzi (B.862)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Lwel", @@ -19203,18 +15980,7 @@ "name": "Tiene-Yanzi (B.864)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ngongo", @@ -19235,18 +16001,7 @@ "name": "Tiene-Yanzi (B.865)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Nzadi", @@ -19267,18 +16022,7 @@ "name": "Tsogo (B.301)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Eviya", @@ -19299,18 +16043,7 @@ "name": "Tsogo (B.302)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Simba", @@ -19331,18 +16064,7 @@ "name": "Tsogo (B.304)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Pinji", @@ -19363,18 +16085,7 @@ "name": "Tsogo (B.305)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bubi", @@ -19395,18 +16106,7 @@ "name": "Tsogo (B.31)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Tsogo", @@ -19427,18 +16127,7 @@ "name": "Tsogo (B.32)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kande", @@ -19536,18 +16225,7 @@ "name": "Bangi-Ntomba (C.302)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bolondo", @@ -19568,18 +16246,7 @@ "name": "Bangi-Ntomba (C.31)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Baloi", @@ -19610,18 +16277,7 @@ "name": "Bangi-Ntomba (C.311)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mabaale", @@ -19642,18 +16298,7 @@ "name": "Bangi-Ntomba (C.312)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ndobo", @@ -19674,18 +16319,7 @@ "name": "Bangi-Ntomba (C.32)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bangi", @@ -19716,18 +16350,7 @@ "name": "Bangi-Ntomba (C.321)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Libinza", @@ -19748,18 +16371,7 @@ "name": "Bangi-Ntomba (C.33)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Sengele", @@ -19780,18 +16392,7 @@ "name": "Bangi-Ntomba (C.34)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Sakata", @@ -19812,18 +16413,7 @@ "name": "Bangi-Ntomba (C.35)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bolia", @@ -19854,18 +16444,7 @@ "name": "Bangi-Ntomba (C.36)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Boloki", @@ -19916,18 +16495,7 @@ "name": "Bangi-Ntomba (C.37)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Budja", @@ -19948,18 +16516,7 @@ "name": "Bangi-Ntomba (C.371)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Tembo", @@ -19980,18 +16537,7 @@ "name": "Bushoong (C.81)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Dengese", @@ -20057,18 +16603,7 @@ "name": "Bushoong (C.83)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bushoong", @@ -20089,18 +16624,7 @@ "name": "Bushoong (C.84)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Lele", @@ -20121,18 +16645,7 @@ "name": "Bushoong (C.85)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Wongo", @@ -20153,18 +16666,7 @@ "name": "Mboshi (C.21)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mboko", @@ -20185,18 +16687,7 @@ "name": "Mboshi (C.22)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Akwa", @@ -20217,18 +16708,7 @@ "name": "Mboshi (C.24)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Koyo", @@ -20249,18 +16729,7 @@ "name": "Mboshi (C.25)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mbosi", @@ -20281,18 +16750,7 @@ "name": "Mboshi (C.26)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Likwala", @@ -20313,18 +16771,7 @@ "name": "Mboshi (C.27)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Likuba", @@ -20390,18 +16837,7 @@ "name": "Mongo-Nkundo (C.62)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Lalia", @@ -20467,18 +16903,7 @@ "name": "Ngombe (C.401)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Pagibete", @@ -20499,18 +16924,7 @@ "name": "Ngombe (C.403)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kango", @@ -20576,18 +16990,7 @@ "name": "Ngombe (C.411)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bomboma", @@ -20608,18 +17011,7 @@ "name": "Ngombe (C.412)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bamwe", @@ -20640,18 +17032,7 @@ "name": "Ngombe (C.413)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Dzando", @@ -20672,18 +17053,7 @@ "name": "Ngombe (C.414)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ligenza", @@ -20704,18 +17074,7 @@ "name": "Ngombe (C.42)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bwela", @@ -20736,18 +17095,7 @@ "name": "Ngombe (C.44)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bwa", @@ -20768,18 +17116,7 @@ "name": "Ngombe (C.441)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Babango", @@ -20800,18 +17137,7 @@ "name": "Ngombe (C.45)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ngelima", @@ -20832,18 +17158,7 @@ "name": "Ngondi (C.101)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Dibole", @@ -20864,18 +17179,7 @@ "name": "Ngondi (C.102)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ngando", @@ -20896,18 +17200,7 @@ "name": "Ngondi (C.104)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Yaka", @@ -20928,18 +17221,7 @@ "name": "Ngondi (C.11)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ngundi", @@ -20960,18 +17242,7 @@ "name": "Ngondi (C.12)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Pande", @@ -20992,18 +17263,7 @@ "name": "Ngondi (C.13)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mbati", @@ -21024,18 +17284,7 @@ "name": "Ngondi (C.14)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bomitaba", @@ -21056,18 +17305,7 @@ "name": "Ngondi (C.143)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bonjo", @@ -21088,18 +17326,7 @@ "name": "Ngondi (C.15)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bongili", @@ -21175,18 +17402,7 @@ "name": "Ngondi (C.161)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bomboli", @@ -21207,18 +17423,7 @@ "name": "Ngondi (C.162)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bozaba", @@ -21239,18 +17444,7 @@ "name": "Soko-Kele (C.51)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mbesa", @@ -21271,18 +17465,7 @@ "name": "Soko-Kele (C.52)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "So", @@ -21303,18 +17486,7 @@ "name": "Soko-Kele (C.53)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Poke", @@ -21335,18 +17507,7 @@ "name": "Soko-Kele (C.54)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Lombo", @@ -21412,18 +17573,7 @@ "name": "Soko-Kele (C.56)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Foma", @@ -21499,18 +17649,7 @@ "name": "Tetela (C.72)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kusu", @@ -21531,18 +17670,7 @@ "name": "Tetela (C.73)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Nkutu", @@ -21584,18 +17712,7 @@ "name": "Tetela (C.75)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kela", @@ -21616,18 +17733,7 @@ "name": "Tetela (C.76)", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ombo", @@ -21663,18 +17769,7 @@ "name": "Ndemli", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ndemli", @@ -21945,18 +18040,7 @@ "name": "Unclassified", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Busuu", @@ -22024,18 +18108,7 @@ "name": "Menchum", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Befang", @@ -22936,18 +19009,7 @@ "name": "East", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Lamnso\u02bc", @@ -23043,18 +19105,7 @@ "name": "West", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Aghem", @@ -23120,18 +19171,7 @@ "name": "Unclassified", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Nde-Gbite", @@ -23167,18 +19207,7 @@ "name": "Western Momo", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ambele", @@ -23224,18 +19253,7 @@ "name": "Yemne-Kimbi", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mundabli", @@ -23301,18 +19319,7 @@ "name": "Unclassified", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "\u00c1nc\u00e1", @@ -23652,18 +19659,7 @@ "name": "Kugbo", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kugbo", @@ -23766,18 +19762,7 @@ "name": "Ebughu", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ebughu", @@ -23798,18 +19783,7 @@ "name": "Efai", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Efai", @@ -23905,18 +19879,7 @@ "name": "Ekit", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ekit", @@ -23947,18 +19910,7 @@ "name": "Enwang-Uda", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Enwan", @@ -23989,18 +19941,7 @@ "name": "Ibino", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ibino", @@ -24021,18 +19962,7 @@ "name": "Ibuoro", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ibuoro", @@ -24083,18 +20013,7 @@ "name": "Iko", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Iko", @@ -24115,18 +20034,7 @@ "name": "Ilue", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ilue", @@ -24147,18 +20055,7 @@ "name": "Okobo", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Okobo", @@ -24179,18 +20076,7 @@ "name": "Oro", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Oro", @@ -24211,18 +20097,7 @@ "name": "Usaghade", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Usaghade", @@ -24348,18 +20223,7 @@ "name": "West", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Baan", @@ -24412,18 +20276,7 @@ "name": "Agoi-Doko-Iyoniyong", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Iyongiyong", @@ -24464,18 +20317,7 @@ "name": "Akpet", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ukpet-Ehom", @@ -24530,18 +20372,7 @@ "name": "Ikom", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Olulumo-Ikom", @@ -24627,35 +20458,13 @@ "name": "Mbembe-Legbo", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Legbo", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Legbo", @@ -24696,18 +20505,7 @@ "name": "Mbembe", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mbembe, Cross River", @@ -24772,18 +20570,7 @@ "name": "Koring", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Oring", @@ -24864,35 +20651,13 @@ "name": "Ubaghara-Kohumono", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kohumono", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Hohumono", @@ -24933,18 +20698,7 @@ "name": "Ubaghara", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ubaghara", @@ -24980,18 +20734,7 @@ "name": "Kiong-Korop", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kiong", @@ -25064,18 +20807,7 @@ "name": "Akokoid", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"yo\")", - "original_lang_name": "yoruba", - "original_lang_code": "yor", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Arigidi", @@ -25096,18 +20828,7 @@ "name": "Ayere-Ahan", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"yo\")", - "original_lang_name": "yoruba", - "original_lang_code": "yor", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "\u00c0h\u00e0n", @@ -25346,18 +21067,7 @@ "name": "Igala", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"yo\")", - "original_lang_name": "yoruba", - "original_lang_code": "yor", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Igala", @@ -25405,18 +21115,7 @@ "name": "Delta", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Degema", @@ -25702,18 +21401,7 @@ "name": "Northwestern", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Aduge", @@ -25729,18 +21417,7 @@ "name": "Osse", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ehueun", @@ -25791,18 +21468,7 @@ "name": "Southern", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Akuku", @@ -26018,18 +21684,7 @@ "name": "Eloyi", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ajiri", @@ -26067,18 +21722,7 @@ "name": "Etulo", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Etulo", @@ -26207,18 +21851,7 @@ "name": "Yatye-Akpa", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Akweya", @@ -26271,18 +21904,7 @@ "name": "Ekpeye", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ekpeye", @@ -26634,18 +22256,7 @@ "name": "Kororofa", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Wannu", @@ -26731,18 +22342,7 @@ "name": "Unclassified", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Shoo-Minda-Nye", @@ -26763,18 +22363,7 @@ "name": "Wurbo", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Karimjo", @@ -26820,18 +22409,7 @@ "name": "Kpan-Icen", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Etkywan", @@ -26974,35 +22552,13 @@ "name": "Eastern", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Amo", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Amo", @@ -27023,18 +22579,7 @@ "name": "Northern Jos", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Panawa", @@ -27050,18 +22595,7 @@ "name": "Jera", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Gamo-Ningi", @@ -27202,18 +22736,7 @@ "name": "Kauru", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bina", @@ -27369,18 +22892,7 @@ "name": "Piti-Atsam", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Atsam", @@ -27433,18 +22945,7 @@ "name": "Basa", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Basa-Gumna", @@ -27495,18 +22996,7 @@ "name": "Baushi-Gurmana", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bauchi", @@ -27632,18 +23122,7 @@ "name": "Kainji Lake", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Tsucuba", @@ -27795,18 +23274,7 @@ "name": "Kamuku", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Acipa, Eastern", @@ -27897,18 +23365,7 @@ "name": "Reshe", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Reshe", @@ -27956,18 +23413,7 @@ "name": "Ebira-Gade", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Gade", @@ -28080,18 +23526,7 @@ "name": "Nupe", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Asu", @@ -28172,18 +23607,7 @@ "name": "Oko", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Oko-Eni-Osayen", @@ -28231,18 +23655,7 @@ "name": "Alumic", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Arum", @@ -28263,18 +23676,7 @@ "name": "Ayu", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ayu", @@ -28377,18 +23779,7 @@ "name": "North-Central", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Cara", @@ -28540,18 +23931,7 @@ "name": "West-Central", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ahwai", @@ -28577,18 +23957,7 @@ "name": "Northern", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ejuele", @@ -28659,18 +24028,7 @@ "name": "Southeastern", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Horom", @@ -28711,18 +24069,7 @@ "name": "Southern", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Migili", @@ -28773,18 +24120,7 @@ "name": "Tarokoid", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Yangkam", @@ -28852,35 +24188,13 @@ "name": "Northwestern", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Hyamic", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kyoli", @@ -28941,18 +24255,7 @@ "name": "Koro", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ashe", @@ -29216,18 +24519,7 @@ "name": "B", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Akye", @@ -29293,18 +24585,7 @@ "name": "Ukaan", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ukaan", @@ -29325,18 +24606,7 @@ "name": "Unclassified", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Fali of Baissa", @@ -29604,18 +24874,7 @@ "name": "Aizi", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Aizi, Tiagbamrin", @@ -29673,18 +24932,7 @@ "name": "Bakwe", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bakw\u00e9", @@ -29787,18 +25035,7 @@ "name": "Western", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "B\u00e9t\u00e9, Guiberoua", @@ -29919,18 +25156,7 @@ "name": "Kwadia", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kodia", @@ -30001,18 +25227,7 @@ "name": "Seme", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Siamou", @@ -30132,18 +25347,7 @@ "name": "Glio-Oubi", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Glio-Oubi", @@ -30332,18 +25536,7 @@ "name": "Klao", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Klao", @@ -30391,18 +25584,7 @@ "name": "Guere-Krahn", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Daho-Doo", @@ -31105,18 +26287,7 @@ "name": "Kebu-Animere", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Animere", @@ -31575,18 +26746,7 @@ "name": "Ega", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ega", @@ -31765,18 +26925,7 @@ "name": "Logba", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Logba", @@ -31797,18 +26946,7 @@ "name": "Potou", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Tchaman", @@ -31873,18 +27011,7 @@ "name": "Akan", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Abron", @@ -32398,18 +27525,7 @@ "name": "South Guang", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Awutu", @@ -32465,18 +27581,7 @@ "name": "Krobu", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Krobu", @@ -32497,18 +27602,7 @@ "name": "Western", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Abure", @@ -32665,18 +27759,7 @@ "name": "Kam", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kam", @@ -32697,18 +27780,7 @@ "name": "Kwa", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kwa", @@ -32729,18 +27801,7 @@ "name": "La\u2019bi", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "La\u2019bi", @@ -32860,18 +27921,7 @@ "name": "Duli", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Duli-Gey", @@ -33033,18 +28083,7 @@ "name": "Gimme", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Gimnime", @@ -33140,18 +28179,7 @@ "name": "Voko", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Longto", @@ -33379,18 +28407,7 @@ "name": "Yandang", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bali", @@ -33456,18 +28473,7 @@ "name": "Nimbari", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Nimbari", @@ -33510,18 +28516,7 @@ "name": "Bua", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bua", @@ -33632,18 +28627,7 @@ "name": "Day", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Day", @@ -33763,18 +28747,7 @@ "name": "Karang", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kare", @@ -33892,18 +28865,7 @@ "name": "Dama-Galke", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Dama", @@ -34027,18 +28989,7 @@ "name": "Southern", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mbum", @@ -34059,18 +29010,7 @@ "name": "Unclassified", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Dek", @@ -34121,18 +29061,7 @@ "name": "Unclassified", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Oblo", @@ -34170,18 +29099,7 @@ "name": "Jen", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kyak", @@ -34292,18 +29210,7 @@ "name": "Longuda", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Longuda", @@ -34341,18 +29248,7 @@ "name": "Awak", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Awak", @@ -34383,18 +29279,7 @@ "name": "Cham-Mona", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Cham", @@ -34425,18 +29310,7 @@ "name": "Dadiya", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Dadiya", @@ -34527,35 +29401,13 @@ "name": "Yungur", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Libo", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kaan", @@ -34576,18 +29428,7 @@ "name": "Mboi", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mboi", @@ -34608,18 +29449,7 @@ "name": "Yungur-Roba", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Lala-Roba", @@ -34692,69 +29522,25 @@ "name": "Banda", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Central", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Central Core", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Banda-Bambari", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Banda-Bambari", @@ -34775,18 +29561,7 @@ "name": "Banda-Banda", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Banda-Banda", @@ -34807,18 +29582,7 @@ "name": "Banda-Mbres", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Banda-Mbr\u00e8s", @@ -34839,18 +29603,7 @@ "name": "Banda-Ndele", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Banda-Nd\u00e9l\u00e9", @@ -34871,18 +29624,7 @@ "name": "Mid-Southern", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Banda, Mid-Southern", @@ -34943,18 +29685,7 @@ "name": "Togbo-Vara", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Banda, Togbo-Vara", @@ -34980,18 +29711,7 @@ "name": "Western", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Banda-Yangere", @@ -35017,18 +29737,7 @@ "name": "South Central", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Langbashe", @@ -35059,18 +29768,7 @@ "name": "Southern", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mbandja", @@ -35091,18 +29789,7 @@ "name": "Southwestern", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ngbundu", @@ -35123,18 +29810,7 @@ "name": "West Central", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Banda, West Central", @@ -35187,18 +29863,7 @@ "name": "Central", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bhogoto", @@ -35249,18 +29914,7 @@ "name": "East", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ali", @@ -35575,18 +30229,7 @@ "name": "Mba", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Dongo", @@ -35671,18 +30314,7 @@ "name": "Mayogo-Bangba", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bangba", @@ -35763,35 +30395,13 @@ "name": "Western", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Baka-Gundi", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Baka", @@ -35842,18 +30452,7 @@ "name": "Bwaka", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Gilima", @@ -35884,18 +30483,7 @@ "name": "Gbanzili", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Buraka", @@ -35926,18 +30514,7 @@ "name": "Monzombo", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kpala", @@ -36010,18 +30587,7 @@ "name": "Feroge-Mangaya", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Feroge", @@ -36052,18 +30618,7 @@ "name": "Indri-Togoyo", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Indri", @@ -36111,18 +30666,7 @@ "name": "Bai-Viri", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bai", @@ -36250,18 +30794,7 @@ "name": "Barambo-Pambia", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Barambu", @@ -36566,18 +31099,7 @@ "name": "Kurumfe", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Koromf\u00e9", @@ -37035,18 +31557,7 @@ "name": "Nootre", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Notre", @@ -37557,18 +32068,7 @@ "name": "Dogoso-Khe", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Dogoso", @@ -37599,18 +32099,7 @@ "name": "Dyan", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Dyan", @@ -38274,18 +32763,7 @@ "name": "Kulango", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kulango, Bondoukou", @@ -38433,18 +32911,7 @@ "name": "Kpalaga", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "S\u00e9noufo, Palaka", @@ -38510,18 +32977,7 @@ "name": "Senari", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "S\u00e9noufo, Cebaara", @@ -38730,18 +33186,7 @@ "name": "Teen", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Loma", @@ -38772,18 +33217,7 @@ "name": "Tiefo", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ti\u00e9fo", @@ -38859,18 +33293,7 @@ "name": "Viemo", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Viemo", @@ -38891,18 +33314,7 @@ "name": "Wara-Natioro", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Natioro", @@ -38997,18 +33409,7 @@ "name": "Eastern", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ko", @@ -39056,52 +33457,19 @@ "name": "Central", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ebang-Logol", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ebang-Laru", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Heiban", @@ -39132,18 +33500,7 @@ "name": "Logol", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Logol", @@ -39164,18 +33521,7 @@ "name": "Utoro", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Otoro", @@ -39201,18 +33547,7 @@ "name": "Rere", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Koalib", @@ -39238,18 +33573,7 @@ "name": "Shirumba", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Shwai", @@ -39335,18 +33659,7 @@ "name": "Katla", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Katla", @@ -39377,18 +33690,7 @@ "name": "Rashad", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Tegali", @@ -39419,52 +33721,19 @@ "name": "Talodi", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Talodi Proper", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Jomang", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Talodi", @@ -39485,18 +33754,7 @@ "name": "Nding", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Nding", @@ -39517,18 +33775,7 @@ "name": "Ngile-Dengebu", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Dagik", @@ -39559,18 +33806,7 @@ "name": "Tocho", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Acheron", @@ -39626,18 +33862,7 @@ "name": "Tegem", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Lafofa", @@ -39855,18 +34080,7 @@ "name": "Kyanga", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Shanga", @@ -40256,18 +34470,7 @@ "name": "Ben-Gban", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Gban", @@ -40446,18 +34649,7 @@ "name": "Jogo-Jeri", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Jeri Kuo", @@ -40473,18 +34665,7 @@ "name": "Jeri-Jalkuna", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Jalkunan", @@ -40505,18 +34686,7 @@ "name": "Jogo", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Ligbi", @@ -40650,18 +34820,7 @@ "name": "Marka-Dafin", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Marka", @@ -40842,18 +35001,7 @@ "name": "Maninka-Mori", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Wojenaka", @@ -41276,18 +35424,7 @@ "name": "Kpelle", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Kpelle, Guinea", @@ -41440,18 +35577,7 @@ "name": "Bandi", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bandi", @@ -41587,18 +35713,7 @@ "name": "Samogo", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bankagooma", @@ -41744,52 +35859,19 @@ "name": "Soninke-Boso", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Boso", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Eastern", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bozo, Tiemac\u00e8w\u00e8", @@ -41830,18 +35912,7 @@ "name": "Jenaama", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Bozo, Jenaama", @@ -41867,18 +35938,7 @@ "name": "Soninke", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Soninke", @@ -41924,18 +35984,7 @@ "name": "Unclassified", "iso_1_code": null, "iso_3_code": null, - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "scripts": [ - "Latn" - ], - "class_name": "SpaCyTokenizer", - "macrolanguage": false - } - }, + "tokenizers": {}, "children": [ { "name": "Mbre",