| { | |
| "name": "Austro-Asiatic", | |
| "depth": 0, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Mon-Khmer", | |
| "depth": 1, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Aslian", | |
| "depth": 2, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Jah Hut", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Jah Hut", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "jah", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1167", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1166", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "North Aslian", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Chewong", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Cheq Wong", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "cwg", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1170", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1169", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Eastern", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Batek", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "btq", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1172", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Jehai", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "jhi", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1173", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Minriq", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "mnq", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1174", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Mintil", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "mzt", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1175", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1171", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Tonga", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Ten\u2019edn", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "tnz", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1177", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1176", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Western", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Kintaq", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "knq", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1179", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Kensiu", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "kns", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1180", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1178", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1168", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Senoic", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Lanoh", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "lnh", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1182", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Sab\u00fcm", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "sbo", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1183", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Semai", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "sea", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1184", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Semnam", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "ssm", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1185", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Temiar", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "tea", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1186", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1181", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "South Aslian", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Mah Meri", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "mhe", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1188", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Semelai", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "sza", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1189", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Semaq Beri", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "szc", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1190", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Temoq", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "tmo", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1191", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1187", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1165", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Eastern Mon-Khmer", | |
| "depth": 2, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Bahnaric", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Central Bahnaric", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Alak", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "alk", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1195", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Bahnar", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "bdq", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1196", | |
| "native_tokenizers": [], | |
| "scripts": [ | |
| "Latn" | |
| ] | |
| }, | |
| { | |
| "name": "Romam", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "rmx", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1197", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Tampuan", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "tpu", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1198", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1194", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "East Bahnaric", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Cua", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "cua", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1200", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1199", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "North Bahnaric", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Katua", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "kta", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1202", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Kachok", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "xkk", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1203", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "East", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Kayong", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "kxy", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1205", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Takua", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "tkz", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1206", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1204", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "West", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Trieng", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "stg", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1208", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Talieng", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "tdf", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1209", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Duan", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Halang Doan", | |
| "depth": 7, | |
| "iso_1_code": null, | |
| "iso_3_code": "hld", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1211", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1210", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Jeh-Halang", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Halang", | |
| "depth": 7, | |
| "iso_1_code": null, | |
| "iso_3_code": "hal", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1213", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Jeh", | |
| "depth": 7, | |
| "iso_1_code": null, | |
| "iso_3_code": "jeh", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1214", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1212", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Rengao", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Rengao", | |
| "depth": 7, | |
| "iso_1_code": null, | |
| "iso_3_code": "ren", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1216", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1215", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Sedang-Todrah", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Sedang", | |
| "depth": 7, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Hre", | |
| "depth": 8, | |
| "iso_1_code": null, | |
| "iso_3_code": "hre", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1219", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Sedang", | |
| "depth": 8, | |
| "iso_1_code": null, | |
| "iso_3_code": "sed", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1220", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1218", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Todrah-Monom", | |
| "depth": 7, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Monom", | |
| "depth": 8, | |
| "iso_1_code": null, | |
| "iso_3_code": "moo", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1222", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Todrah", | |
| "depth": 8, | |
| "iso_1_code": null, | |
| "iso_3_code": "tdr", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1223", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1221", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1217", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1207", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1201", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "South Bahnaric", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Stieng, Budeh", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "stt", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1225", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Sre-Mnong", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Mnong", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Eastern Mnong", | |
| "depth": 7, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Mnong, Eastern", | |
| "depth": 8, | |
| "iso_1_code": null, | |
| "iso_3_code": "mng", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1229", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1228", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Southern-Central Mnong", | |
| "depth": 7, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Mnong, Central", | |
| "depth": 8, | |
| "iso_1_code": null, | |
| "iso_3_code": "cmo", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Khmr": { | |
| "full_object": "KhmerTokenizer()", | |
| "original_lang_name": "khmer", | |
| "original_lang_code": "khm", | |
| "script": "Khmr", | |
| "class_name": "KhmerTokenizer" | |
| }, | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1231", | |
| "native_tokenizers": [], | |
| "scripts": [ | |
| "Latn", | |
| "Khmr" | |
| ] | |
| }, | |
| { | |
| "name": "Mnong, Southern", | |
| "depth": 8, | |
| "iso_1_code": null, | |
| "iso_3_code": "mnn", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1232", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Kraol", | |
| "depth": 8, | |
| "iso_1_code": null, | |
| "iso_3_code": "rka", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1233", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Khmr": { | |
| "full_object": "KhmerTokenizer()", | |
| "original_lang_name": "khmer", | |
| "original_lang_code": "khm", | |
| "script": "Khmr", | |
| "class_name": "KhmerTokenizer" | |
| }, | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1230", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Khmr": { | |
| "full_object": "KhmerTokenizer()", | |
| "original_lang_name": "khmer", | |
| "original_lang_code": "khm", | |
| "script": "Khmr", | |
| "class_name": "KhmerTokenizer" | |
| }, | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1227", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Sre", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Maa", | |
| "depth": 7, | |
| "iso_1_code": null, | |
| "iso_3_code": "cma", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1235", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Koho", | |
| "depth": 7, | |
| "iso_1_code": null, | |
| "iso_3_code": "kpm", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1236", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1234", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Khmr": { | |
| "full_object": "KhmerTokenizer()", | |
| "original_lang_name": "khmer", | |
| "original_lang_code": "khm", | |
| "script": "Khmr", | |
| "class_name": "KhmerTokenizer" | |
| }, | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1226", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Stieng-Chrau", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Chrau", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "crw", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1238", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Mel-Khaonh", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "hkn", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1239", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Stieng, Bulo", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "sti", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1240", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1237", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Khmr": { | |
| "full_object": "KhmerTokenizer()", | |
| "original_lang_name": "khmer", | |
| "original_lang_code": "khm", | |
| "script": "Khmr", | |
| "class_name": "KhmerTokenizer" | |
| }, | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1224", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "West Bahnaric", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Lavi", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "lvi", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1242", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Brao-Kravet", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Brao", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "brb", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1244", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Krung", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "krr", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1245", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Kavet", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "krv", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1246", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Sou", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "sqq", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1247", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1243", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Laven", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Laven", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "lbo", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1249", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1248", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Nyaheun", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Nyaheun", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "nev", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1251", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1250", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Oi-The", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Oy", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "oyb", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1253", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Sapuan", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "spu", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1254", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1252", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1241", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Khmr": { | |
| "full_object": "KhmerTokenizer()", | |
| "original_lang_name": "khmer", | |
| "original_lang_code": "khm", | |
| "script": "Khmr", | |
| "class_name": "KhmerTokenizer" | |
| }, | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1193", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Katuic", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Central Katuic", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Ta\u2019oih", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Ir", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "irr", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1258", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Ong", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "oog", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1259", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Ta\u2019oih, Upper", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "tth", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1260", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Ta\u2019oih, Lower", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "tto", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1261", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1257", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1256", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "East Katuic", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Katu-Pacoh", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Katu, Eastern", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "ktv", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1264", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Katu, Western", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "kuf", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1265", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Pacoh", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "pac", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1266", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Phuong", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "phg", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1267", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Tareng", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "tgr", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1268", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1263", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Ngeq-Nkriang", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Kriang", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "ngt", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1270", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1269", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1262", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "West Katuic", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Bru", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Bru, Eastern", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "bru", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1273", | |
| "native_tokenizers": [], | |
| "scripts": [ | |
| "Latn" | |
| ] | |
| }, | |
| { | |
| "name": "Bru, Western", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "brv", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1274", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Katang, Northern", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "ncq", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1275", | |
| "native_tokenizers": [], | |
| "scripts": [ | |
| "Laoo" | |
| ] | |
| }, | |
| { | |
| "name": "Katang, Southern", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "sct", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1276", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "So", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "sss", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1277", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Khua", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "xhv", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1278", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1272", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Kuay", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Kuay", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "kdt", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1280", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Nyeu", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "nyl", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1281", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1279", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1271", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1255", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Khmer", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Khmer", | |
| "depth": 4, | |
| "iso_1_code": "km", | |
| "iso_3_code": "khm", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Khmr": { | |
| "full_object": "KhmerTokenizer()", | |
| "original_lang_name": "khmer", | |
| "original_lang_code": "khm", | |
| "script": "Khmr", | |
| "class_name": "KhmerTokenizer" | |
| } | |
| }, | |
| "node_i": "1283", | |
| "native_tokenizers": [ | |
| "Khmr" | |
| ], | |
| "scripts": [ | |
| "Khmr" | |
| ] | |
| }, | |
| { | |
| "name": "Khmer, Northern", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "kxm", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1284", | |
| "native_tokenizers": [], | |
| "scripts": [ | |
| "Thai" | |
| ] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Khmr": { | |
| "full_object": "KhmerTokenizer()", | |
| "original_lang_name": "khmer", | |
| "original_lang_code": "khm", | |
| "script": "Khmr", | |
| "class_name": "KhmerTokenizer" | |
| } | |
| }, | |
| "node_i": "1282", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Pearic", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Eastern", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Pear", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "pcb", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1287", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1286", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Western", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Chong", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Chong", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "cog", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1290", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Chung", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "scq", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1291", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1289", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Samre", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Somray", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "smu", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1293", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Samre", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "sxm", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1294", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1292", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Suoy", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Su\u2019ung", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "syo", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1296", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1295", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1288", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1285", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Khmr": { | |
| "full_object": "KhmerTokenizer()", | |
| "original_lang_name": "khmer", | |
| "original_lang_code": "khm", | |
| "script": "Khmr", | |
| "class_name": "KhmerTokenizer" | |
| }, | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1192", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Monic", | |
| "depth": 2, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Mon", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": "mnw", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1298", | |
| "native_tokenizers": [], | |
| "scripts": [ | |
| "Mymr" | |
| ] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1297", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Nicobar", | |
| "depth": 2, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Car", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Nicobarese, Car", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "caq", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1301", | |
| "native_tokenizers": [], | |
| "scripts": [ | |
| "Latn" | |
| ] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1300", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Chowra-Teressa", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Chaura", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "crv", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1303", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Teressa", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "tef", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1304", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1302", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Great Nicobar", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Nicobarese, Southern", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "nik", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1306", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1305", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Nancowry", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Nicobarese, Central", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "ncb", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1308", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1307", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Shom Peng", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Shom Peng", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "sii", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1310", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1309", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1299", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Northern Mon-Khmer", | |
| "depth": 2, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Khasian", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "War-Jaintia", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "aml", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1313", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Khasi", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "kha", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1314", | |
| "native_tokenizers": [], | |
| "scripts": [ | |
| "Latn" | |
| ] | |
| }, | |
| { | |
| "name": "Lyngngam", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "lyg", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1315", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Pnar", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "pbv", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1316", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1312", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Khmuic", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Khao", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Khao", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "xao", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1319", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1318", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Mal-Khmu\u2019", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Khmu\u2019", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Khuen", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "khf", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1322", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Khmu", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "kjg", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1323", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "O\u2019du", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "tyh", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1324", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1321", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Mal-Prai", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Mal", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "mlf", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1326", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Prai", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "prt", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1327", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1325", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1320", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Mlabri", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Mlabri", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "mra", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1329", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1328", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Xinh Mul", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Phong-Kniang", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "pnx", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1331", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Puoc", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "puo", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1332", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1330", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1317", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Mang", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Mang", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "zng", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1334", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1333", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Palaungic", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Eastern Palaungic", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Angkuic", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Hu", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "huo", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1338", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Kon Keu", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "kkn", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1339", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Man Met", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "mml", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1340", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Mok", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "mqt", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1341", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Samtao", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "stu", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1342", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Tai Loi", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "tlq", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1343", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Muak Sa-aak", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "ukk", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1344", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "U", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "uuu", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1345", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Kiorr", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "xko", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1346", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1337", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Bit-Khang", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Bit", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "bgk", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1348", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Bumang", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "bvp", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1349", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Kh\u00e1ng", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "kjm", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1350", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1347", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Lametic", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Con", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "cno", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1352", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Rmeet", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "lbn", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1353", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1351", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Waic", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Bulang", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Blang", | |
| "depth": 7, | |
| "iso_1_code": null, | |
| "iso_3_code": "blr", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1356", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1355", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Lawa", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Lawa, Western", | |
| "depth": 7, | |
| "iso_1_code": null, | |
| "iso_3_code": "lcp", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1358", | |
| "native_tokenizers": [], | |
| "scripts": [ | |
| "Thai" | |
| ] | |
| }, | |
| { | |
| "name": "Lawa, Eastern", | |
| "depth": 7, | |
| "iso_1_code": null, | |
| "iso_3_code": "lwl", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1359", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1357", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Wa", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Wa, Parauk", | |
| "depth": 7, | |
| "iso_1_code": null, | |
| "iso_3_code": "prk", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1361", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Awa", | |
| "depth": 7, | |
| "iso_1_code": null, | |
| "iso_3_code": "vwa", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1362", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Wa, Vo", | |
| "depth": 7, | |
| "iso_1_code": null, | |
| "iso_3_code": "wbm", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1363", | |
| "native_tokenizers": [], | |
| "scripts": [ | |
| "Latn" | |
| ] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1360", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1354", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1336", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Western Palaungic", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Danau", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Danau", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "dnu", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1366", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1365", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Palaung", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Palaung, Ruching", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "pce", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1368", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Palaung, Shwe", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "pll", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1369", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Palaung, Rumai", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "rbb", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1370", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1367", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Riang", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Riang Lang", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "ril", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1372", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Riang Lai", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "yin", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1373", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1371", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1364", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1335", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1311", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Palyu", | |
| "depth": 2, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Bugan", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": "bbh", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1375", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Bolyu", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": "ply", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1376", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1374", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Southern Monic", | |
| "depth": 2, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Nyahkur", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": "cbn", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1378", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1377", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Unclassified", | |
| "depth": 2, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Kemiehua", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": "kfj", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1380", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Kuanhua", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": "xnh", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1381", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1379", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Viet-Muong", | |
| "depth": 2, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Chut", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Arem", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "aem", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1384", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Maleng", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "pkt", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1385", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Chut", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "scb", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1386", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1383", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Cuoi", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Hung", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "hnu", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1388", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Tho", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "tou", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1389", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1387", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Muong", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Bo", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "bgl", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1391", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Muong", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "mtq", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1392", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Ngu\u00f4n", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "nuo", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1393", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1390", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Thavung", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Aheu", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "thm", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1395", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1394", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Vietnamese", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Vietnamese", | |
| "depth": 4, | |
| "iso_1_code": "vi", | |
| "iso_3_code": "vie", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1397", | |
| "native_tokenizers": [ | |
| "Latn" | |
| ], | |
| "scripts": [ | |
| "Latn" | |
| ] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1396", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1382", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": { | |
| "Khmr": { | |
| "full_object": "KhmerTokenizer()", | |
| "original_lang_name": "khmer", | |
| "original_lang_code": "khm", | |
| "script": "Khmr", | |
| "class_name": "KhmerTokenizer" | |
| }, | |
| "Latn": { | |
| "full_object": "SpaCyTokenizer(\"vi\")", | |
| "original_lang_name": "vietnamese", | |
| "original_lang_code": "vie", | |
| "script": "Latn", | |
| "class_name": "SpaCyTokenizer" | |
| } | |
| }, | |
| "node_i": "1164", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Munda", | |
| "depth": 1, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "North Munda", | |
| "depth": 2, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Kherwari", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Agariya", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "agi", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1401", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Bijori", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "bix", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1402", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Kodaku", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "ksz", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1403", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Mundari", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Asuri", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "asr", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1405", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Birhor", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "biy", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1406", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Koda", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "cdz", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1407", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Kol", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "ekl", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1408", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Ho", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "hoc", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1409", | |
| "native_tokenizers": [], | |
| "scripts": [ | |
| "Latn", | |
| "Wara" | |
| ] | |
| }, | |
| { | |
| "name": "Korwa", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "kfp", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1410", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Mundari", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "unr", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1411", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Munda", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "unx", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1412", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1404", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Santali", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Mahali", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "mjx", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1414", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Santhali", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "sat", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1415", | |
| "native_tokenizers": [], | |
| "scripts": [ | |
| "Latn", | |
| "Olck" | |
| ] | |
| }, | |
| { | |
| "name": "Turi", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": "trd", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1416", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1413", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1400", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Korku", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Korku", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "kfq", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1418", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1417", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1399", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "South Munda", | |
| "depth": 2, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Kharia-Juang", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Juang", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "jun", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1421", | |
| "native_tokenizers": [], | |
| "scripts": [ | |
| "Orya" | |
| ] | |
| }, | |
| { | |
| "name": "Kharia", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": "khr", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1422", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1420", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Koraput Munda", | |
| "depth": 3, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Gutob-Remo-Geta\u2019", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Geta\u2019", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Gata\u2019", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "gaq", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1426", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1425", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Gutob-Remo", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Bondo", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "bfw", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1428", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Gadaba, Bodo", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "gbj", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1429", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1427", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1424", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Sora-Juray-Gorum", | |
| "depth": 4, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Gorum", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Parenga", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "pcj", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1432", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1431", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Sora-Juray", | |
| "depth": 5, | |
| "iso_1_code": null, | |
| "iso_3_code": null, | |
| "children": [ | |
| { | |
| "name": "Juray", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "juy", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1434", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| }, | |
| { | |
| "name": "Sora", | |
| "depth": 6, | |
| "iso_1_code": null, | |
| "iso_3_code": "srb", | |
| "children": [], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1435", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1433", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1430", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1423", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1419", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1398", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } | |
| ], | |
| "family": "Austro-Asiatic", | |
| "tokenizers": {}, | |
| "node_i": "1163", | |
| "native_tokenizers": [], | |
| "scripts": [] | |
| } |