swarlekha / nepali_tokenizer.json
indra17's picture
Upload nepali_tokenizer.json
4da5a78 verified
{
"version": "1.0",
"truncation": null,
"padding": null,
"added_tokens": [
{
"id": 0,
"special": true,
"content": "[STOP]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false
},
{
"id": 1,
"special": true,
"content": "[UNK]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false
},
{
"id": 2,
"special": true,
"content": "[SPACE]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false
},
{
"id": 255,
"special": true,
"content": "[START]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false
},
{
"id": 604,
"content": "[UH]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 605,
"content": "[UM]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 606,
"content": "[giggle]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 607,
"content": "[laughter]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 608,
"content": "[guffaw]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 609,
"content": "[inhale]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 610,
"content": "[exhale]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 611,
"content": "[sigh]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 612,
"content": "[cry]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 613,
"content": "[bark]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 614,
"content": "[howl]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 615,
"content": "[meow]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 616,
"content": "[singing]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 617,
"content": "[music]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 618,
"content": "[whistle]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 619,
"content": "[humming]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 620,
"content": "[gasp]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 621,
"content": "[groan]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 622,
"content": "[whisper]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 623,
"content": "[mumble]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 624,
"content": "[sniff]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 625,
"content": "[sneeze]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 626,
"content": "[cough]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 627,
"content": "[snore]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 628,
"content": "[chew]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 629,
"content": "[sip]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 630,
"content": "[clear_throat]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 631,
"content": "[kiss]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 632,
"content": "[shhh]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 633,
"content": "[gibberish]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 634,
"content": "[fr]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 635,
"content": "[es]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 636,
"content": "[de]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 637,
"content": "[it]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 638,
"content": "[ipa]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 639,
"content": "[end_of_label]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 695,
"content": "[ne]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 696,
"content": "[PLACEHOLDER56]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 697,
"content": "[PLACEHOLDER57]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 698,
"content": "[PLACEHOLDER58]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 699,
"content": "[PLACEHOLDER59]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 700,
"content": "[PLACEHOLDER60]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 701,
"content": "[PLACEHOLDER61]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 702,
"content": "[PLACEHOLDER62]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 703,
"content": "[PLACEHOLDER63]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
}
],
"normalizer": null,
"pre_tokenizer": {
"type": "Whitespace"
},
"post_processor": null,
"decoder": null,
"model": {
"type": "BPE",
"dropout": null,
"unk_token": "[UNK]",
"continuing_subword_prefix": null,
"end_of_word_suffix": null,
"fuse_unk": false,
"vocab": {
"[STOP]": 0,
"[UNK]": 1,
"[SPACE]": 2,
"!": 3,
"'": 4,
"(": 5,
")": 6,
",": 7,
"-": 8,
".": 9,
"/": 10,
":": 11,
";": 12,
"?": 13,
"a": 14,
"b": 15,
"c": 16,
"d": 17,
"e": 18,
"f": 19,
"g": 20,
"h": 21,
"i": 22,
"j": 23,
"k": 24,
"l": 25,
"m": 26,
"n": 27,
"o": 28,
"p": 29,
"q": 30,
"r": 31,
"s": 32,
"t": 33,
"u": 34,
"v": 35,
"w": 36,
"x": 37,
"y": 38,
"z": 39,
"th": 40,
"in": 41,
"the": 42,
"an": 43,
"er": 44,
"ou": 45,
"re": 46,
"on": 47,
"at": 48,
"ed": 49,
"en": 50,
"to": 51,
"ing": 52,
"and": 53,
"is": 54,
"as": 55,
"al": 56,
"or": 57,
"of": 58,
"ar": 59,
"it": 60,
"es": 61,
"he": 62,
"st": 63,
"le": 64,
"om": 65,
"se": 66,
"be": 67,
"ad": 68,
"ow": 69,
"ly": 70,
"ch": 71,
"wh": 72,
"that": 73,
"you": 74,
"li": 75,
"ve": 76,
"ac": 77,
"ti": 78,
"ld": 79,
"me": 80,
"was": 81,
"gh": 82,
"id": 83,
"ll": 84,
"wi": 85,
"ent": 86,
"for": 87,
"ay": 88,
"ro": 89,
"ver": 90,
"ic": 91,
"her": 92,
"ke": 93,
"his": 94,
"no": 95,
"ut": 96,
"un": 97,
"ir": 98,
"lo": 99,
"we": 100,
"ri": 101,
"ha": 102,
"with": 103,
"ght": 104,
"out": 105,
"im": 106,
"ion": 107,
"all": 108,
"ab": 109,
"one": 110,
"ne": 111,
"ge": 112,
"ould": 113,
"ter": 114,
"mo": 115,
"had": 116,
"ce": 117,
"she": 118,
"go": 119,
"sh": 120,
"ur": 121,
"am": 122,
"so": 123,
"pe": 124,
"my": 125,
"de": 126,
"are": 127,
"but": 128,
"ome": 129,
"fr": 130,
"ther": 131,
"fe": 132,
"su": 133,
"do": 134,
"con": 135,
"te": 136,
"ain": 137,
"ere": 138,
"po": 139,
"if": 140,
"they": 141,
"us": 142,
"ag": 143,
"tr": 144,
"now": 145,
"oun": 146,
"this": 147,
"have": 148,
"not": 149,
"sa": 150,
"il": 151,
"up": 152,
"thing": 153,
"from": 154,
"ap": 155,
"him": 156,
"ack": 157,
"ation": 158,
"ant": 159,
"our": 160,
"op": 161,
"like": 162,
"ust": 163,
"ess": 164,
"bo": 165,
"ok": 166,
"ul": 167,
"ind": 168,
"ex": 169,
"com": 170,
"some": 171,
"there": 172,
"ers": 173,
"co": 174,
"res": 175,
"man": 176,
"ard": 177,
"pl": 178,
"wor": 179,
"way": 180,
"tion": 181,
"fo": 182,
"ca": 183,
"were": 184,
"by": 185,
"ate": 186,
"pro": 187,
"ted": 188,
"ound": 189,
"own": 190,
"would": 191,
"ts": 192,
"what": 193,
"qu": 194,
"ally": 195,
"ight": 196,
"ck": 197,
"gr": 198,
"when": 199,
"ven": 200,
"can": 201,
"ough": 202,
"ine": 203,
"end": 204,
"per": 205,
"ous": 206,
"od": 207,
"ide": 208,
"know": 209,
"ty": 210,
"very": 211,
"si": 212,
"ak": 213,
"who": 214,
"about": 215,
"ill": 216,
"them": 217,
"est": 218,
"red": 219,
"ye": 220,
"could": 221,
"ong": 222,
"your": 223,
"their": 224,
"em": 225,
"just": 226,
"other": 227,
"into": 228,
"any": 229,
"whi": 230,
"um": 231,
"tw": 232,
"ast": 233,
"der": 234,
"did": 235,
"ie": 236,
"been": 237,
"ace": 238,
"ink": 239,
"ity": 240,
"back": 241,
"ting": 242,
"br": 243,
"more": 244,
"ake": 245,
"pp": 246,
"then": 247,
"sp": 248,
"el": 249,
"use": 250,
"bl": 251,
"said": 252,
"over": 253,
"get": 254,
"[START]": 255,
"\"": 256,
"#": 257,
"$": 258,
"%": 259,
"&": 260,
"*": 261,
"+": 262,
"0": 263,
"1": 264,
"2": 265,
"3": 266,
"4": 267,
"5": 268,
"6": 269,
"7": 270,
"8": 271,
"9": 272,
"<": 273,
"=": 274,
">": 275,
"@": 276,
"A": 277,
"B": 278,
"C": 279,
"D": 280,
"E": 281,
"F": 282,
"G": 283,
"H": 284,
"I": 285,
"J": 286,
"K": 287,
"L": 288,
"M": 289,
"N": 290,
"O": 291,
"P": 292,
"Q": 293,
"R": 294,
"S": 295,
"T": 296,
"U": 297,
"V": 298,
"W": 299,
"X": 300,
"Y": 301,
"Z": 302,
"[": 303,
"\\": 304,
"]": 305,
"^": 306,
"_": 307,
"`": 308,
"{": 309,
"|": 310,
"}": 311,
"~": 312,
"‐": 313,
"‑": 314,
"‒": 315,
"–": 316,
"—": 317,
"―": 318,
"‖": 319,
"‗": 320,
"‘": 321,
"’": 322,
"‚": 323,
"‛": 324,
"“": 325,
"”": 326,
"„": 327,
"‟": 328,
" ": 329,
"¡": 330,
"¢": 331,
"£": 332,
"¤": 333,
"¥": 334,
"¦": 335,
"§": 336,
"¨": 337,
"©": 338,
"ª": 339,
"«": 340,
"¬": 341,
"­": 342,
"®": 343,
"¯": 344,
"°": 345,
"±": 346,
"²": 347,
"³": 348,
"´": 349,
"µ": 350,
"¶": 351,
"·": 352,
"¸": 353,
"¹": 354,
"º": 355,
"»": 356,
"¼": 357,
"½": 358,
"¾": 359,
"¿": 360,
"À": 361,
"Á": 362,
"Â": 363,
"Ã": 364,
"Ä": 365,
"Å": 366,
"Æ": 367,
"Ç": 368,
"È": 369,
"É": 370,
"Ê": 371,
"Ë": 372,
"Ì": 373,
"Í": 374,
"Î": 375,
"Ï": 376,
"Ð": 377,
"Ñ": 378,
"Ò": 379,
"Ó": 380,
"Ô": 381,
"Õ": 382,
"Ö": 383,
"×": 384,
"Ø": 385,
"Ù": 386,
"Ú": 387,
"Û": 388,
"Ü": 389,
"Ý": 390,
"Þ": 391,
"ß": 392,
"à": 393,
"á": 394,
"â": 395,
"ã": 396,
"ä": 397,
"å": 398,
"æ": 399,
"ç": 400,
"è": 401,
"é": 402,
"ê": 403,
"ë": 404,
"ì": 405,
"í": 406,
"î": 407,
"ï": 408,
"ð": 409,
"ñ": 410,
"ò": 411,
"ó": 412,
"ô": 413,
"õ": 414,
"ö": 415,
"÷": 416,
"ø": 417,
"ù": 418,
"ú": 419,
"û": 420,
"ü": 421,
"ý": 422,
"þ": 423,
"ÿ": 424,
"ɐ": 425,
"ɑ": 426,
"ɒ": 427,
"ɓ": 428,
"ɔ": 429,
"ɕ": 430,
"ɖ": 431,
"ɗ": 432,
"ɘ": 433,
"ə": 434,
"ɚ": 435,
"ɛ": 436,
"ɜ": 437,
"ɝ": 438,
"ɞ": 439,
"ɟ": 440,
"ɠ": 441,
"ɡ": 442,
"ɢ": 443,
"ɣ": 444,
"ɤ": 445,
"ɥ": 446,
"ɦ": 447,
"ɧ": 448,
"ɨ": 449,
"ɩ": 450,
"ɪ": 451,
"ɫ": 452,
"ɬ": 453,
"ɭ": 454,
"ɮ": 455,
"ɯ": 456,
"ɰ": 457,
"ɱ": 458,
"ɲ": 459,
"ɳ": 460,
"ɴ": 461,
"ɵ": 462,
"ɶ": 463,
"ɷ": 464,
"ɸ": 465,
"ɹ": 466,
"ɺ": 467,
"ɻ": 468,
"ɼ": 469,
"ɽ": 470,
"ɾ": 471,
"ɿ": 472,
"ʀ": 473,
"ʁ": 474,
"ʂ": 475,
"ʃ": 476,
"ʄ": 477,
"ʅ": 478,
"ʆ": 479,
"ʇ": 480,
"ʈ": 481,
"ʉ": 482,
"ʊ": 483,
"ʋ": 484,
"ʌ": 485,
"ʍ": 486,
"ʎ": 487,
"ʏ": 488,
"ʐ": 489,
"ʑ": 490,
"ʒ": 491,
"ʓ": 492,
"ʔ": 493,
"ʕ": 494,
"ʖ": 495,
"ʗ": 496,
"ʘ": 497,
"ʙ": 498,
"ʚ": 499,
"ʛ": 500,
"ʜ": 501,
"ʝ": 502,
"ʞ": 503,
"ʟ": 504,
"ʠ": 505,
"ʡ": 506,
"ʢ": 507,
"ʣ": 508,
"ʤ": 509,
"ʥ": 510,
"ʦ": 511,
"ʧ": 512,
"ʨ": 513,
"ʩ": 514,
"ʪ": 515,
"ʫ": 516,
"ʬ": 517,
"ʭ": 518,
"ʮ": 519,
"ʯ": 520,
"ʰ": 521,
"ʱ": 522,
"ʲ": 523,
"ʳ": 524,
"ʴ": 525,
"ʵ": 526,
"ʶ": 527,
"ʷ": 528,
"ʸ": 529,
"ʹ": 530,
"ʺ": 531,
"ʻ": 532,
"ʼ": 533,
"ʽ": 534,
"ʾ": 535,
"ʿ": 536,
"ˀ": 537,
"ˁ": 538,
"˂": 539,
"˃": 540,
"˄": 541,
"˅": 542,
"ˆ": 543,
"ˇ": 544,
"ˈ": 545,
"ˉ": 546,
"ˊ": 547,
"ˋ": 548,
"ˌ": 549,
"ˍ": 550,
"ˎ": 551,
"ˏ": 552,
"ː": 553,
"ˑ": 554,
"˒": 555,
"˓": 556,
"˔": 557,
"˕": 558,
"˖": 559,
"˗": 560,
"˘": 561,
"˙": 562,
"˚": 563,
"˛": 564,
"˜": 565,
"˝": 566,
"˞": 567,
"˟": 568,
"ˠ": 569,
"ˡ": 570,
"ˢ": 571,
"ˣ": 572,
"ˤ": 573,
"˥": 574,
"˦": 575,
"˧": 576,
"˨": 577,
"˩": 578,
"˪": 579,
"˫": 580,
"ˬ": 581,
"˭": 582,
"ˮ": 583,
"˯": 584,
"˰": 585,
"˱": 586,
"˲": 587,
"˳": 588,
"˴": 589,
"˵": 590,
"˶": 591,
"˷": 592,
"˸": 593,
"˹": 594,
"˺": 595,
"˻": 596,
"˼": 597,
"˽": 598,
"˾": 599,
"˿": 600,
"ā": 601,
"ō": 602,
"…": 603,
"[UH]": 604,
"[UM]": 605,
"[giggle]": 606,
"[laughter]": 607,
"[guffaw]": 608,
"[inhale]": 609,
"[exhale]": 610,
"[sigh]": 611,
"[cry]": 612,
"[bark]": 613,
"[howl]": 614,
"[meow]": 615,
"[singing]": 616,
"[music]": 617,
"[whistle]": 618,
"[humming]": 619,
"[gasp]": 620,
"[groan]": 621,
"[whisper]": 622,
"[mumble]": 623,
"[sniff]": 624,
"[sneeze]": 625,
"[cough]": 626,
"[snore]": 627,
"[chew]": 628,
"[sip]": 629,
"[clear_throat]": 630,
"[kiss]": 631,
"[shhh]": 632,
"[gibberish]": 633,
"[fr]": 634,
"[es]": 635,
"[de]": 636,
"[it]": 637,
"[ipa]": 638,
"[end_of_label]": 639,
"ŋ": 640,
"ᵻ": 641,
"θ": 642,
"̩": 643,
"̃": 644,
"ɑː": 645,
"iː": 646,
"uː": 647,
"ɜː": 648,
"ɔː": 649,
"oː": 650,
"eɪ": 651,
"oʊ": 652,
"aɪ": 653,
"aʊ": 654,
"ɔɪ": 655,
"dʒ": 656,
"tʃ": 657,
"ɪŋ": 658,
"ᵻd": 659,
"ˈiː": 660,
"ˌiː": 661,
"ˈɪ": 662,
"ˌɪ": 663,
"ˈeɪ": 664,
"ˌeɪ": 665,
"ˈɛ": 666,
"ˌɛ": 667,
"ˈæ": 668,
"ˌæ": 669,
"ˈɑː": 670,
"ˌɑː": 671,
"ˈɔː": 672,
"ˌɔː": 673,
"oːɹ": 674,
"ˈoːɹ": 675,
"ˌoːɹ": 676,
"ˈoʊ": 677,
"ˌoʊ": 678,
"ˈʊ": 679,
"ˌʊ": 680,
"ˈuː": 681,
"ˌuː": 682,
"ˈɜː": 683,
"ˌɜː": 684,
"ˈʌ": 685,
"ˌʌ": 686,
"ˈaɪ": 687,
"ˌaɪ": 688,
"ˈaʊ": 689,
"ˌaʊ": 690,
"ˈɔɪ": 691,
"ˌɔɪ": 692,
"ˈɚ": 693,
"ˌɐ": 694,
"[PLACEHOLDER56]": 696,
"[PLACEHOLDER57]": 697,
"[PLACEHOLDER58]": 698,
"[PLACEHOLDER59]": 699,
"[PLACEHOLDER60]": 700,
"[PLACEHOLDER61]": 701,
"[PLACEHOLDER62]": 702,
"[PLACEHOLDER63]": 703,
"[ne]": 695,
"ँ": 704,
"ं": 705,
"ः": 706,
"अ": 707,
"आ": 708,
"इ": 709,
"ई": 710,
"उ": 711,
"ऊ": 712,
"ऋ": 713,
"ए": 714,
"ऐ": 715,
"ओ": 716,
"औ": 717,
"क": 718,
"ख": 719,
"ग": 720,
"घ": 721,
"ङ": 722,
"च": 723,
"छ": 724,
"ज": 725,
"झ": 726,
"ञ": 727,
"ट": 728,
"ठ": 729,
"ड": 730,
"ढ": 731,
"ण": 732,
"त": 733,
"थ": 734,
"द": 735,
"ध": 736,
"न": 737,
"प": 738,
"फ": 739,
"ब": 740,
"भ": 741,
"म": 742,
"य": 743,
"र": 744,
"ल": 745,
"व": 746,
"श": 747,
"ष": 748,
"स": 749,
"ह": 750,
"़": 751,
"ऽ": 752,
"ा": 753,
"ि": 754,
"ी": 755,
"ु": 756,
"ू": 757,
"ृ": 758,
"ॅ": 759,
"ॆ": 760,
"े": 761,
"ै": 762,
"ॊ": 763,
"ो": 764,
"ौ": 765,
"्": 766,
"ॐ": 767,
"।": 768,
"॥": 769,
"०": 770,
"१": 771,
"२": 772,
"३": 773,
"४": 774,
"५": 775,
"६": 776,
"७": 777,
"८": 778,
"९": 779,
"को": 780,
"मा": 781,
"न्": 782,
"्र": 783,
"र्": 784,
"का": 785,
"ला": 786,
"्य": 787,
"ले": 788,
"ने": 789,
"रा": 790,
"स्": 791,
"रू": 792,
"नि": 793,
"प्र": 794,
"पा": 795,
"वि": 796,
"यो": 797,
"ना": 798,
"हरू": 799,
"क्": 800,
"ति": 801,
"ार": 802,
"वा": 803,
"लाई": 804,
"ता": 805,
"हा": 806,
"त्र": 807,
"गर": 808,
"हु": 809,
"न्छ": 810,
"सा": 811,
"म्": 812,
"ल्": 813,
"गर्": 814,
"एको": 815,
"बा": 816,
"थि": 817,
"नु": 818,
"था": 819,
"दि": 820,
"हो": 821,
"यस": 822,
"त्य": 823,
"दा": 824,
"्या": 825,
"क्ष": 826,
"नी": 827,
"दे": 828,
"या": 829,
"जा": 830,
"कार": 831,
"हि": 832,
"त्": 833,
"ेर": 834,
"लि": 835,
"पनि": 836,
"कु": 837,
"ङ्": 838,
"एक": 839,
"ली": 840,
"सि": 841,
"कि": 842,
"मि": 843,
"पु": 844,
"ेको": 845,
"टा": 846,
"गा": 847,
"उन": 848,
"जि": 849,
"भा": 850,
"ष्": 851,
"द्": 852,
"नेपा": 853,
"रि": 854,
"छन्": 855,
"सम्": 856,
"री": 857,
"रह": 858,
"के": 859,
"बाट": 860,
"सु": 861,
"मु": 862,
"नै": 863,
"लाग": 864,
"स्त": 865,
"न्द": 866,
"भएको": 867,
"धि": 868,
"खि": 869,
"ल्ला": 870,
"वर्": 871,
"ती": 872,
"पू": 873,
"भि": 874,
"्च": 875,
"गरि": 876,
"छि": 877,
"हुन्छ": 878,
"पर्": 879,
"सम": 880,
"लो": 881,
"२०": 882,
"दै": 883,
"जिल्ला": 884,
"राज": 885,
"आफ": 886,
"नेपाल": 887,
"हरूको": 888,
"उँ": 889,
"हाँ": 890,
"नो": 891,
"पछि": 892,
"स्था": 893,
"ङ्ग": 894,
"जन": 895,
"भए": 896,
"धा": 897,
"अन्": 898,
"भन्": 899,
"रो": 900,
"त्यस": 901,
"दु": 902,
"शा": 903,
"योग": 904,
"रूप": 905,
"थिए": 906,
"थियो": 907,
"तर": 908,
"ही": 909,
"ित": 910,
"तथा": 911,
"देखि": 912,
"लागि": 913,
"नको": 914,
"पूर्": 915,
"्व": 916,
"क्र": 917,
"जु": 918,
"सं": 919,
"ष्ट": 920,
"देश": 921,
"खा": 922,
"आफ्": 923,
"की": 924,
"रु": 925,
"एउ": 926,
"गरे": 927,
"से": 928,
"ेत्र": 929,
"बै": 930,
"भने": 931,
"चा": 932,
"नमा": 933,
"क्षेत्र": 934,
"प्": 935,
"डा": 936,
"समा": 937,
"सन्": 938,
"जी": 939,
"दी": 940,
"यु": 941,
"एउटा": 942,
"उप": 943,
"चि": 944,
"विश": 945,
"्रो": 946,
"अनु": 947,
"सी": 948,
"लेख": 949,
"्रे": 950,
"कृ": 951,
"बि": 952,
"भार": 953,
"मी": 954,
"गर्न": 955,
"रूपमा": 956,
"ध्य": 957,
"रहेको": 958,
"टि": 959,
"एका": 960,
"सो": 961,
"र्य": 962,
"नाम": 963,
"सम्म": 964,
"उनी": 965,
"परि": 966,
"उत्": 967,
"व्य": 968,
"गर्ने": 969,
"सबै": 970,
"रे": 971,
"निर्": 972,
"प्रा": 973,
"वर्ष": 974,
"आफ्नो": 975,
"शि": 976,
"क्त": 977,
"मुख": 978,
"गो": 979,
"ञ्च": 980,
"धेर": 981,
"ब्": 982,
"स्ट": 983,
"ग्र": 984,
"मे": 985,
"्यो": 986,
"अव": 987,
"१९": 988,
"धेरै": 989,
"ज्": 990,
"पि": 991,
"भयो": 992,
"द्ध": 993,
"भन्दा": 994,
"डि": 995,
"न्न": 996,
"न्द्र": 997,
"रको": 998,
"नेपाली": 999,
"महा": 1000,
"अर्": 1001,
"बना": 1002,
"मन्": 1003,
"मेर": 1004,
"लको": 1005,
"ैले": 1006,
"हरूमा": 1007,
"ठा": 1008,
"ण्": 1009,
"कुनै": 1010,
"ँग": 1011,
"रण": 1012,
"रमा": 1013,
"निक": 1014,
"ईँ": 1015,
"बन्": 1016,
"वी": 1017,
"िय": 1018,
"प्रति": 1019,
"उनले": 1020,
"टी": 1021,
"सार": 1022,
"सँग": 1023,
"भाग": 1024,
"खे": 1025,
"तपा": 1026,
"राम": 1027,
"तपाईँ": 1028,
"गु": 1029,
"बु": 1030,
"वे": 1031,
"सर": 1032,
"हुन्": 1033,
"अधि": 1034,
"चार": 1035,
"मानि": 1036,
"गर्नु": 1037,
"कर्": 1038,
"सह": 1039,
"स्ता": 1040,
"स्थि": 1041,
"यसको": 1042,
"एर": 1043,
"बे": 1044,
"मो": 1045,
"सको": 1046,
"हरूले": 1047,
"भारत": 1048,
"ज्ञ": 1049,
"काम": 1050,
"छो": 1051,
"िक": 1052,
"कार्य": 1053,
"द्वा": 1054,
"जो": 1055,
"पृ": 1056,
"म्प": 1057,
"दिन": 1058,
"कुरा": 1059,
"ण्ड": 1060,
"छा": 1061,
"भू": 1062,
"लमा": 1063,
"षा": 1064,
"ेका": 1065,
"विद": 1066,
"हरूलाई": 1067,
"उने": 1068,
"पहि": 1069,
"लय": 1070,
"सङ्": 1071,
"ौँ": 1072,
"साथ": 1073,
"राज्य": 1074,
"ग्": 1075,
"जे": 1076,
"मात्र": 1077,
"केही": 1078,
"नेपालको": 1079,
"ष्ट्र": 1080,
"द्वारा": 1081,
"जार": 1082,
"यहाँ": 1083,
"हे": 1084,
"ष्ठ": 1085,
"गत": 1086,
"गरेको": 1087,
"पुर": 1088,
"जन्": 1089,
"जना": 1090,
"हुनु": 1091,
"जुन": 1092,
"कै": 1093,
"वन": 1094,
"विका": 1095,
"प्त": 1096,
"ट्": 1097,
"पर": 1098,
"सक्": 1099,
"मान": 1100,
"काश": 1101,
"कारण": 1102,
"जिल्लाको": 1103,
"टो": 1104,
"डी": 1105,
"ढा": 1106,
"धार": 1107,
"पो": 1108,
"्रा": 1109,
"पाइ": 1110,
"समय": 1111,
"ज्ञा": 1112,
"टे": 1113,
"सर्": 1114,
"प्रयोग": 1115,
"गरी": 1116,
"कारी": 1117,
"विद्या": 1118,
"न्य": 1119,
"भाषा": 1120,
"अनुसार": 1121,
"यन": 1122,
"हुँ": 1123,
"बो": 1124,
"लु": 1125,
"न्त": 1126,
"हुने": 1127,
"छु": 1128,
"महि": 1129,
"विश्व": 1130,
"खो": 1131,
"यी": 1132,
"उनको": 1133,
"जिल्लामा": 1134,
"अन्य": 1135,
"दुई": 1136,
"टक": 1137,
"फल": 1138,
"बर": 1139,
"लन": 1140,
"वार": 1141,
"श्र": 1142,
"िका": 1143,
"पूर्ण": 1144,
"च्च": 1145,
"लगा": 1146,
"माण": 1147,
"राष्ट्र": 1148,
"जाति": 1149,
"त्व": 1150,
"भन्ने": 1151,
"पूर्व": 1152,
"कृति": 1153,
"ख्या": 1154,
"भनि": 1155,
"१०": 1156,
"याँ": 1157,
"गावि": 1158,
"स्तो": 1159,
"भएका": 1160,
"विकास": 1161,
"ते": 1162,
"नदी": 1163,
"र्म": 1164,
"प्रकार": 1165,
"क्षा": 1166,
"धान": 1167,
"अभि": 1168,
"फा": 1169,
"मध्य": 1170,
"राजा": 1171,
"क्ति": 1172,
"त्री": 1173,
"पर्ने": 1174,
"२००": 1175,
"इन्": 1176,
"सकि": 1177,
"कम": 1178,
"दो": 1179,
"फि": 1180,
"बार": 1181,
"भे": 1182,
"मू": 1183,
"यि": 1184,
"ैन": 1185,
"न्त्र": 1186,
"गर्द": 1187,
"भिन्न": 1188,
"दैन": 1189,
"ठाउँ": 1190,
"बन्ध": 1191,
"आदि": 1192,
"क्या": 1193,
"णा": 1194,
"बढ": 1195,
"ल्या": 1196,
"ेत": 1197,
"र्थ": 1198,
"प्रमुख": 1199,
"हुन": 1200,
"गरिन्छ": 1201,
"उहाँ": 1202,
"टर": 1203,
"तर्": 1204,
"नगर": 1205,
"पे": 1206,
"मैले": 1207,
"वै": 1208,
"श्य": 1209,
"श्च": 1210,
"सू": 1211,
"प्रकाश": 1212,
"गर्दा": 1213,
"त्यो": 1214,
"स्थित": 1215,
"पना": 1216,
"शु": 1217,
"मिक": 1218,
"स्तै": 1219,
"क्रम": 1220,
"मन्दि": 1221,
"बेला": 1222,
"विद्यालय": 1223,
"कला": 1224,
"गी": 1225,
"ची": 1226,
"दन": 1227,
"सन": 1228,
"ेष": 1229,
"्ने": 1230,
"पानी": 1231,
"हरूका": 1232,
"नीति": 1233,
"गाउँ": 1234,
"गरिएको": 1235,
"जन्म": 1236,
"चु": 1237,
"पत्र": 1238,
"यत": 1239,
"चित्र": 1240,
"प्राप्त": 1241,
"तु": 1242,
"नले": 1243,
"तीय": 1244,
"गरेका": 1245,
"मेरो": 1246,
"पृष्ठ": 1247,
"खु": 1248,
"गरा": 1249,
"छैन": 1250,
"बी": 1251,
"श्व": 1252,
"सले": 1253,
"राख": 1254,
"स्थ": 1255,
"पुरा": 1256,
"क्रि": 1257,
"क्षेत्रमा": 1258,
"व्यव": 1259,
"ग्रह": 1260,
"अफ": 1261,
"कले": 1262,
"नयाँ": 1263,
"व्या": 1264,
"न्थ": 1265,
"क्षि": 1266,
"उनलाई": 1267,
"रहेका": 1268,
"सुरु": 1269,
"पर्छ": 1270,
"विशेष": 1271,
"पहिलो": 1272,
"भनिन्छ": 1273,
"डे": 1274,
"दक्षि": 1275,
"शी": 1276,
"स्रो": 1277,
"मान्य": 1278,
"विभिन्न": 1279,
"हामी": 1280,
"त्रा": 1281,
"दान": 1282,
"लिया": 1283,
"नेपालमा": 1284,
"मुख्य": 1285,
"सरकार": 1286,
"दक्षिण": 1287,
"झा": 1288,
"ठमा": 1289,
"दर्": 1290,
"पी": 1291
},
"merges": [
"t h",
"i n",
"th e",
"a n",
"e r",
"o u",
"r e",
"o n",
"a t",
"e d",
"e n",
"t o",
"in g",
"an d",
"i s",
"a s",
"a l",
"o r",
"o f",
"a r",
"i t",
"e s",
"h e",
"s t",
"l e",
"o m",
"s e",
"b e",
"a d",
"o w",
"l y",
"c h",
"w h",
"th at",
"y ou",
"l i",
"v e",
"a c",
"t i",
"l d",
"m e",
"w as",
"g h",
"i d",
"l l",
"w i",
"en t",
"f or",
"a y",
"r o",
"v er",
"i c",
"h er",
"k e",
"h is",
"n o",
"u t",
"u n",
"i r",
"l o",
"w e",
"r i",
"h a",
"wi th",
"gh t",
"ou t",
"i m",
"i on",
"al l",
"a b",
"on e",
"n e",
"g e",
"ou ld",
"t er",
"m o",
"h ad",
"c e",
"s he",
"g o",
"s h",
"u r",
"a m",
"s o",
"p e",
"m y",
"d e",
"a re",
"b ut",
"om e",
"f r",
"the r",
"f e",
"s u",
"d o",
"c on",
"t e",
"a in",
"er e",
"p o",
"i f",
"the y",
"u s",
"a g",
"t r",
"n ow",
"ou n",
"th is",
"ha ve",
"no t",
"s a",
"i l",
"u p",
"th ing",
"fr om",
"a p",
"h im",
"ac k",
"at ion",
"an t",
"ou r",
"o p",
"li ke",
"u st",
"es s",
"b o",
"o k",
"u l",
"in d",
"e x",
"c om",
"s ome",
"the re",
"er s",
"c o",
"re s",
"m an",
"ar d",
"p l",
"w or",
"w ay",
"ti on",
"f o",
"c a",
"w ere",
"b y",
"at e",
"p ro",
"t ed",
"oun d",
"ow n",
"w ould",
"t s",
"wh at",
"q u",
"al ly",
"i ght",
"c k",
"g r",
"wh en",
"v en",
"c an",
"ou gh",
"in e",
"en d",
"p er",
"ou s",
"o d",
"id e",
"k now",
"t y",
"ver y",
"s i",
"a k",
"wh o",
"ab out",
"i ll",
"the m",
"es t",
"re d",
"y e",
"c ould",
"on g",
"you r",
"the ir",
"e m",
"j ust",
"o ther",
"in to",
"an y",
"wh i",
"u m",
"t w",
"as t",
"d er",
"d id",
"i e",
"be en",
"ac e",
"in k",
"it y",
"b ack",
"t ing",
"b r",
"mo re",
"a ke",
"p p",
"the n",
"s p",
"e l",
"u se",
"b l",
"sa id",
"o ver",
"ge t",
"ɑ ː",
"i ː",
"u ː",
"ɜ ː",
"ɔ ː",
"o ː",
"e ɪ",
"o ʊ",
"a ɪ",
"a ʊ",
"ɔ ɪ",
"d ʒ",
"t ʃ",
"ɪ ŋ",
"ᵻ d",
"ˈ iː",
"ˌ iː",
"ˈ ɪ",
"ˌ ɪ",
"ˈ eɪ",
"ˌ eɪ",
"ˈ ɛ",
"ˌ ɛ",
"ˈ æ",
"ˌ æ",
"ˈ ɑː",
"ˌ ɑː",
"ˈ ɔː",
"ˌ ɔː",
"oː ɹ",
"ˈ oːɹ",
"ˌ oːɹ",
"ˈ oʊ",
"ˌ oʊ",
"ˈ ʊ",
"ˌ ʊ",
"ˈ uː",
"ˌ uː",
"ˈ ɜː",
"ˌ ɜː",
"ˈ ʌ",
"ˌ ʌ",
"ˈ aɪ",
"ˌ aɪ",
"ˈ aʊ",
"ˌ aʊ",
"ˈ ɔɪ",
"ˌ ɔɪ",
"ˈ ɚ",
"ˌ ɐ",
"क ो",
"म ा",
"न ्",
"् र",
"र ्",
"क ा",
"ल ा",
"् य",
"ल े",
"न े",
"र ा",
"स ्",
"र ू",
"न ि",
"प ्र",
"प ा",
"व ि",
"य ो",
"न ा",
"ह रू",
"क ्",
"त ि",
"ा र",
"व ा",
"ला ई",
"त ा",
"ह ा",
"त ्र",
"ग र",
"ह ु",
"न् छ",
"स ा",
"म ्",
"ल ्",
"ग र्",
"ए को",
"ब ा",
"थ ि",
"न ु",
"थ ा",
"द ि",
"ह ो",
"य स",
"त ्य",
"द ा",
"्य ा",
"क् ष",
"न ी",
"द े",
"य ा",
"ज ा",
"का र",
"ह ि",
"त ्",
"े र",
"ल ि",
"प नि",
"क ु",
"ङ ्",
"ए क",
"ल ी",
"स ि",
"क ि",
"म ि",
"प ु",
"े को",
"ट ा",
"ग ा",
"उ न",
"ज ि",
"भ ा",
"ष ्",
"द ्",
"ने पा",
"र ि",
"छ न्",
"स म्",
"र ी",
"र ह",
"क े",
"बा ट",
"स ु",
"म ु",
"न ै",
"ला ग",
"स् त",
"न् द",
"भ एको",
"ध ि",
"ख ि",
"ल् ला",
"व र्",
"त ी",
"प ू",
"भ ि",
"् च",
"गर ि",
"छ ि",
"हु न्छ",
"प र्",
"स म",
"ल ो",
"२ ०",
"द ै",
"जि ल्ला",
"रा ज",
"आ फ",
"नेपा ल",
"हरू को",
"उ ँ",
"हा ँ",
"न ो",
"प छि",
"स् था",
"ङ् ग",
"ज न",
"भ ए",
"ध ा",
"अ न्",
"भ न्",
"र ो",
"त्य स",
"द ु",
"श ा",
"यो ग",
"रू प",
"थि ए",
"थि यो",
"त र",
"ह ी",
"ि त",
"त था",
"दे खि",
"लाग ि",
"न को",
"पू र्",
"् व",
"क ्र",
"ज ु",
"स ं",
"ष् ट",
"दे श",
"ख ा",
"आफ ्",
"क ी",
"र ु",
"ए उ",
"गर े",
"स े",
"े त्र",
"ब ै",
"भ ने",
"च ा",
"न मा",
"क्ष ेत्र",
"प ्",
"ड ा",
"स मा",
"स न्",
"ज ी",
"द ी",
"य ु",
"एउ टा",
"उ प",
"च ि",
"वि श",
"्र ो",
"अ नु",
"स ी",
"ले ख",
"्र े",
"क ृ",
"ब ि",
"भ ार",
"म ी",
"गर् न",
"रूप मा",
"ध ्य",
"रह ेको",
"ट ि",
"ए का",
"स ो",
"र् य",
"ना म",
"सम् म",
"उ नी",
"प रि",
"उ त्",
"व ्य",
"गर् ने",
"स बै",
"र े",
"नि र्",
"प्र ा",
"वर् ष",
"आफ् नो",
"श ि",
"क् त",
"मु ख",
"ग ो",
"ञ ्च",
"ध ेर",
"ब ्",
"स् ट",
"ग ्र",
"म े",
"्य ो",
"अ व",
"१ ९",
"धेर ै",
"ज ्",
"प ि",
"भ यो",
"द् ध",
"भन् दा",
"ड ि",
"न् न",
"न्द ्र",
"र को",
"नेपा ली",
"म हा",
"अ र्",
"ब ना",
"म न्",
"म ेर",
"ल को",
"ै ले",
"हरू मा",
"ठ ा",
"ण ्",
"कु नै",
"ँ ग",
"र ण",
"र मा",
"नि क",
"ई ँ",
"ब न्",
"व ी",
"ि य",
"प्र ति",
"उन ले",
"ट ी",
"स ार",
"स ँग",
"भा ग",
"ख े",
"त पा",
"रा म",
"तपा ईँ",
"ग ु",
"ब ु",
"व े",
"स र",
"हु न्",
"अ धि",
"च ार",
"मा नि",
"गर् नु",
"क र्",
"स ह",
"स् ता",
"स् थि",
"यस को",
"ए र",
"ब े",
"म ो",
"स को",
"हरू ले",
"भार त",
"ज् ञ",
"का म",
"छ ो",
"ि क",
"का र्य",
"द् वा",
"ज ो",
"प ृ",
"म् प",
"दि न",
"कु रा",
"ण् ड",
"छ ा",
"भ ू",
"ल मा",
"ष ा",
"े का",
"वि द",
"हरू लाई",
"उ ने",
"प हि",
"ल य",
"स ङ्",
"ौ ँ",
"सा थ",
"राज ्य",
"ग ्",
"ज े",
"मा त्र",
"के ही",
"नेपाल को",
"ष्ट ्र",
"द्वा रा",
"ज ार",
"य हाँ",
"ह े",
"ष् ठ",
"ग त",
"गर ेको",
"पु र",
"ज न्",
"ज ना",
"हु नु",
"जु न",
"क ै",
"व न",
"वि का",
"प् त",
"ट ्",
"प र",
"स क्",
"मा न",
"का श",
"कार ण",
"जिल्ला को",
"ट ो",
"ड ी",
"ढ ा",
"ध ार",
"प ो",
"्र ा",
"पा इ",
"सम य",
"ज्ञ ा",
"ट े",
"स र्",
"प्र योग",
"गर ी",
"कार ी",
"विद ्या",
"न् य",
"भा षा",
"अनु सार",
"य न",
"हु ँ",
"ब ो",
"ल ु",
"न् त",
"हु ने",
"छ ु",
"म हि",
"विश ्व",
"ख ो",
"य ी",
"उन को",
"जिल्ला मा",
"अन् य",
"दु ई",
"ट क",
"फ ल",
"ब र",
"ल न",
"व ार",
"श ्र",
"ि का",
"पूर् ण",
"च ्च",
"ल गा",
"मा ण",
"रा ष्ट्र",
"जा ति",
"त् व",
"भन् ने",
"पूर् व",
"कृ ति",
"ख ्या",
"भ नि",
"१ ०",
"या ँ",
"गा वि",
"स्त ो",
"भए का",
"विका स",
"त े",
"न दी",
"र् म",
"प्र कार",
"क्ष ा",
"धा न",
"अ भि",
"फ ा",
"म ध्य",
"रा जा",
"क् ति",
"त्र ी",
"पर् ने",
"२० ०",
"इ न्",
"स कि",
"क म",
"द ो",
"फ ि",
"ब ार",
"भ े",
"म ू",
"य ि",
"ै न",
"न् त्र",
"गर् द",
"भि न्न",
"दै न",
"ठा उँ",
"बन् ध",
"आ दि",
"क ्या",
"ण ा",
"ब ढ",
"ल ्या",
"े त",
"र् थ",
"प्र मुख",
"हु न",
"गरि न्छ",
"उ हाँ",
"ट र",
"त र्",
"न गर",
"प े",
"म ैले",
"व ै",
"श ्य",
"श ्च",
"स ू",
"प्र काश",
"गर् दा",
"त्य ो",
"स्थि त",
"प ना",
"श ु",
"मि क",
"स्त ै",
"क्र म",
"मन् दि",
"बे ला",
"विद्या लय",
"क ला",
"ग ी",
"च ी",
"द न",
"स न",
"े ष",
"् ने",
"पा नी",
"हरू का",
"नी ति",
"गा उँ",
"गरि एको",
"जन् म",
"च ु",
"प त्र",
"य त",
"चि त्र",
"प्रा प्त",
"त ु",
"न ले",
"ती य",
"गरे का",
"मेर ो",
"पृ ष्ठ",
"ख ु",
"ग रा",
"छ ैन",
"ब ी",
"श ्व",
"स ले",
"रा ख",
"स् थ",
"पु रा",
"क्र ि",
"क्षेत्र मा",
"व्य व",
"ग्र ह",
"अ फ",
"क ले",
"न याँ",
"व ्या",
"न् थ",
"क्ष ि",
"उन लाई",
"रह ेका",
"सु रु",
"पर् छ",
"विश ेष",
"पहि लो",
"भनि न्छ",
"ड े",
"द क्षि",
"श ी",
"स ्रो",
"मा न्य",
"वि भिन्न",
"हा मी",
"त्र ा",
"दा न",
"लि या",
"नेपाल मा",
"मुख ्य",
"सर कार",
"दक्षि ण",
"झ ा",
"ठ मा",
"द र्",
"प ी"
]
}
}