gpt2_m000_tiny-stories_1024 / tokenizer.json
jonasknobloch's picture
Upload folder using huggingface_hub
2b55245 verified
{
"version": "1.0",
"truncation": null,
"padding": null,
"added_tokens": [
{
"id": 1024,
"content": "<|endoftext|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": true,
"special": true
}
],
"normalizer": null,
"pre_tokenizer": {
"type": "ByteLevel",
"add_prefix_space": false,
"trim_offsets": true,
"use_regex": true
},
"post_processor": {
"type": "ByteLevel",
"add_prefix_space": true,
"trim_offsets": false,
"use_regex": true
},
"decoder": {
"type": "ByteLevel",
"add_prefix_space": true,
"trim_offsets": true,
"use_regex": true
},
"model": {
"type": "BPE",
"dropout": null,
"unk_token": null,
"continuing_subword_prefix": null,
"end_of_word_suffix": null,
"fuse_unk": false,
"byte_fallback": false,
"ignore_merges": false,
"vocab": {
"!": 0,
"\"": 1,
"#": 2,
"$": 3,
"%": 4,
"&": 5,
"'": 6,
"(": 7,
")": 8,
"*": 9,
"+": 10,
",": 11,
"-": 12,
".": 13,
"/": 14,
"0": 15,
"1": 16,
"2": 17,
"3": 18,
"4": 19,
"5": 20,
"6": 21,
"7": 22,
"8": 23,
"9": 24,
":": 25,
";": 26,
"<": 27,
"=": 28,
">": 29,
"?": 30,
"@": 31,
"A": 32,
"B": 33,
"C": 34,
"D": 35,
"E": 36,
"F": 37,
"G": 38,
"H": 39,
"I": 40,
"J": 41,
"K": 42,
"L": 43,
"M": 44,
"N": 45,
"O": 46,
"P": 47,
"Q": 48,
"R": 49,
"S": 50,
"T": 51,
"U": 52,
"V": 53,
"W": 54,
"X": 55,
"Y": 56,
"Z": 57,
"[": 58,
"\\": 59,
"]": 60,
"_": 61,
"`": 62,
"a": 63,
"b": 64,
"c": 65,
"d": 66,
"e": 67,
"f": 68,
"g": 69,
"h": 70,
"i": 71,
"j": 72,
"k": 73,
"l": 74,
"m": 75,
"n": 76,
"o": 77,
"p": 78,
"q": 79,
"r": 80,
"s": 81,
"t": 82,
"u": 83,
"v": 84,
"w": 85,
"x": 86,
"y": 87,
"z": 88,
"{": 89,
"|": 90,
"}": 91,
"~": 92,
"¡": 93,
"¢": 94,
"£": 95,
"¤": 96,
"¥": 97,
"¦": 98,
"§": 99,
"¨": 100,
"©": 101,
"ª": 102,
"«": 103,
"¬": 104,
"®": 105,
"¯": 106,
"°": 107,
"±": 108,
"³": 109,
"´": 110,
"µ": 111,
"¶": 112,
"·": 113,
"¸": 114,
"¹": 115,
"º": 116,
"»": 117,
"¼": 118,
"½": 119,
"¾": 120,
"¿": 121,
"Â": 122,
"Ã": 123,
"Ä": 124,
"Å": 125,
"É": 126,
"Ê": 127,
"Ñ": 128,
"Ò": 129,
"á": 130,
"â": 131,
"ã": 132,
"ä": 133,
"å": 134,
"æ": 135,
"ç": 136,
"è": 137,
"é": 138,
"î": 139,
"ï": 140,
"ð": 141,
"ĉ": 142,
"Ċ": 143,
"Ġ": 144,
"Ģ": 145,
"ģ": 146,
"Ĥ": 147,
"ĥ": 148,
"Ħ": 149,
"ħ": 150,
"Ĩ": 151,
"ĩ": 152,
"Ī": 153,
"ī": 154,
"Ĭ": 155,
"ĭ": 156,
"Į": 157,
"į": 158,
"İ": 159,
"ı": 160,
"Ĳ": 161,
"ĳ": 162,
"Ĵ": 163,
"ĵ": 164,
"Ķ": 165,
"ķ": 166,
"ĸ": 167,
"ĺ": 168,
"Ļ": 169,
"ļ": 170,
"Ľ": 171,
"ľ": 172,
"Ŀ": 173,
"ŀ": 174,
"Ł": 175,
"ł": 176,
"Ń": 177,
"Ġt": 178,
"he": 179,
"Ġa": 180,
"Ġs": 181,
"nd": 182,
"Ġw": 183,
"Ġthe": 184,
"ed": 185,
"Ġb": 186,
"Ġto": 187,
"Ġand": 188,
"ĠT": 189,
"Ġh": 190,
"Ġf": 191,
"in": 192,
"Ġwa": 193,
"re": 194,
"it": 195,
"ou": 196,
"Ġl": 197,
"Ġd": 198,
"Ġc": 199,
"Ġp": 200,
"ĠThe": 201,
"ay": 202,
"Ġm": 203,
"er": 204,
"Ġwas": 205,
"om": 206,
"Ġhe": 207,
"is": 208,
"ar": 209,
"Ġn": 210,
"im": 211,
"on": 212,
"Ġsa": 213,
"id": 214,
"ll": 215,
"ĠS": 216,
"Ġha": 217,
"Ġg": 218,
"at": 219,
"ing": 220,
"ot": 221,
"en": 222,
"an": 223,
"le": 224,
"or": 225,
"end": 226,
"Ġ\"": 227,
"ir": 228,
"ĠH": 229,
"of": 230,
"am": 231,
"ĠThey": 232,
"et": 233,
"Ġit": 234,
"Ġth": 235,
"ig": 236,
"ĠHe": 237,
"Ġin": 238,
"il": 239,
"Ġpl": 240,
"ow": 241,
"ver": 242,
"ri": 243,
"ut": 244,
"Ġbe": 245,
"Ġu": 246,
"Ġsaid": 247,
"Ġplay": 248,
"ĠO": 249,
"ith": 250,
"ĠTim": 251,
"Ġday": 252,
"Ġwith": 253,
"pp": 254,
"ĠOn": 255,
"Ġy": 256,
"oo": 257,
"ked": 258,
"Ġr": 259,
"ĠI": 260,
"ĠShe": 261,
"Ġher": 262,
"ex": 263,
"ce": 264,
"ld": 265,
"Ġhis": 266,
"Ġst": 267,
"ke": 268,
"ĠL": 269,
"Ġbig": 270,
"nt": 271,
"ck": 272,
"Ġyou": 273,
"very": 274,
"st": 275,
"ve": 276,
"ĠB": 277,
"Ġon": 278,
"un": 279,
"Ġhapp": 280,
"riend": 281,
"Ġfriend": 282,
"all": 283,
"ily": 284,
"ext": 285,
"ĠM": 286,
"Ġthey": 287,
"oft": 288,
"Ġwe": 289,
"Ġhad": 290,
"Ġnot": 291,
"Ġli": 292,
"Ġup": 293,
"her": 294,
"Ġwant": 295,
"Ġof": 296,
"ad": 297,
"itt": 298,
"Ġ<": 299,
"|>": 300,
"endoft": 301,
"Ġ<|": 302,
"endoftext": 303,
"se": 304,
"Ġdo": 305,
"Ġe": 306,
"Ġhappy": 307,
"ent": 308,
"Ġvery": 309,
"es": 310,
"Ġthat": 311,
"Ġsaw": 312,
"ĠLily": 313,
"ĠOne": 314,
"'s": 315,
"ĠA": 316,
"ould": 317,
"Ġmom": 318,
"Ġfor": 319,
"Ġsh": 320,
"ittle": 321,
"Ġlittle": 322,
"ĠTom": 323,
"Ġshe": 324,
"ch": 325,
"ime": 326,
"Ġnam": 327,
".\"": 328,
"Ġtime": 329,
"Ġk": 330,
"ound": 331,
"Ġso": 332,
"Ġthere": 333,
"Ġnamed": 334,
"Ġsm": 335,
"Ġbo": 336,
"Ġwere": 337,
"Ġne": 338,
"Ġwanted": 339,
"Ġbut": 340,
"out": 341,
"Ġfriends": 342,
"ved": 343,
"!\"": 344,
"ht": 345,
"ird": 346,
"el": 347,
"Ġbird": 348,
"al": 349,
"Ġan": 350,
"ake": 351,
"ĠIt": 352,
"Ġtoo": 353,
"ome": 354,
"ug": 355,
"ĠĊ": 356,
"ide": 357,
"Ġwent": 358,
"Ġwh": 359,
"Ġhel": 360,
"ĠOnce": 361,
"Ġis": 362,
"Ġall": 363,
"Ġhelp": 364,
"ue": 365,
"Ġloo": 366,
"Ġlo": 367,
"ter": 368,
"Ġupon": 369,
"ry": 370,
"ore": 371,
"Ġfun": 372,
"ind": 373,
"get": 374,
"Ġtoy": 375,
"ill": 376,
"ame": 377,
"Ġas": 378,
"Ġat": 379,
"ra": 380,
"Ġj": 381,
"Ġdid": 382,
"gether": 383,
"Ġre": 384,
"ur": 385,
"Ġo": 386,
"Ġse": 387,
"Ġtogether": 388,
"ack": 389,
"Ġcat": 390,
"ly": 391,
"Ġtre": 392,
"ood": 393,
"ic": 394,
"ted": 395,
"Ġdog": 396,
"Ġcould": 397,
"Ġcan": 398,
"Ġtheir": 399,
"ard": 400,
"ec": 401,
"ark": 402,
"Ġgir": 403,
"Ġplayed": 404,
"Ġball": 405,
"Ġhim": 406,
"?\"": 407,
"Ġgirl": 408,
"Ġro": 409,
"way": 410,
"hed": 411,
"Ġgo": 412,
"my": 413,
"Ġare": 414,
"Ġout": 415,
"Ġle": 416,
"Ġfr": 417,
"ain": 418,
"ĠBut": 419,
"hen": 420,
"Ġkn": 421,
"um": 422,
"Ġthem": 423,
"'t": 424,
"ax": 425,
"Ġsad": 426,
"ĠW": 427,
"ĠSue": 428,
"Ġboy": 429,
"ul": 430,
"Ġtree": 431,
"other": 432,
"Ġhave": 433,
"Ġman": 434,
"ĠMax": 435,
"Ġcl": 436,
"Ġloved": 437,
"Ġlooked": 438,
"oug": 439,
"Ġfound": 440,
"Ġsp": 441,
"Ġstar": 442,
"one": 443,
"Ġsc": 444,
"hing": 445,
"Ġback": 446,
"own": 447,
"ĠBen": 448,
"Ġlike": 449,
"are": 450,
"ful": 451,
"side": 452,
"Ġme": 453,
"Ġbec": 454,
"ĠSam": 455,
"Ġpark": 456,
"ight": 457,
"ong": 458,
"Ġcar": 459,
"ĠJ": 460,
"op": 461,
"elt": 462,
"Ġliked": 463,
"Ġwould": 464,
"Ġmake": 465,
"round": 466,
"Ġla": 467,
"Ġfa": 468,
"Ġfelt": 469,
"You": 470,
"Ġsee": 471,
"ell": 472,
"omet": 473,
"Ġasked": 474,
"Ġnew": 475,
"ag": 476,
"Ġno": 477,
"ouse": 478,
"ice": 479,
"Ġstarted": 480,
"ared": 481,
"Ġcame": 482,
"Ġal": 483,
"Ġother": 484,
"ought": 485,
"iled": 486,
"ĠF": 487,
"Ġsomet": 488,
"Ġag": 489,
"Ġgood": 490,
"Ġsmall": 491,
"ss": 492,
"Ġbr": 493,
"Ġsmiled": 494,
"Ġsay": 495,
"ried": 496,
"ade": 497,
"ĠSp": 498,
"ings": 499,
"ob": 500,
"Ġwor": 501,
"ĠSpot": 502,
"Ġfind": 503,
"Ġaway": 504,
"ia": 505,
"Ġput": 506,
"ty": 507,
"Ġex": 508,
"Ġwhat": 509,
"Ġsomething": 510,
"Ġfrom": 511,
"Ġmade": 512,
"Ġthought": 513,
"ened": 514,
"Ġhome": 515,
"Ġplaying": 516,
"Ġco": 517,
"ook": 518,
"Ġevery": 519,
"Ġwal": 520,
"Ġmu": 521,
"uc": 522,
"ach": 523,
"arn": 524,
"Ġran": 525,
"ile": 526,
"ie": 527,
"ĠMia": 528,
"ave": 529,
"Ġagain": 530,
"Ġsome": 531,
"Ġlaug": 532,
"dd": 533,
"Ġhouse": 534,
"Ġdown": 535,
"Ġfl": 536,
"king": 537,
"Ġtook": 538,
"Ġscared": 539,
"Ġpr": 540,
"ny": 541,
"ure": 542,
"Ġtoys": 543,
"Ġlearn": 544,
"ĠYou": 545,
"if": 546,
"Ġwill": 547,
"Ġbox": 548,
"ick": 549,
"ret": 550,
"ab": 551,
"ep": 552,
"Ġmy": 553,
"Ġaround": 554,
"Ġthings": 555,
"Ġyour": 556,
"oud": 557,
"Ġbl": 558,
"uck": 559,
"Ġwhen": 560,
"ish": 561,
"Ġlived": 562,
"Ġfe": 563,
"Ġthen": 564,
"Ġsun": 565,
"as": 566,
"Ġsw": 567,
"ĠSo": 568,
",\"": 569,
"ĠMom": 570,
"Ġch": 571,
"us": 572,
"pped": 573,
"Ġab": 574,
"ank": 575,
"Ġget": 576,
"ucy": 577,
"ump": 578,
"Ġlot": 579,
"ist": 580,
"ĠLucy": 581,
"ĠD": 582,
"oth": 583,
"ap": 584,
"Ġtried": 585,
"Ġknow": 586,
"Ġsays": 587,
"Ġgot": 588,
"ited": 589,
"Ġwho": 590,
"Th": 591,
"Ġkne": 592,
"ust": 593,
"Ġmany": 594,
"ĠBob": 595,
"nder": 596,
"Ġint": 597,
"Ġabout": 598,
"Ġpret": 599,
"Ġdec": 600,
"Ġany": 601,
"Ġred": 602,
"ive": 603,
"Ġknew": 604,
"ace": 605,
"Ġmore": 606,
"ous": 607,
"ise": 608,
"Ġv": 609,
"Ġcare": 610,
"ally": 611,
"Ġpic": 612,
"au": 613,
"qu": 614,
"Ġhug": 615,
"Ġlearned": 616,
"Ġpo": 617,
"Ġwater": 618,
"fter": 619,
"Ġbecame": 620,
"Ġbest": 621,
"ause": 622,
"ĠAnd": 623,
"Ġop": 624,
"Ġgre": 625,
"ĠE": 626,
"Ġexc": 627,
"urp": 628,
"ways": 629,
"âĢ": 630,
"Ġoutside": 631,
"Ġlaughed": 632,
"Ġlook": 633,
"Ġalways": 634,
"Ġdecid": 635,
"Ġshow": 636,
"Ġun": 637,
"ant": 638,
"Ġroom": 639,
"fe": 640,
"Ġdecided": 641,
"Ġho": 642,
"Ġbecause": 643,
"Ġinto": 644,
"Ġeat": 645,
"ite": 646,
"Ġjump": 647,
"Ġpe": 648,
"Ġboth": 649,
"ers": 650,
"ĠThen": 651,
"Ġdad": 652,
"udd": 653,
"Ġke": 654,
"Ġone": 655,
"ĠWhen": 656,
"nn": 657,
"Ġthis": 658,
"Ġexcited": 659,
"Ġfast": 660,
"Ġnice": 661,
"Ġfeel": 662,
"Yes": 663,
"Ġrun": 664,
"Ġlong": 665,
"ĠAnn": 666,
"Ġtold": 667,
"Ġsk": 668,
"Ġam": 669,
"urpr": 670,
"our": 671,
"Ġinside": 672,
"ull": 673,
"Ġtr": 674,
"Ġsurpr": 675,
"Ġmo": 676,
"ĠHis": 677,
"ink": 678,
"Ġpretty": 679,
"iny": 680,
"Ġsor": 681,
"Ġtake": 682,
"ĠFr": 683,
"og": 684,
"ĠC": 685,
"Ġsl": 686,
"Ġeach": 687,
"Ġgave": 688,
"hat": 689,
"Ġmuch": 690,
"Ġgra": 691,
"lew": 692,
"Ġrock": 693,
"Ġhow": 694,
"Ġstr": 695,
"ara": 696,
"Ġanim": 697,
"Ġanimal": 698,
"ged": 699,
"Ġneed": 700,
"Ġthan": 701,
"ĠAnna": 702,
"ĠAmy": 703,
"ven": 704,
"etter": 705,
"Ġtow": 706,
"Ġor": 707,
"ĠAs": 708,
"Ġunder": 709,
"ess": 710,
"Ġold": 711,
"Ġsorry": 712,
"ge": 713,
"ised": 714,
"ro": 715,
"urt": 716,
"ĠSara": 717,
"Ġcle": 718,
"Ġfish": 719,
"Ġwalked": 720,
"and": 721,
"Ġclo": 722,
"here": 723,
"Ġbear": 724,
"ase": 725,
"ast": 726,
"Ġhand": 727,
"ĠWe": 728,
"urn": 729,
"Ġkind": 730,
"Ġhappened": 731,
"Ġjust": 732,
"Ġflow": 733,
"ĠHer": 734,
"Ġfood": 735,
"Ġlist": 736,
"Ġdidn": 737,
"Ġte": 738,
"Ġanimals": 739,
"Ġhig": 740,
"Ġwat": 741,
"Ġnear": 742,
"ĠIn": 743,
"Ġide": 744,
"Ġtry": 745,
"ched": 746,
"Ġsky": 747,
"ine": 748,
"Ġsn": 749,
"pl": 750,
"Ġfi": 751,
"ving": 752,
"Ġus": 753,
"ĠFrom": 754,
"Ġidea": 755,
"Ġbetter": 756,
"Ġbug": 757,
"Ġheard": 758,
"gry": 759,
"Ġits": 760,
"Ġtw": 761,
"Ġlet": 762,
"pec": 763,
"ate": 764,
"able": 765,
"ff": 766,
"Ġen": 767,
"Ġcareful": 768,
"Ġshare": 769,
"Ġif": 770,
"Thank": 771,
"Ġfly": 772,
"Ġstor": 773,
"ial": 774,
"Ġflew": 775,
"more": 776,
"Ġanymore": 777,
"Ġspec": 778,
"Ġspecial": 779,
"ion": 780,
"Ġcom": 781,
"Ġlots": 782,
"Ġnever": 783,
"Ġby": 784,
"lf": 785,
"ream": 786,
"Ġdan": 787,
"Ġbu": 788,
"Ġfo": 789,
"Ġwind": 790,
"Ġdon": 791,
"ĠEvery": 792,
"Ġtal": 793,
"Ġclean": 794,
"ort": 795,
"Ġgr": 796,
"Ġlove": 797,
"rm": 798,
"ber": 799,
"Ġend": 800,
"ople": 801,
"Ġeven": 802,
"Ġmag": 803,
"ĠK": 804,
"Ġhard": 805,
"Ġshiny": 806,
"udden": 807,
"Ġfore": 808,
"Ġover": 809,
"Ġcake": 810,
"ak": 811,
"Ġbook": 812,
"Ġcol": 813,
"Ġturn": 814,
"Ġfam": 815,
"Ġbad": 816,
"Ġsafe": 817,
"Ġafter": 818,
"ady": 819,
"uddenly": 820,
"Ġpeople": 821,
"Ġproud": 822,
"Ġsurprised": 823,
"pected": 824,
"Let": 825,
"Ġhigh": 826,
"Ġcu": 827,
"Ġhurt": 828,
"Ġcome": 829,
"imb": 830,
"Ġdoor": 831,
"arden": 832,
"Ġgarden": 833,
"bb": 834,
"Ġground": 835,
"Ġopened": 836,
"Ġpicked": 837,
"Ġloud": 838,
"Ġclimb": 839,
"expected": 840,
"Ġunexpected": 841,
"hy": 842,
"Ġgl": 843,
"Ġche": 844,
"ild": 845,
"Ġim": 846,
"Ġgive": 847,
"Ġway": 848,
"ail": 849,
"'m": 850,
"Ġthanked": 851,
"Ġcolor": 852,
"Ġblue": 853,
"Ġstill": 854,
"Ġever": 855,
"Ġhugged": 856,
"ĠP": 857,
"Ġcall": 858,
"Ġfar": 859,
"ip": 860,
"No": 861,
"Ġoff": 862,
"Ġmagic": 863,
"iz": 864,
"age": 865,
"ough": 866,
"ummy": 867,
"Ġjumped": 868,
"Ġshould": 869,
"Ġfamily": 870,
"ool": 871,
"Ġpar": 872,
"Ġkid": 873,
"Ġsmile": 874,
"hes": 875,
"ĠJo": 876,
"Ġplace": 877,
"uff": 878,
"kay": 879,
"Ġwalk": 880,
"Ġnow": 881,
"ct": 882,
"Ġgreat": 883,
"Ġqu": 884,
"em": 885,
"ĠSuddenly": 886,
"les": 887,
"Ġstrong": 888,
"Ġstay": 889,
"Ġunt": 890,
"Ġsto": 891,
"aut": 892,
"Ġforest": 893,
"ture": 894,
"ane": 895,
"Ġbra": 896,
"itty": 897,
"Ġfrog": 898,
"Ġbro": 899,
"Ġuntil": 900,
"Ġbeaut": 901,
"dy": 902,
"Ġsqu": 903,
"Ġstick": 904,
"Ġnext": 905,
"Ġboat": 906,
"lease": 907,
"ning": 908,
"ĠSally": 909,
"ĠAfter": 910,
"ĠN": 911,
"Ġhappily": 912,
"Ġlisten": 913,
"aking": 914,
"Ġkids": 915,
"Ġtra": 916,
"ĠKitty": 917,
"ies": 918,
"iful": 919,
"Ġbeautiful": 920,
"Ġapp": 921,
"Ġhelped": 922,
"Ġdra": 923,
"Ġshowed": 924,
"Ġclos": 925,
"be": 926,
"Ġimp": 927,
"Ġstory": 928,
"unny": 929,
"Ġwhile": 930,
"Ġtown": 931,
"rel": 932,
"pt": 933,
"Ġrain": 934,
"ress": 935,
"Ġpicture": 936,
"ĠAt": 937,
"oy": 938,
"Ġbeing": 939,
"Ġrem": 940,
"Ġeveryone": 941,
"ary": 942,
"ree": 943,
"Ġmor": 944,
"ĠR": 945,
"Ġhat": 946,
"Ġcalled": 947,
"Ġmet": 948,
"Ġstopped": 949,
"Ġad": 950,
"Ġgame": 951,
"Ġwo": 952,
"Can": 953,
"Ġangry": 954,
"ger": 955,
"uffy": 956,
"Ġsoft": 957,
"ĠFin": 958,
"Ġopen": 959,
"Ġtruck": 960,
"Ġkeep": 961,
"Ġcry": 962,
"Ġyummy": 963,
"ĠTh": 964,
"Ġlost": 965,
"Ġbed": 966,
"ĠLet": 967,
"Ġwarm": 968,
"by": 969,
"vent": 970,
"ĠJack": 971,
"Ġbrave": 972,
"Ġmouse": 973,
"Ġate": 974,
"oon": 975,
"ished": 976,
"Ġde": 977,
"It": 978,
"fore": 979,
"Ġdoll": 980,
"so": 981,
"Ġcouldn": 982,
"Ġwatch": 983,
"Ġleave": 984,
"Ġalso": 985,
"dded": 986,
"Ġfell": 987,
"Ġgreen": 988,
"Ġface": 989,
"Ġtwo": 990,
"ĠFl": 991,
"gan": 992,
"iss": 993,
"Ġflowers": 994,
"bit": 995,
"ĠâĢ": 996,
"ble": 997,
"Ġnoise": 998,
"What": 999,
"abbit": 1000,
"irst": 1001,
"owl": 1002,
"Ġwhere": 1003,
"az": 1004,
"Ġsoon": 1005,
"ock": 1006,
"self": 1007,
"Ġslide": 1008,
"Ġrabbit": 1009,
"Ġhole": 1010,
"ĠG": 1011,
"Ġbefore": 1012,
"irrel": 1013,
"Ġpus": 1014,
"ired": 1015,
"Ġsat": 1016,
"illy": 1017,
"Ġhear": 1018,
"ĠFluffy": 1019,
"Ġuse": 1020,
"Ġpa": 1021,
"Ġkept": 1022,
"ĠâĢľ": 1023
},
"merges": [
"Ġ t",
"h e",
"Ġ a",
"Ġ s",
"n d",
"Ġ w",
"Ġt he",
"e d",
"Ġ b",
"Ġt o",
"Ġa nd",
"Ġ T",
"Ġ h",
"Ġ f",
"i n",
"Ġw a",
"r e",
"i t",
"o u",
"Ġ l",
"Ġ d",
"Ġ c",
"Ġ p",
"ĠT he",
"a y",
"Ġ m",
"e r",
"Ġwa s",
"o m",
"Ġ he",
"i s",
"a r",
"Ġ n",
"i m",
"o n",
"Ġs a",
"i d",
"l l",
"Ġ S",
"Ġh a",
"Ġ g",
"a t",
"in g",
"o t",
"e n",
"a n",
"l e",
"o r",
"e nd",
"Ġ \"",
"i r",
"Ġ H",
"o f",
"a m",
"ĠThe y",
"e t",
"Ġ it",
"Ġt h",
"i g",
"ĠH e",
"Ġ in",
"i l",
"Ġp l",
"o w",
"v er",
"r i",
"u t",
"Ġb e",
"Ġ u",
"Ġsa id",
"Ġpl ay",
"Ġ O",
"it h",
"ĠT im",
"Ġd ay",
"Ġw ith",
"p p",
"ĠO n",
"Ġ y",
"o o",
"k ed",
"Ġ r",
"Ġ I",
"ĠS he",
"Ġhe r",
"e x",
"c e",
"l d",
"Ġh is",
"Ġs t",
"k e",
"Ġ L",
"Ġb ig",
"n t",
"c k",
"Ġy ou",
"ver y",
"s t",
"v e",
"Ġ B",
"Ġ on",
"u n",
"Ġha pp",
"ri end",
"Ġf riend",
"a ll",
"il y",
"ex t",
"Ġ M",
"Ġthe y",
"of t",
"Ġw e",
"Ġha d",
"Ġn ot",
"Ġl i",
"Ġu p",
"he r",
"Ġwa nt",
"Ġ of",
"a d",
"it t",
"Ġ <",
"| >",
"end oft",
"Ġ< |",
"endoft ext",
"s e",
"Ġd o",
"Ġ e",
"Ġhapp y",
"en t",
"Ġ very",
"e s",
"Ġth at",
"Ġsa w",
"ĠL ily",
"ĠOn e",
"' s",
"Ġ A",
"ou ld",
"Ġm om",
"Ġf or",
"Ġs h",
"itt le",
"Ġl ittle",
"ĠT om",
"Ġs he",
"c h",
"im e",
"Ġn am",
". \"",
"Ġt ime",
"Ġ k",
"ou nd",
"Ġs o",
"Ġthe re",
"Ġnam ed",
"Ġs m",
"Ġb o",
"Ġwe re",
"Ġn e",
"Ġwant ed",
"Ġb ut",
"ou t",
"Ġfriend s",
"v ed",
"! \"",
"h t",
"ir d",
"e l",
"Ġb ird",
"a l",
"Ġa n",
"a ke",
"ĠI t",
"Ġto o",
"om e",
"u g",
"Ġ Ċ",
"id e",
"Ġw ent",
"Ġw h",
"Ġhe l",
"ĠOn ce",
"Ġ is",
"Ġa ll",
"Ġhel p",
"u e",
"Ġl oo",
"Ġl o",
"t er",
"Ġup on",
"r y",
"o re",
"Ġf un",
"i nd",
"g et",
"Ġto y",
"i ll",
"am e",
"Ġa s",
"Ġa t",
"r a",
"Ġ j",
"Ġd id",
"get her",
"Ġ re",
"u r",
"Ġ o",
"Ġs e",
"Ġto gether",
"a ck",
"Ġc at",
"l y",
"Ġt re",
"oo d",
"i c",
"t ed",
"Ġdo g",
"Ġc ould",
"Ġc an",
"Ġthe ir",
"ar d",
"e c",
"ar k",
"Ġg ir",
"Ġplay ed",
"Ġb all",
"Ġh im",
"? \"",
"Ġgir l",
"Ġr o",
"w ay",
"he d",
"Ġg o",
"m y",
"Ġa re",
"Ġ out",
"Ġl e",
"Ġf r",
"a in",
"ĠB ut",
"he n",
"Ġk n",
"u m",
"Ġthe m",
"' t",
"a x",
"Ġsa d",
"Ġ W",
"ĠS ue",
"Ġbo y",
"u l",
"Ġtre e",
"ot her",
"Ġha ve",
"Ġm an",
"ĠM ax",
"Ġc l",
"Ġlo ved",
"Ġloo ked",
"ou g",
"Ġf ound",
"Ġs p",
"Ġst ar",
"on e",
"Ġs c",
"h ing",
"Ġb ack",
"ow n",
"ĠB en",
"Ġli ke",
"a re",
"f ul",
"s ide",
"Ġm e",
"Ġbe c",
"ĠS am",
"Ġp ark",
"ig ht",
"on g",
"Ġc ar",
"Ġ J",
"o p",
"el t",
"Ġli ked",
"Ġw ould",
"Ġm ake",
"r ound",
"Ġl a",
"Ġf a",
"Ġf elt",
"Y ou",
"Ġse e",
"e ll",
"om et",
"Ġas ked",
"Ġne w",
"a g",
"Ġn o",
"ou se",
"i ce",
"Ġstar ted",
"ar ed",
"Ġc ame",
"Ġa l",
"Ġ other",
"oug ht",
"il ed",
"Ġ F",
"Ġs omet",
"Ġa g",
"Ġg ood",
"Ġsm all",
"s s",
"Ġb r",
"Ġsm iled",
"Ġs ay",
"ri ed",
"ad e",
"ĠS p",
"ing s",
"o b",
"Ġw or",
"ĠSp ot",
"Ġf ind",
"Ġa way",
"i a",
"Ġp ut",
"t y",
"Ġ ex",
"Ġwh at",
"Ġsomet hing",
"Ġfr om",
"Ġm ade",
"Ġth ought",
"en ed",
"Ġh ome",
"Ġplay ing",
"Ġc o",
"oo k",
"Ġe very",
"Ġwa l",
"Ġm u",
"u c",
"a ch",
"ar n",
"Ġr an",
"i le",
"i e",
"ĠM ia",
"a ve",
"Ġag ain",
"Ġs ome",
"Ġla ug",
"d d",
"Ġh ouse",
"Ġd own",
"Ġf l",
"k ing",
"Ġtoo k",
"Ġsc ared",
"Ġp r",
"n y",
"u re",
"Ġtoy s",
"Ġle arn",
"Ġ You",
"i f",
"Ġw ill",
"Ġbo x",
"i ck",
"re t",
"a b",
"e p",
"Ġm y",
"Ġa round",
"Ġth ings",
"Ġyou r",
"ou d",
"Ġb l",
"u ck",
"Ġw hen",
"is h",
"Ġli ved",
"Ġf e",
"Ġthe n",
"Ġs un",
"a s",
"Ġs w",
"ĠS o",
", \"",
"ĠM om",
"Ġc h",
"u s",
"pp ed",
"Ġa b",
"an k",
"Ġg et",
"uc y",
"um p",
"Ġl ot",
"is t",
"ĠL ucy",
"Ġ D",
"ot h",
"a p",
"Ġt ried",
"Ġkn ow",
"Ġsay s",
"Ġg ot",
"it ed",
"Ġwh o",
"T h",
"Ġkn e",
"u st",
"Ġman y",
"ĠB ob",
"nd er",
"Ġin t",
"Ġab out",
"Ġp ret",
"Ġd ec",
"Ġan y",
"Ġr ed",
"i ve",
"Ġkne w",
"a ce",
"Ġm ore",
"ou s",
"is e",
"Ġ v",
"Ġc are",
"all y",
"Ġp ic",
"a u",
"q u",
"Ġh ug",
"Ġlearn ed",
"Ġp o",
"Ġwa ter",
"f ter",
"Ġbec ame",
"Ġbe st",
"au se",
"ĠA nd",
"Ġo p",
"Ġg re",
"Ġ E",
"Ġex c",
"ur p",
"way s",
"â Ģ",
"Ġout side",
"Ġlaug hed",
"Ġloo k",
"Ġal ways",
"Ġdec id",
"Ġsh ow",
"Ġu n",
"an t",
"Ġro om",
"f e",
"Ġdecid ed",
"Ġh o",
"Ġbec ause",
"Ġint o",
"Ġe at",
"it e",
"Ġj ump",
"Ġp e",
"Ġb oth",
"er s",
"ĠThe n",
"Ġd ad",
"u dd",
"Ġ ke",
"Ġon e",
"ĠW hen",
"n n",
"Ġth is",
"Ġexc ited",
"Ġfa st",
"Ġn ice",
"Ġfe el",
"Y es",
"Ġr un",
"Ġl ong",
"ĠA nn",
"Ġto ld",
"Ġs k",
"Ġa m",
"urp r",
"ou r",
"Ġin side",
"u ll",
"Ġt r",
"Ġs urpr",
"Ġm o",
"ĠH is",
"in k",
"Ġpret ty",
"in y",
"Ġs or",
"Ġt ake",
"ĠF r",
"o g",
"Ġ C",
"Ġs l",
"Ġe ach",
"Ġg ave",
"h at",
"Ġmu ch",
"Ġg ra",
"le w",
"Ġro ck",
"Ġh ow",
"Ġst r",
"ar a",
"Ġan im",
"Ġanim al",
"g ed",
"Ġne ed",
"Ġth an",
"ĠAnn a",
"ĠA my",
"v en",
"et ter",
"Ġto w",
"Ġ or",
"ĠA s",
"Ġu nder",
"es s",
"Ġo ld",
"Ġsor ry",
"g e",
"is ed",
"r o",
"ur t",
"ĠS ara",
"Ġc le",
"Ġf ish",
"Ġwal ked",
"a nd",
"Ġcl o",
"he re",
"Ġbe ar",
"a se",
"a st",
"Ġha nd",
"ĠW e",
"ur n",
"Ġk ind",
"Ġhapp ened",
"Ġj ust",
"Ġfl ow",
"ĠH er",
"Ġf ood",
"Ġl ist",
"Ġdid n",
"Ġt e",
"Ġanimal s",
"Ġh ig",
"Ġwa t",
"Ġne ar",
"ĠI n",
"Ġ ide",
"Ġt ry",
"c hed",
"Ġsk y",
"in e",
"Ġs n",
"p l",
"Ġf i",
"v ing",
"Ġu s",
"ĠFr om",
"Ġide a",
"Ġb etter",
"Ġb ug",
"Ġhe ard",
"g ry",
"Ġit s",
"Ġt w",
"Ġl et",
"p ec",
"at e",
"ab le",
"f f",
"Ġ en",
"Ġcare ful",
"Ġsh are",
"Ġ if",
"Th ank",
"Ġf ly",
"Ġst or",
"i al",
"Ġf lew",
"m ore",
"Ġany more",
"Ġsp ec",
"Ġspec ial",
"i on",
"Ġc om",
"Ġlot s",
"Ġne ver",
"Ġb y",
"l f",
"re am",
"Ġd an",
"Ġb u",
"Ġf o",
"Ġw ind",
"Ġd on",
"ĠE very",
"Ġt al",
"Ġcle an",
"or t",
"Ġg r",
"Ġlo ve",
"r m",
"b er",
"Ġ end",
"op le",
"Ġe ven",
"Ġm ag",
"Ġ K",
"Ġh ard",
"Ġsh iny",
"udd en",
"Ġf ore",
"Ġo ver",
"Ġc ake",
"a k",
"Ġb ook",
"Ġco l",
"Ġt urn",
"Ġf am",
"Ġb ad",
"Ġsa fe",
"Ġa fter",
"ad y",
"udden ly",
"Ġpe ople",
"Ġpr oud",
"Ġsurpr ised",
"pec ted",
"L et",
"Ġhig h",
"Ġc u",
"Ġh urt",
"Ġc ome",
"im b",
"Ġdo or",
"ard en",
"Ġg arden",
"b b",
"Ġg round",
"Ġop ened",
"Ġpic ked",
"Ġl oud",
"Ġcl imb",
"ex pected",
"Ġun expected",
"h y",
"Ġg l",
"Ġc he",
"il d",
"Ġ im",
"Ġg ive",
"Ġwa y",
"a il",
"' m",
"Ġthan ked",
"Ġcol or",
"Ġbl ue",
"Ġst ill",
"Ġe ver",
"Ġhug ged",
"Ġ P",
"Ġc all",
"Ġf ar",
"i p",
"N o",
"Ġof f",
"Ġmag ic",
"i z",
"ag e",
"oug h",
"um my",
"Ġjump ed",
"Ġsh ould",
"Ġfam ily",
"oo l",
"Ġp ar",
"Ġk id",
"Ġsm ile",
"he s",
"ĠJ o",
"Ġpl ace",
"u ff",
"k ay",
"Ġwal k",
"Ġn ow",
"c t",
"Ġgre at",
"Ġ qu",
"e m",
"ĠS uddenly",
"le s",
"Ġstr ong",
"Ġst ay",
"Ġu nt",
"Ġst o",
"a ut",
"Ġfore st",
"t ure",
"an e",
"Ġb ra",
"itt y",
"Ġfr og",
"Ġbr o",
"Ġunt il",
"Ġbe aut",
"d y",
"Ġs qu",
"Ġst ick",
"Ġn ext",
"Ġbo at",
"le ase",
"n ing",
"ĠS ally",
"ĠA fter",
"Ġ N",
"Ġhapp ily",
"Ġlist en",
"a king",
"Ġkid s",
"Ġt ra",
"ĠK itty",
"i es",
"i ful",
"Ġbeaut iful",
"Ġa pp",
"Ġhelp ed",
"Ġd ra",
"Ġshow ed",
"Ġclo s",
"b e",
"Ġim p",
"Ġstor y",
"un ny",
"Ġwh ile",
"Ġtow n",
"re l",
"p t",
"Ġr ain",
"re ss",
"Ġpic ture",
"ĠA t",
"o y",
"Ġbe ing",
"Ġre m",
"Ġevery one",
"ar y",
"re e",
"Ġm or",
"Ġ R",
"Ġha t",
"Ġcall ed",
"Ġm et",
"Ġsto pped",
"Ġa d",
"Ġg ame",
"Ġw o",
"C an",
"Ġan gry",
"g er",
"uff y",
"Ġs oft",
"ĠF in",
"Ġop en",
"Ġtr uck",
"Ġke ep",
"Ġc ry",
"Ġy ummy",
"ĠT h",
"Ġlo st",
"Ġb ed",
"ĠL et",
"Ġwa rm",
"b y",
"v ent",
"ĠJ ack",
"Ġbra ve",
"Ġm ouse",
"Ġat e",
"o on",
"is hed",
"Ġd e",
"I t",
"f ore",
"Ġdo ll",
"s o",
"Ġcould n",
"Ġwat ch",
"Ġle ave",
"Ġal so",
"dd ed",
"Ġf ell",
"Ġgre en",
"Ġfa ce",
"Ġtw o",
"ĠF l",
"g an",
"is s",
"Ġflow ers",
"b it",
"Ġ âĢ",
"b le",
"Ġno ise",
"W hat",
"ab bit",
"ir st",
"ow l",
"Ġw here",
"a z",
"Ġso on",
"o ck",
"se lf",
"Ġsl ide",
"Ġr abbit",
"Ġho le",
"Ġ G",
"Ġbe fore",
"ir rel",
"Ġp us",
"ir ed",
"Ġsa t",
"ill y",
"Ġhe ar",
"ĠFl uffy",
"Ġu se",
"Ġp a",
"Ġke pt",
"ĠâĢ ľ"
]
}
}