gpt2_m040_tiny-stories_1024 / tokenizer.json
jonasknobloch's picture
Upload folder using huggingface_hub
8f64f52 verified
{
"version": "1.0",
"truncation": null,
"padding": null,
"added_tokens": [
{
"id": 1024,
"content": "<|endoftext|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": true,
"special": true
}
],
"normalizer": null,
"pre_tokenizer": {
"type": "ByteLevel",
"add_prefix_space": false,
"trim_offsets": true,
"use_regex": true
},
"post_processor": {
"type": "ByteLevel",
"add_prefix_space": true,
"trim_offsets": false,
"use_regex": true
},
"decoder": {
"type": "ByteLevel",
"add_prefix_space": true,
"trim_offsets": true,
"use_regex": true
},
"model": {
"type": "BPE",
"dropout": null,
"unk_token": null,
"continuing_subword_prefix": null,
"end_of_word_suffix": null,
"fuse_unk": false,
"byte_fallback": false,
"ignore_merges": false,
"vocab": {
"!": 0,
"\"": 1,
"#": 2,
"$": 3,
"%": 4,
"&": 5,
"'": 6,
"(": 7,
")": 8,
"*": 9,
"+": 10,
",": 11,
"-": 12,
".": 13,
"/": 14,
"0": 15,
"1": 16,
"2": 17,
"3": 18,
"4": 19,
"5": 20,
"6": 21,
"7": 22,
"8": 23,
"9": 24,
":": 25,
";": 26,
"<": 27,
"=": 28,
">": 29,
"?": 30,
"@": 31,
"A": 32,
"B": 33,
"C": 34,
"D": 35,
"E": 36,
"F": 37,
"G": 38,
"H": 39,
"I": 40,
"J": 41,
"K": 42,
"L": 43,
"M": 44,
"N": 45,
"O": 46,
"P": 47,
"Q": 48,
"R": 49,
"S": 50,
"T": 51,
"U": 52,
"V": 53,
"W": 54,
"X": 55,
"Y": 56,
"Z": 57,
"[": 58,
"\\": 59,
"]": 60,
"_": 61,
"`": 62,
"a": 63,
"b": 64,
"c": 65,
"d": 66,
"e": 67,
"f": 68,
"g": 69,
"h": 70,
"i": 71,
"j": 72,
"k": 73,
"l": 74,
"m": 75,
"n": 76,
"o": 77,
"p": 78,
"q": 79,
"r": 80,
"s": 81,
"t": 82,
"u": 83,
"v": 84,
"w": 85,
"x": 86,
"y": 87,
"z": 88,
"{": 89,
"|": 90,
"}": 91,
"~": 92,
"¡": 93,
"¢": 94,
"£": 95,
"¤": 96,
"¥": 97,
"¦": 98,
"§": 99,
"¨": 100,
"©": 101,
"ª": 102,
"«": 103,
"¬": 104,
"®": 105,
"¯": 106,
"°": 107,
"±": 108,
"³": 109,
"´": 110,
"µ": 111,
"¶": 112,
"·": 113,
"¸": 114,
"¹": 115,
"º": 116,
"»": 117,
"¼": 118,
"½": 119,
"¾": 120,
"¿": 121,
"Â": 122,
"Ã": 123,
"Ä": 124,
"Å": 125,
"É": 126,
"Ê": 127,
"Ñ": 128,
"Ò": 129,
"á": 130,
"â": 131,
"ã": 132,
"ä": 133,
"å": 134,
"æ": 135,
"ç": 136,
"è": 137,
"é": 138,
"î": 139,
"ï": 140,
"ð": 141,
"ĉ": 142,
"Ċ": 143,
"Ġ": 144,
"Ģ": 145,
"ģ": 146,
"Ĥ": 147,
"ĥ": 148,
"Ħ": 149,
"ħ": 150,
"Ĩ": 151,
"ĩ": 152,
"Ī": 153,
"ī": 154,
"Ĭ": 155,
"ĭ": 156,
"Į": 157,
"į": 158,
"İ": 159,
"ı": 160,
"IJ": 161,
"ij": 162,
"Ĵ": 163,
"ĵ": 164,
"Ķ": 165,
"ķ": 166,
"ĸ": 167,
"ĺ": 168,
"Ļ": 169,
"ļ": 170,
"Ľ": 171,
"ľ": 172,
"Ŀ": 173,
"ŀ": 174,
"Ł": 175,
"ł": 176,
"Ń": 177,
"he": 178,
"Ġt": 179,
"Ġa": 180,
"Ġs": 181,
"nd": 182,
"Ġw": 183,
"Ġthe": 184,
"ed": 185,
"Ġb": 186,
"ĠT": 187,
"Ġto": 188,
"Ġand": 189,
"Ġh": 190,
"Ġf": 191,
"in": 192,
"Ġwa": 193,
"re": 194,
"it": 195,
"ou": 196,
"Ġl": 197,
"Ġd": 198,
"Ġc": 199,
"Ġp": 200,
"ay": 201,
"er": 202,
"Ġm": 203,
"om": 204,
"Ġwas": 205,
"Ġhe": 206,
"im": 207,
"is": 208,
"ĠS": 209,
"ar": 210,
"Ġn": 211,
"on": 212,
"Ġsa": 213,
"id": 214,
"ll": 215,
"Ġha": 216,
"Ġg": 217,
"at": 218,
"ing": 219,
"ot": 220,
"ĠThe": 221,
"en": 222,
"an": 223,
"le": 224,
"end": 225,
"or": 226,
"of": 227,
"Ġ\"": 228,
"am": 229,
"ĠH": 230,
"ir": 231,
"et": 232,
"Ġit": 233,
"Ġth": 234,
"ig": 235,
"il": 236,
"ĠHe": 237,
"Ġin": 238,
"Ġpl": 239,
"ĠO": 240,
"ow": 241,
"ver": 242,
"ri": 243,
"ut": 244,
"Ġbe": 245,
"Ġu": 246,
"Ġplay": 247,
"Ġsaid": 248,
"pp": 249,
"ith": 250,
"Ġwith": 251,
"Ġday": 252,
"ex": 253,
"Ġy": 254,
"oo": 255,
"ce": 256,
"Ġr": 257,
"ĠI": 258,
"ck": 259,
"Ġher": 260,
"ĠL": 261,
"ld": 262,
"Ġhis": 263,
"ne": 264,
"ke": 265,
"ĠB": 266,
"Ġst": 267,
"Ġbig": 268,
"very": 269,
"nt": 270,
"ext": 271,
"st": 272,
"text": 273,
"Ġyou": 274,
"ve": 275,
"ĠThey": 276,
"ĠM": 277,
"Ġhapp": 278,
"ily": 279,
"Ġon": 280,
"un": 281,
"ked": 282,
"all": 283,
"riend": 284,
"Ġfriend": 285,
"Ġli": 286,
"Ġthey": 287,
"Ġwe": 288,
"Ġhad": 289,
"Ġnot": 290,
"her": 291,
"Ġup": 292,
"Ġwant": 293,
"Ġof": 294,
"ad": 295,
"se": 296,
"Ġ<": 297,
"|>": 298,
"Ġ<|": 299,
"Ġe": 300,
"itt": 301,
"Ġdo": 302,
"ĠA": 303,
"ĠTim": 304,
"Ġhappy": 305,
"ent": 306,
"Ġvery": 307,
"Ġthat": 308,
"Ġsaw": 309,
"ould": 310,
"'s": 311,
"Ġmom": 312,
"Ġfor": 313,
"Ġsh": 314,
"ittle": 315,
"ĠShe": 316,
"ime": 317,
"Ġlittle": 318,
"Ġshe": 319,
"Ġk": 320,
"ch": 321,
"Ġtime": 322,
"oftext": 323,
".\"": 324,
"Ġnam": 325,
"es": 326,
"ound": 327,
"Ġso": 328,
"nce": 329,
"Ġnamed": 330,
"Ġthere": 331,
"Ġbo": 332,
"Ġwere": 333,
"Ġne": 334,
"out": 335,
"Ġwanted": 336,
"Ġbut": 337,
"ue": 338,
"Ġfriends": 339,
"!\"": 340,
"ird": 341,
"ht": 342,
"Ġan": 343,
"al": 344,
"ug": 345,
"Ġbird": 346,
"ake": 347,
"ved": 348,
"el": 349,
"ome": 350,
"ĠIt": 351,
"Ġtoo": 352,
"Ġhel": 353,
"ĠĊ": 354,
"Ġhelp": 355,
"ide": 356,
"Ġwent": 357,
"Ġwh": 358,
"Ġis": 359,
"ry": 360,
"Ġsm": 361,
"Ġall": 362,
"Ġloo": 363,
"ter": 364,
"Ġlo": 365,
"endoftext": 366,
"Ġupon": 367,
"ame": 368,
"ore": 369,
"ill": 370,
"ind": 371,
"Ġdid": 372,
"Ġfun": 373,
"ra": 374,
"Ġtoy": 375,
"Ġas": 376,
"get": 377,
"Ġj": 378,
"Ġre": 379,
"Ġat": 380,
"ĠLily": 381,
"ur": 382,
"ĠOne": 383,
"ly": 384,
"gether": 385,
"ack": 386,
"Ġse": 387,
"Ġo": 388,
"Ġtogether": 389,
"ĠTom": 390,
"Ġtre": 391,
"Ġcat": 392,
"ood": 393,
"Ġcould": 394,
"Ġdog": 395,
"ec": 396,
"art": 397,
"Ġcan": 398,
"ax": 399,
"Ġtheir": 400,
"my": 401,
"ard": 402,
"ark": 403,
"Ġgir": 404,
"Ġhim": 405,
"um": 406,
"Ġro": 407,
"Ġplayed": 408,
"Ġball": 409,
"?\"": 410,
"Ġgirl": 411,
"way": 412,
"ĠW": 413,
"hen": 414,
"Ġgo": 415,
"Ġfr": 416,
"Ġare": 417,
"Ġle": 418,
"Ġout": 419,
"ain": 420,
"'t": 421,
"Ġthem": 422,
"Ġsad": 423,
"ul": 424,
"other": 425,
"Ġboy": 426,
"Ġtree": 427,
"Ġhave": 428,
"Ġcl": 429,
"Ġman": 430,
"one": 431,
"oug": 432,
"Ġloved": 433,
"Ġlooked": 434,
"ic": 435,
"Ġfound": 436,
"Ġsp": 437,
"ĠOnce": 438,
"ĠJ": 439,
"Ġback": 440,
"Ġla": 441,
"Ġlike": 442,
"hing": 443,
"own": 444,
"ful": 445,
"Ġsc": 446,
"are": 447,
"side": 448,
"hed": 449,
"Ġme": 450,
"ight": 451,
"ong": 452,
"Ġpark": 453,
"op": 454,
"ell": 455,
"Ġstart": 456,
"ick": 457,
"elt": 458,
"Ġmake": 459,
"Ġwould": 460,
"pot": 461,
"round": 462,
"Ġcar": 463,
"Ġfa": 464,
"Ġsay": 465,
"Ġfelt": 466,
"ĠF": 467,
"Ġno": 468,
"Ġsee": 469,
"ob": 470,
"ag": 471,
"Ġasked": 472,
"ia": 473,
"Ġother": 474,
"omet": 475,
"Ġnew": 476,
"ice": 477,
"ouse": 478,
"Ġstarted": 479,
"Ġcame": 480,
"ss": 481,
"Ġal": 482,
"ared": 483,
"Ġsomet": 484,
"Ġag": 485,
"Ġgood": 486,
"ought": 487,
"Ġbr": 488,
"Ġsmall": 489,
"ade": 490,
"Ġwal": 491,
"Ġlaug": 492,
"ook": 493,
"Ġthing": 494,
"Ġex": 495,
"Ġfind": 496,
"Ġwor": 497,
"Ġco": 498,
"ried": 499,
"Ġput": 500,
"Ġaway": 501,
"Ġevery": 502,
"ĠY": 503,
"Ġwhat": 504,
"Ġthought": 505,
"Ġsomething": 506,
"Ġfrom": 507,
"Ġmade": 508,
"Ġhome": 509,
"ĠBut": 510,
"Ġplaying": 511,
"ile": 512,
"ud": 513,
"us": 514,
"ach": 515,
"ie": 516,
"uc": 517,
"ĠSue": 518,
"arn": 519,
"Ġran": 520,
"ny": 521,
"Ġfl": 522,
"ave": 523,
"Ġsome": 524,
"now": 525,
"Ġsmil": 526,
"Ġagain": 527,
"ust": 528,
"ĠMax": 529,
"ure": 530,
"Ġhouse": 531,
"Ġdown": 532,
"Ġpr": 533,
"king": 534,
"Ġscared": 535,
"Ġtook": 536,
"Ġlearn": 537,
"hat": 538,
"Ġtoys": 539,
"ep": 540,
"if": 541,
"ab": 542,
"Ġwill": 543,
"ret": 544,
"Ġbox": 545,
"ank": 546,
"Ġbl": 547,
"uck": 548,
"Ġmy": 549,
"Ġyour": 550,
"Ġthings": 551,
"Ġaround": 552,
"Ġlot": 553,
"oud": 554,
"Ġfe": 555,
"ish": 556,
"Ġlived": 557,
"Ġsun": 558,
"ump": 559,
"ist": 560,
"Ġthen": 561,
"ĠBen": 562,
"as": 563,
"Ġch": 564,
",\"": 565,
"Ġwhen": 566,
"ĠD": 567,
"Ġbec": 568,
"Ġab": 569,
"ty": 570,
"ĠSam": 571,
"Ġsw": 572,
"Ġdec": 573,
"Ġget": 574,
"new": 575,
"ucy": 576,
"ap": 577,
"ĠLucy": 578,
"Ġdecid": 579,
"pped": 580,
"ĠSo": 581,
"oth": 582,
"Ġliked": 583,
"Ġtried": 584,
"Ġknow": 585,
"uch": 586,
"Ġgot": 587,
"Ġany": 588,
"use": 589,
"ause": 590,
"Ġwho": 591,
"ened": 592,
"nder": 593,
"ally": 594,
"Ġmany": 595,
"Ġint": 596,
"fter": 597,
"Ġabout": 598,
"Ġpret": 599,
"ive": 600,
"ĠE": 601,
"ace": 602,
"Ġshow": 603,
"Ġred": 604,
"ous": 605,
"Ġjump": 606,
"ited": 607,
"qu": 608,
"Ġmore": 609,
"ise": 610,
"Ġv": 611,
"Ġhug": 612,
"Ġcare": 613,
"urp": 614,
"Ġpo": 615,
"Ġun": 616,
"Ġlook": 617,
"Ġlearned": 618,
"Ġwater": 619,
"nn": 620,
"Ġbest": 621,
"Ġsmiled": 622,
"Ġop": 623,
"ant": 624,
"Ġgre": 625,
"Ġexc": 626,
"ect": 627,
"ways": 628,
"âĢ": 629,
"Ġoutside": 630,
"Ġalways": 631,
"fe": 632,
"Ġroom": 633,
"Ġho": 634,
"nna": 635,
"ite": 636,
"Ġpe": 637,
"Ġinto": 638,
"Ġeat": 639,
"ower": 640,
"Ġboth": 641,
"ĠSpot": 642,
"our": 643,
"Ġdad": 644,
"Ġsor": 645,
"ara": 646,
"Ġke": 647,
"Ġone": 648,
"Ġfeel": 649,
"urpr": 650,
"Ġsurpr": 651,
"Ġnice": 652,
"ĠC": 653,
"Ġexcited": 654,
"Ġthis": 655,
"hank": 656,
"Ġfast": 657,
"Ġthan": 658,
"Ġrun": 659,
"Ġlong": 660,
"imal": 661,
"Ġanimal": 662,
"Ġam": 663,
"Ġmo": 664,
"Ġsk": 665,
"Ġtold": 666,
"ink": 667,
"Ġtr": 668,
"Ġinside": 669,
"ull": 670,
"ĠMia": 671,
"ĠMom": 672,
"Ġgra": 673,
"og": 674,
"Ġrock": 675,
"Ġpretty": 676,
"iny": 677,
"Ġpick": 678,
"Ġtake": 679,
"Ġeach": 680,
"Ġgave": 681,
"Ġsl": 682,
"Ġmuch": 683,
"den": 684,
"rom": 685,
"Ġstr": 686,
"Ġhow": 687,
"Ġneed": 688,
"Ġtow": 689,
"ven": 690,
"etter": 691,
"Ġor": 692,
"ĠYou": 693,
"ĠAs": 694,
"Ġunder": 695,
"here": 696,
"Ġold": 697,
"Ġflower": 698,
"ge": 699,
"ro": 700,
"urt": 701,
"pl": 702,
"ged": 703,
"ase": 704,
"lew": 705,
"and": 706,
"Ġcle": 707,
"Ġfish": 708,
"ast": 709,
"ess": 710,
"Ġlist": 711,
"Ġclo": 712,
"Ġtry": 713,
"Ġbear": 714,
"Ġhand": 715,
"Ġkind": 716,
"urn": 717,
"more": 718,
"ĠWe": 719,
"Ġte": 720,
"Ġsurpris": 721,
"Ġsays": 722,
"Ġjust": 723,
"Ġfood": 724,
"Ġnear": 725,
"pect": 726,
"ine": 727,
"dy": 728,
"Ġhig": 729,
"ĠBob": 730,
"Ġwat": 731,
"Ġfi": 732,
"Ġide": 733,
"ĠIn": 734,
"Ġsky": 735,
"his": 736,
"ving": 737,
"Ġtw": 738,
"Ġus": 739,
"ĠK": 740,
"Ġidea": 741,
"Ġbetter": 742,
"Ġbug": 743,
"ate": 744,
"Ġheard": 745,
"Ġen": 746,
"gry": 747,
"Ġits": 748,
"lf": 749,
"able": 750,
"ff": 751,
"Ġlet": 752,
"ber": 753,
"Ġcareful": 754,
"eci": 755,
"Ġshare": 756,
"Ġknew": 757,
"ion": 758,
"Ġif": 759,
"Ġdan": 760,
"Ġcol": 761,
"Ġfly": 762,
"Ġfo": 763,
"Ġstor": 764,
"Ġflew": 765,
"pected": 766,
"expected": 767,
"ream": 768,
"ĠAnd": 769,
"Ġcom": 770,
"ecial": 771,
"Ġspecial": 772,
"Ġcolor": 773,
"Ġgr": 774,
"ac": 775,
"Ġnever": 776,
"Ġlove": 777,
"Ġby": 778,
"ort": 779,
"Ġbecame": 780,
"Ġwind": 781,
"Ġdon": 782,
"rm": 783,
"Ġbu": 784,
"Ġtal": 785,
"Ġclean": 786,
"Ġlaughed": 787,
"Ġend": 788,
"Ġeven": 789,
"ople": 790,
"hy": 791,
"Ġdecided": 792,
"Ġmag": 793,
"Ġbecause": 794,
"Ġhard": 795,
"Ġover": 796,
"Ġshiny": 797,
"Ġclim": 798,
"Ġclimb": 799,
"bb": 800,
"Ġcake": 801,
"ak": 802,
"Ġbook": 803,
"Ġturn": 804,
"ĠP": 805,
"ĠThen": 806,
"Ġfam": 807,
"ady": 808,
"Ġhurt": 809,
"Ġbad": 810,
"Ġsafe": 811,
"Ġafter": 812,
"Ġproud": 813,
"Ġfore": 814,
"Ġche": 815,
"Ġpeople": 816,
"Ġcu": 817,
"Ġgl": 818,
"Ġhigh": 819,
"ĠN": 820,
"Ġloud": 821,
"Ġcome": 822,
"arden": 823,
"Ġdoor": 824,
"Ġgarden": 825,
"Ġgive": 826,
"Ġground": 827,
"Ġim": 828,
"Ġopened": 829,
"Ġpicked": 830,
"ail": 831,
"ĠWhen": 832,
"ild": 833,
"uff": 834,
"iz": 835,
"Yes": 836,
"Ġway": 837,
"Ġblue": 838,
"'m": 839,
"ane": 840,
"Ġstill": 841,
"kay": 842,
"udden": 843,
"Ġever": 844,
"Ġhugged": 845,
"ip": 846,
"Ġcall": 847,
"age": 848,
"Ġstay": 849,
"ock": 850,
"be": 851,
"Ġoff": 852,
"Ġfar": 853,
"Ġmagic": 854,
"ough": 855,
"Ġqu": 856,
"ĠSara": 857,
"ĠHis": 858,
"opped": 859,
"Ġshould": 860,
"Ġplace": 861,
"Ġpic": 862,
"Ġad": 863,
"ool": 864,
"Ġfamily": 865,
"Ġkid": 866,
"Ġwalk": 867,
"Ġyum": 868,
"lease": 869,
"Ġnow": 870,
"em": 871,
"Ġgreat": 872,
"ture": 873,
"Ġstrong": 874,
"aut": 875,
"Ġforest": 876,
"ĠAnna": 877,
"Ġunt": 878,
"ĠAmy": 879,
"No": 880,
"Ġbra": 881,
"Ġfrog": 882,
"Ġapp": 883,
"Ġpicture": 884,
"Ġbro": 885,
"oy": 886,
"ary": 887,
"Ġuntil": 888,
"Ġstick": 889,
"Ġsqu": 890,
"Ġbeaut": 891,
"ning": 892,
"ct": 893,
"Ġwo": 894,
"Ġnext": 895,
"Ġboat": 896,
"Ġsorry": 897,
"Ġlisten": 898,
"Ġtra": 899,
"pt": 900,
"ĠR": 901,
"Ġkids": 902,
"iful": 903,
"Ġbeautiful": 904,
"aking": 905,
"ded": 906,
"Ġdra": 907,
"Ġhat": 908,
"Ġrain": 909,
"Ġclos": 910,
"Ġstory": 911,
"rel": 912,
"Ġwhile": 913,
"Ġwalked": 914,
"ers": 915,
"Ġtown": 916,
"ress": 917,
"Ġimp": 918,
"Ġsof": 919,
"self": 920,
"illy": 921,
"ĠAt": 922,
"uddenly": 923,
"by": 924,
"Ġcry": 925,
"Ġbeing": 926,
"dded": 927,
"ree": 928,
"Ġmor": 929,
"Ġcalled": 930,
"unny": 931,
"Ġmet": 932,
"Ġhappened": 933,
"Ġgame": 934,
"Ġpart": 935,
"ĠHer": 936,
"Ġdidn": 937,
"vent": 938,
"Ġrem": 939,
"Ġopen": 940,
"Ġanimals": 941,
"Ġtruck": 942,
"hes": 943,
"ger": 944,
"Ġdoll": 945,
"ĠEvery": 946,
"Ġangry": 947,
"Ġsoft": 948,
"ma": 949,
"Ġkeep": 950,
"oon": 951,
"az": 952,
"Ġlost": 953,
"Ġbed": 954,
"ĠFrom": 955,
"ble": 956,
"Ġwarm": 957,
"Ġexpl": 958,
"iss": 959,
"ĠG": 960,
"Ġbrave": 961,
"Ġmouse": 962,
"ched": 963,
"Ġate": 964,
"Ġde": 965,
"uffy": 966,
"Ġhole": 967,
"It": 968,
"fore": 969,
"so": 970,
"Ġwatch": 971,
"Ġleave": 972,
"Ġsn": 973,
"Ġalso": 974,
"ies": 975,
"Ġfell": 976,
"Ġgreen": 977,
"Thank": 978,
"Ġface": 979,
"gan": 980,
"Ġtwo": 981,
"bit": 982,
"abbit": 983,
"ĠâĢ": 984,
"owl": 985,
"Ġnoise": 986,
"Ġanymore": 987,
"ush": 988,
"ĠFl": 989,
"ello": 990,
"ars": 991,
"Ġwhere": 992,
"Ġswing": 993,
"irst": 994,
"Ġcook": 995,
"Ġlots": 996,
"Ġsoon": 997,
"Ġrabbit": 998,
"Ġslide": 999,
"irrel": 1000,
"air": 1001,
"Ġbefore": 1002,
"Ġsquirrel": 1003,
"Ġjo": 1004,
"Ġthink": 1005,
"Ġsat": 1006,
"ft": 1007,
"Ġfin": 1008,
"ĠFluffy": 1009,
"day": 1010,
"Ġuse": 1011,
"Ġkept": 1012,
"ĠKitt": 1013,
"Hi": 1014,
"ĠâĢľ": 1015,
"âĢĿ": 1016,
"ired": 1017,
"Ġyell": 1018,
"aug": 1019,
"aught": 1020,
"Ġstore": 1021,
"Ġpain": 1022,
"Ġhands": 1023
},
"merges": [
"h e",
"Ġ t",
"Ġ a",
"Ġ s",
"n d",
"Ġ w",
"Ġt he",
"e d",
"Ġ b",
"Ġ T",
"Ġt o",
"Ġa nd",
"Ġ h",
"Ġ f",
"i n",
"Ġw a",
"r e",
"i t",
"o u",
"Ġ l",
"Ġ d",
"Ġ c",
"Ġ p",
"a y",
"e r",
"Ġ m",
"o m",
"Ġwa s",
"Ġ he",
"i m",
"i s",
"Ġ S",
"a r",
"Ġ n",
"o n",
"Ġs a",
"i d",
"l l",
"Ġh a",
"Ġ g",
"a t",
"in g",
"o t",
"ĠT he",
"e n",
"a n",
"l e",
"e nd",
"o r",
"o f",
"Ġ \"",
"a m",
"Ġ H",
"i r",
"e t",
"Ġ it",
"Ġt h",
"i g",
"i l",
"ĠH e",
"Ġ in",
"Ġp l",
"Ġ O",
"o w",
"v er",
"r i",
"u t",
"Ġb e",
"Ġ u",
"Ġpl ay",
"Ġsa id",
"p p",
"it h",
"Ġw ith",
"Ġd ay",
"e x",
"Ġ y",
"o o",
"c e",
"Ġ r",
"Ġ I",
"c k",
"Ġhe r",
"Ġ L",
"l d",
"Ġh is",
"n e",
"k e",
"Ġ B",
"Ġs t",
"Ġb ig",
"ver y",
"n t",
"ex t",
"s t",
"t ext",
"Ġy ou",
"v e",
"ĠThe y",
"Ġ M",
"Ġha pp",
"il y",
"Ġ on",
"u n",
"k ed",
"a ll",
"ri end",
"Ġf riend",
"Ġl i",
"Ġthe y",
"Ġw e",
"Ġha d",
"Ġn ot",
"he r",
"Ġu p",
"Ġwa nt",
"Ġ of",
"a d",
"s e",
"Ġ <",
"| >",
"Ġ< |",
"Ġ e",
"it t",
"Ġd o",
"Ġ A",
"ĠT im",
"Ġhapp y",
"en t",
"Ġ very",
"Ġth at",
"Ġsa w",
"ou ld",
"' s",
"Ġm om",
"Ġf or",
"Ġs h",
"itt le",
"ĠS he",
"im e",
"Ġl ittle",
"Ġs he",
"Ġ k",
"c h",
"Ġt ime",
"of text",
". \"",
"Ġn am",
"e s",
"ou nd",
"Ġs o",
"n ce",
"Ġnam ed",
"Ġthe re",
"Ġb o",
"Ġwe re",
"Ġn e",
"ou t",
"Ġwant ed",
"Ġb ut",
"u e",
"Ġfriend s",
"! \"",
"ir d",
"h t",
"Ġa n",
"a l",
"u g",
"Ġb ird",
"a ke",
"v ed",
"e l",
"om e",
"ĠI t",
"Ġto o",
"Ġhe l",
"Ġ Ċ",
"Ġhel p",
"id e",
"Ġw ent",
"Ġw h",
"Ġ is",
"r y",
"Ġs m",
"Ġa ll",
"Ġl oo",
"t er",
"Ġl o",
"end oftext",
"Ġup on",
"am e",
"o re",
"i ll",
"i nd",
"Ġd id",
"Ġf un",
"r a",
"Ġto y",
"Ġa s",
"g et",
"Ġ j",
"Ġ re",
"Ġa t",
"ĠL ily",
"u r",
"ĠO ne",
"l y",
"get her",
"a ck",
"Ġs e",
"Ġ o",
"Ġto gether",
"ĠT om",
"Ġt re",
"Ġc at",
"oo d",
"Ġc ould",
"Ġdo g",
"e c",
"ar t",
"Ġc an",
"a x",
"Ġthe ir",
"m y",
"ar d",
"ar k",
"Ġg ir",
"Ġh im",
"u m",
"Ġr o",
"Ġplay ed",
"Ġb all",
"? \"",
"Ġgir l",
"w ay",
"Ġ W",
"he n",
"Ġg o",
"Ġf r",
"Ġa re",
"Ġl e",
"Ġ out",
"a in",
"' t",
"Ġthe m",
"Ġsa d",
"u l",
"ot her",
"Ġbo y",
"Ġtre e",
"Ġha ve",
"Ġc l",
"Ġm an",
"on e",
"ou g",
"Ġlo ved",
"Ġloo ked",
"i c",
"Ġf ound",
"Ġs p",
"ĠO nce",
"Ġ J",
"Ġb ack",
"Ġl a",
"Ġli ke",
"h ing",
"ow n",
"f ul",
"Ġs c",
"a re",
"s ide",
"he d",
"Ġm e",
"ig ht",
"on g",
"Ġp ark",
"o p",
"e ll",
"Ġst art",
"i ck",
"el t",
"Ġm ake",
"Ġw ould",
"p ot",
"r ound",
"Ġc ar",
"Ġf a",
"Ġs ay",
"Ġf elt",
"Ġ F",
"Ġn o",
"Ġse e",
"o b",
"a g",
"Ġas ked",
"i a",
"Ġ other",
"om et",
"Ġne w",
"i ce",
"ou se",
"Ġstart ed",
"Ġc ame",
"s s",
"Ġa l",
"ar ed",
"Ġs omet",
"Ġa g",
"Ġg ood",
"oug ht",
"Ġb r",
"Ġsm all",
"ad e",
"Ġwa l",
"Ġla ug",
"oo k",
"Ġth ing",
"Ġ ex",
"Ġf ind",
"Ġw or",
"Ġc o",
"ri ed",
"Ġp ut",
"Ġa way",
"Ġe very",
"Ġ Y",
"Ġwh at",
"Ġth ought",
"Ġsomet hing",
"Ġfr om",
"Ġm ade",
"Ġh ome",
"ĠB ut",
"Ġplay ing",
"i le",
"u d",
"u s",
"a ch",
"i e",
"u c",
"ĠS ue",
"ar n",
"Ġr an",
"n y",
"Ġf l",
"a ve",
"Ġs ome",
"n ow",
"Ġsm il",
"Ġag ain",
"u st",
"ĠM ax",
"u re",
"Ġh ouse",
"Ġd own",
"Ġp r",
"k ing",
"Ġsc ared",
"Ġtoo k",
"Ġle arn",
"h at",
"Ġtoy s",
"e p",
"i f",
"a b",
"Ġw ill",
"re t",
"Ġbo x",
"an k",
"Ġb l",
"u ck",
"Ġm y",
"Ġyou r",
"Ġthing s",
"Ġa round",
"Ġl ot",
"ou d",
"Ġf e",
"is h",
"Ġli ved",
"Ġs un",
"um p",
"is t",
"Ġthe n",
"ĠB en",
"a s",
"Ġc h",
", \"",
"Ġw hen",
"Ġ D",
"Ġbe c",
"Ġa b",
"t y",
"ĠS am",
"Ġs w",
"Ġd ec",
"Ġg et",
"ne w",
"uc y",
"a p",
"ĠL ucy",
"Ġdec id",
"pp ed",
"ĠS o",
"ot h",
"Ġli ked",
"Ġt ried",
"Ġk now",
"u ch",
"Ġg ot",
"Ġan y",
"u se",
"a use",
"Ġwh o",
"en ed",
"nd er",
"all y",
"Ġman y",
"Ġin t",
"f ter",
"Ġab out",
"Ġp ret",
"i ve",
"Ġ E",
"a ce",
"Ġsh ow",
"Ġr ed",
"ou s",
"Ġj ump",
"it ed",
"q u",
"Ġm ore",
"is e",
"Ġ v",
"Ġh ug",
"Ġc are",
"ur p",
"Ġp o",
"Ġu n",
"Ġloo k",
"Ġlearn ed",
"Ġwa ter",
"n n",
"Ġbe st",
"Ġsmil ed",
"Ġo p",
"an t",
"Ġg re",
"Ġex c",
"ec t",
"way s",
"â Ģ",
"Ġout side",
"Ġal ways",
"f e",
"Ġro om",
"Ġh o",
"nn a",
"it e",
"Ġp e",
"Ġint o",
"Ġe at",
"ow er",
"Ġb oth",
"ĠS pot",
"ou r",
"Ġd ad",
"Ġs or",
"ar a",
"Ġ ke",
"Ġon e",
"Ġfe el",
"urp r",
"Ġs urpr",
"Ġn ice",
"Ġ C",
"Ġexc ited",
"Ġth is",
"h ank",
"Ġfa st",
"Ġth an",
"Ġr un",
"Ġl ong",
"im al",
"Ġan imal",
"Ġa m",
"Ġm o",
"Ġs k",
"Ġto ld",
"in k",
"Ġt r",
"Ġin side",
"u ll",
"ĠM ia",
"ĠM om",
"Ġg ra",
"o g",
"Ġro ck",
"Ġpret ty",
"in y",
"Ġp ick",
"Ġt ake",
"Ġe ach",
"Ġg ave",
"Ġs l",
"Ġm uch",
"d en",
"r om",
"Ġst r",
"Ġh ow",
"Ġne ed",
"Ġto w",
"v en",
"et ter",
"Ġ or",
"ĠY ou",
"ĠA s",
"Ġu nder",
"he re",
"Ġo ld",
"Ġfl ower",
"g e",
"r o",
"ur t",
"p l",
"g ed",
"a se",
"le w",
"a nd",
"Ġc le",
"Ġf ish",
"a st",
"es s",
"Ġl ist",
"Ġcl o",
"Ġt ry",
"Ġbe ar",
"Ġha nd",
"Ġk ind",
"ur n",
"m ore",
"ĠW e",
"Ġt e",
"Ġsurpr is",
"Ġsay s",
"Ġj ust",
"Ġf ood",
"Ġne ar",
"p ect",
"in e",
"d y",
"Ġh ig",
"ĠB ob",
"Ġwa t",
"Ġf i",
"Ġ ide",
"ĠI n",
"Ġsk y",
"h is",
"v ing",
"Ġt w",
"Ġu s",
"Ġ K",
"Ġide a",
"Ġb etter",
"Ġb ug",
"at e",
"Ġhe ard",
"Ġ en",
"g ry",
"Ġit s",
"l f",
"ab le",
"f f",
"Ġl et",
"b er",
"Ġcare ful",
"ec i",
"Ġsh are",
"Ġk new",
"i on",
"Ġ if",
"Ġd an",
"Ġco l",
"Ġf ly",
"Ġf o",
"Ġst or",
"Ġf lew",
"pect ed",
"ex pected",
"re am",
"ĠA nd",
"Ġc om",
"eci al",
"Ġsp ecial",
"Ġcol or",
"Ġg r",
"a c",
"Ġne ver",
"Ġlo ve",
"Ġb y",
"or t",
"Ġbec ame",
"Ġw ind",
"Ġd on",
"r m",
"Ġb u",
"Ġt al",
"Ġcle an",
"Ġlaug hed",
"Ġ end",
"Ġe ven",
"op le",
"h y",
"Ġdecid ed",
"Ġm ag",
"Ġbec ause",
"Ġh ard",
"Ġo ver",
"Ġsh iny",
"Ġcl im",
"Ġclim b",
"b b",
"Ġc ake",
"a k",
"Ġb ook",
"Ġt urn",
"Ġ P",
"ĠThe n",
"Ġf am",
"ad y",
"Ġh urt",
"Ġb ad",
"Ġsa fe",
"Ġa fter",
"Ġpr oud",
"Ġf ore",
"Ġc he",
"Ġpe ople",
"Ġc u",
"Ġg l",
"Ġhig h",
"Ġ N",
"Ġl oud",
"Ġc ome",
"ard en",
"Ġdo or",
"Ġg arden",
"Ġg ive",
"Ġg round",
"Ġ im",
"Ġop ened",
"Ġpick ed",
"a il",
"ĠW hen",
"il d",
"u ff",
"i z",
"Y es",
"Ġwa y",
"Ġbl ue",
"' m",
"an e",
"Ġst ill",
"k ay",
"ud den",
"Ġe ver",
"Ġhug ged",
"i p",
"Ġc all",
"ag e",
"Ġst ay",
"o ck",
"b e",
"Ġof f",
"Ġf ar",
"Ġmag ic",
"oug h",
"Ġ qu",
"ĠS ara",
"ĠH is",
"o pped",
"Ġsh ould",
"Ġpl ace",
"Ġp ic",
"Ġa d",
"oo l",
"Ġfam ily",
"Ġk id",
"Ġwal k",
"Ġy um",
"le ase",
"Ġn ow",
"e m",
"Ġgre at",
"t ure",
"Ġstr ong",
"a ut",
"Ġfore st",
"ĠA nna",
"Ġu nt",
"ĠA my",
"N o",
"Ġb ra",
"Ġfr og",
"Ġa pp",
"Ġpic ture",
"Ġbr o",
"o y",
"ar y",
"Ġunt il",
"Ġst ick",
"Ġs qu",
"Ġbe aut",
"n ing",
"c t",
"Ġw o",
"Ġn ext",
"Ġbo at",
"Ġsor ry",
"Ġlist en",
"Ġt ra",
"p t",
"Ġ R",
"Ġkid s",
"i ful",
"Ġbeaut iful",
"a king",
"d ed",
"Ġd ra",
"Ġha t",
"Ġr ain",
"Ġclo s",
"Ġstor y",
"re l",
"Ġwh ile",
"Ġwal ked",
"er s",
"Ġtow n",
"re ss",
"Ġim p",
"Ġs of",
"se lf",
"ill y",
"ĠA t",
"udden ly",
"b y",
"Ġc ry",
"Ġbe ing",
"d ded",
"re e",
"Ġm or",
"Ġcall ed",
"un ny",
"Ġm et",
"Ġhapp ened",
"Ġg ame",
"Ġp art",
"ĠH er",
"Ġdid n",
"v ent",
"Ġre m",
"Ġop en",
"Ġanimal s",
"Ġtr uck",
"he s",
"g er",
"Ġdo ll",
"ĠE very",
"Ġan gry",
"Ġsof t",
"m a",
"Ġke ep",
"o on",
"a z",
"Ġlo st",
"Ġb ed",
"ĠF rom",
"b le",
"Ġwa rm",
"Ġex pl",
"is s",
"Ġ G",
"Ġbra ve",
"Ġm ouse",
"c hed",
"Ġat e",
"Ġd e",
"uff y",
"Ġho le",
"I t",
"f ore",
"s o",
"Ġwat ch",
"Ġle ave",
"Ġs n",
"Ġal so",
"i es",
"Ġf ell",
"Ġgre en",
"T hank",
"Ġfa ce",
"g an",
"Ġtw o",
"b it",
"ab bit",
"Ġ âĢ",
"ow l",
"Ġno ise",
"Ġany more",
"us h",
"ĠF l",
"ell o",
"ar s",
"Ġw here",
"Ġsw ing",
"ir st",
"Ġc ook",
"Ġlot s",
"Ġso on",
"Ġr abbit",
"Ġsl ide",
"ir rel",
"a ir",
"Ġbe fore",
"Ġsqu irrel",
"Ġj o",
"Ġth ink",
"Ġsa t",
"f t",
"Ġf in",
"ĠFl uffy",
"d ay",
"Ġu se",
"Ġke pt",
"ĠK itt",
"H i",
"ĠâĢ ľ",
"âĢ Ŀ",
"ir ed",
"Ġy ell",
"a ug",
"aug ht",
"Ġst ore",
"Ġp ain",
"Ġhand s"
]
}
}