{
"version": "1.0",
"truncation": null,
"padding": null,
"added_tokens": [
{
"id": 1024,
"content": "<|endoftext|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": true,
"special": true
}
],
"normalizer": null,
"pre_tokenizer": {
"type": "ByteLevel",
"add_prefix_space": false,
"trim_offsets": true,
"use_regex": true
},
"post_processor": {
"type": "ByteLevel",
"add_prefix_space": true,
"trim_offsets": false,
"use_regex": true
},
"decoder": {
"type": "ByteLevel",
"add_prefix_space": true,
"trim_offsets": true,
"use_regex": true
},
"model": {
"type": "BPE",
"dropout": null,
"unk_token": null,
"continuing_subword_prefix": null,
"end_of_word_suffix": null,
"fuse_unk": false,
"byte_fallback": false,
"ignore_merges": false,
"vocab": {
"!": 0,
"\"": 1,
"#": 2,
"$": 3,
"%": 4,
"&": 5,
"'": 6,
"(": 7,
")": 8,
"*": 9,
"+": 10,
",": 11,
"-": 12,
".": 13,
"/": 14,
"0": 15,
"1": 16,
"2": 17,
"3": 18,
"4": 19,
"5": 20,
"6": 21,
"7": 22,
"8": 23,
"9": 24,
":": 25,
";": 26,
"<": 27,
"=": 28,
">": 29,
"?": 30,
"@": 31,
"A": 32,
"B": 33,
"C": 34,
"D": 35,
"E": 36,
"F": 37,
"G": 38,
"H": 39,
"I": 40,
"J": 41,
"K": 42,
"L": 43,
"M": 44,
"N": 45,
"O": 46,
"P": 47,
"Q": 48,
"R": 49,
"S": 50,
"T": 51,
"U": 52,
"V": 53,
"W": 54,
"X": 55,
"Y": 56,
"Z": 57,
"[": 58,
"\\": 59,
"]": 60,
"_": 61,
"`": 62,
"a": 63,
"b": 64,
"c": 65,
"d": 66,
"e": 67,
"f": 68,
"g": 69,
"h": 70,
"i": 71,
"j": 72,
"k": 73,
"l": 74,
"m": 75,
"n": 76,
"o": 77,
"p": 78,
"q": 79,
"r": 80,
"s": 81,
"t": 82,
"u": 83,
"v": 84,
"w": 85,
"x": 86,
"y": 87,
"z": 88,
"{": 89,
"|": 90,
"}": 91,
"~": 92,
"¡": 93,
"¢": 94,
"£": 95,
"¤": 96,
"¥": 97,
"¦": 98,
"§": 99,
"¨": 100,
"©": 101,
"ª": 102,
"«": 103,
"¬": 104,
"®": 105,
"¯": 106,
"°": 107,
"±": 108,
"³": 109,
"´": 110,
"µ": 111,
"¶": 112,
"·": 113,
"¸": 114,
"¹": 115,
"º": 116,
"»": 117,
"¼": 118,
"½": 119,
"¾": 120,
"¿": 121,
"Â": 122,
"Ã": 123,
"Ä": 124,
"Å": 125,
"É": 126,
"Ê": 127,
"Ñ": 128,
"Ò": 129,
"á": 130,
"â": 131,
"ã": 132,
"ä": 133,
"å": 134,
"æ": 135,
"ç": 136,
"è": 137,
"é": 138,
"î": 139,
"ï": 140,
"ð": 141,
"ĉ": 142,
"Ċ": 143,
"Ġ": 144,
"Ģ": 145,
"ģ": 146,
"Ĥ": 147,
"ĥ": 148,
"Ħ": 149,
"ħ": 150,
"Ĩ": 151,
"ĩ": 152,
"Ī": 153,
"ī": 154,
"Ĭ": 155,
"ĭ": 156,
"Į": 157,
"į": 158,
"İ": 159,
"ı": 160,
"Ĳ": 161,
"ĳ": 162,
"Ĵ": 163,
"ĵ": 164,
"Ķ": 165,
"ķ": 166,
"ĸ": 167,
"ĺ": 168,
"Ļ": 169,
"ļ": 170,
"Ľ": 171,
"ľ": 172,
"Ŀ": 173,
"ŀ": 174,
"Ł": 175,
"ł": 176,
"Ń": 177,
"he": 178,
"Ġt": 179,
"Ġa": 180,
"Ġs": 181,
"nd": 182,
"Ġw": 183,
"Ġthe": 184,
"ed": 185,
"ĠT": 186,
"Ġb": 187,
"Ġto": 188,
"Ġand": 189,
"Ġh": 190,
"Ġf": 191,
"in": 192,
"Ġwa": 193,
"re": 194,
"ou": 195,
"it": 196,
"Ġl": 197,
"Ġd": 198,
"Ġc": 199,
"Ġp": 200,
"ay": 201,
"er": 202,
"om": 203,
"Ġm": 204,
"Ġwas": 205,
"im": 206,
"ĠS": 207,
"Ġhe": 208,
"is": 209,
"ar": 210,
"Ġn": 211,
"on": 212,
"Ġsa": 213,
"id": 214,
"ll": 215,
"Ġha": 216,
"at": 217,
"Ġg": 218,
"ing": 219,
"hey": 220,
"ot": 221,
"en": 222,
"an": 223,
"le": 224,
"end": 225,
"or": 226,
"of": 227,
"am": 228,
"Ġ\"": 229,
"ĠH": 230,
"ir": 231,
"et": 232,
"il": 233,
"Ġth": 234,
"Ġit": 235,
"ig": 236,
"ĠO": 237,
"ĠHe": 238,
"Ġin": 239,
"Ġpl": 240,
"ow": 241,
"ut": 242,
"ver": 243,
"ri": 244,
"Ġbe": 245,
"ex": 246,
"Ġu": 247,
"Ġplay": 248,
"Ġsaid": 249,
"pp": 250,
"ce": 251,
"ith": 252,
"Ġwith": 253,
"Ġday": 254,
"Ġy": 255,
"oo": 256,
"ĠL": 257,
"Ġr": 258,
"ne": 259,
"ck": 260,
"ĠI": 261,
"ĠB": 262,
"Ġher": 263,
"ext": 264,
"text": 265,
"ld": 266,
"Ġhis": 267,
"ke": 268,
"Ġst": 269,
"very": 270,
"ĠM": 271,
"Ġbig": 272,
"nt": 273,
"st": 274,
"Ġyou": 275,
"ily": 276,
"ve": 277,
"Ġhapp": 278,
"un": 279,
"Ġon": 280,
"Ġli": 281,
"all": 282,
"riend": 283,
"Ġfriend": 284,
"Ġthey": 285,
"Ġwe": 286,
"Ġhad": 287,
"her": 288,
"Ġnot": 289,
"Ġup": 290,
"Ġwant": 291,
"se": 292,
"Ġof": 293,
"ad": 294,
"ĠA": 295,
"Ġ<": 296,
"|>": 297,
"Ġ<|": 298,
"Ġe": 299,
"Ġdo": 300,
"itt": 301,
"ked": 302,
"ent": 303,
"Ġhappy": 304,
"Ġvery": 305,
"ould": 306,
"Ġthat": 307,
"Ġsaw": 308,
"'s": 309,
"Ġmom": 310,
"Ġfor": 311,
"Ġsh": 312,
"ittle": 313,
"nce": 314,
"ime": 315,
"Ġlittle": 316,
"Ġk": 317,
"Ġshe": 318,
"ch": 319,
"Ġtime": 320,
".\"": 321,
"Ġnam": 322,
"ound": 323,
"Ġso": 324,
"Ġthere": 325,
"ue": 326,
"Ġnamed": 327,
"Ġbo": 328,
"Ġwere": 329,
"es": 330,
"Ġne": 331,
"out": 332,
"Ġbut": 333,
"Ġwanted": 334,
"ĠThe": 335,
"ug": 336,
"Ġfriends": 337,
"!\"": 338,
"Ġan": 339,
"al": 340,
"ird": 341,
"ht": 342,
"ake": 343,
"Ġbird": 344,
"ome": 345,
"Ġhel": 346,
"Ġhelp": 347,
"el": 348,
"ĠIt": 349,
"Ġtoo": 350,
"oftext": 351,
"ry": 352,
"ĠĊ": 353,
"ved": 354,
"ide": 355,
"Ġwent": 356,
"Ġwh": 357,
"Ġis": 358,
"ter": 359,
"Ġall": 360,
"Ġloo": 361,
"ĠThey": 362,
"Ġlo": 363,
"Ġupon": 364,
"ame": 365,
"ill": 366,
"Ġdid": 367,
"ore": 368,
"ra": 369,
"ind": 370,
"Ġfun": 371,
"ly": 372,
"Ġre": 373,
"Ġj": 374,
"Ġtoy": 375,
"Ġas": 376,
"get": 377,
"ur": 378,
"Ġat": 379,
"ack": 380,
"Ġse": 381,
"Ġsm": 382,
"gether": 383,
"Ġo": 384,
"Ġtogether": 385,
"Ġtre": 386,
"ax": 387,
"Ġcat": 388,
"ood": 389,
"Ġcould": 390,
"ec": 391,
"my": 392,
"ĠTim": 393,
"Ġdog": 394,
"art": 395,
"Ġcan": 396,
"Ġtheir": 397,
"ark": 398,
"ard": 399,
"ĠW": 400,
"um": 401,
"hen": 402,
"Ġro": 403,
"Ġhim": 404,
"irl": 405,
"Ġplayed": 406,
"Ġball": 407,
"?\"": 408,
"Ġgirl": 409,
"way": 410,
"Ġgo": 411,
"rom": 412,
"ĠShe": 413,
"Ġle": 414,
"Ġare": 415,
"Ġout": 416,
"ain": 417,
"Ġthem": 418,
"'t": 419,
"ul": 420,
"Ġsad": 421,
"other": 422,
"one": 423,
"Ġcl": 424,
"Ġboy": 425,
"Ġtree": 426,
"Ġhave": 427,
"Ġman": 428,
"pot": 429,
"ĠJ": 430,
"Ġla": 431,
"oug": 432,
"Ġloved": 433,
"Ġlooked": 434,
"Ġfound": 435,
"ic": 436,
"Ġback": 437,
"Ġlike": 438,
"Ġsp": 439,
"ful": 440,
"own": 441,
"are": 442,
"Ġsay": 443,
"ro": 444,
"ia": 445,
"hing": 446,
"side": 447,
"ell": 448,
"Ġme": 449,
"Ġsc": 450,
"ight": 451,
"ĠF": 452,
"Ġpark": 453,
"ong": 454,
"ick": 455,
"Ġstart": 456,
"Ġmake": 457,
"Ġwould": 458,
"elt": 459,
"Ġcar": 460,
"Ġno": 461,
"round": 462,
"Ġfa": 463,
"Ġfelt": 464,
"Ġsee": 465,
"Ġother": 466,
"Ġlaug": 467,
"op": 468,
"ss": 469,
"ag": 470,
"ob": 471,
"Ġasked": 472,
"ice": 473,
"Ġnew": 474,
"ouse": 475,
"omet": 476,
"Ġstarted": 477,
"Ġcame": 478,
"endoftext": 479,
"Ġal": 480,
"Ġwal": 481,
"Ġsomet": 482,
"Ġag": 483,
"ared": 484,
"Ġgood": 485,
"Ġsmall": 486,
"ook": 487,
"ought": 488,
"ĠY": 489,
"ade": 490,
"hed": 491,
"ĠLily": 492,
"ud": 493,
"Ġevery": 494,
"ĠTom": 495,
"Ġco": 496,
"ĠOne": 497,
"Ġex": 498,
"Ġthing": 499,
"Ġfind": 500,
"Ġwor": 501,
"Ġput": 502,
"ile": 503,
"Ġaway": 504,
"Ġthought": 505,
"Ġwhat": 506,
"Ġsomething": 507,
"Ġfrom": 508,
"Ġmade": 509,
"Ġhome": 510,
"hat": 511,
"Ġplaying": 512,
"us": 513,
"ie": 514,
"ried": 515,
"ny": 516,
"ach": 517,
"Ġfl": 518,
"uc": 519,
"arn": 520,
"Ġran": 521,
"Ġsome": 522,
"ave": 523,
"now": 524,
"ust": 525,
"ble": 526,
"ank": 527,
"ure": 528,
"Ġagain": 529,
"Ġlot": 530,
"Ġlook": 531,
"Ġhouse": 532,
"Ġdown": 533,
"came": 534,
"Ġscared": 535,
"Ġtook": 536,
"Ġbl": 537,
"ep": 538,
"Ġlearn": 539,
"Ġtoys": 540,
"ret": 541,
"uck": 542,
"ump": 543,
"Ġwill": 544,
"if": 545,
"Ġbox": 546,
"Ġyour": 547,
"Ġmy": 548,
"oud": 549,
"Ġfe": 550,
"Ġthings": 551,
"Ġaround": 552,
"ĠD": 553,
"Ġdec": 554,
"Ġdecid": 555,
"ish": 556,
"ist": 557,
"new": 558,
"Ġsun": 559,
"Ġbr": 560,
"Ġlived": 561,
"Ġch": 562,
"as": 563,
"Ġthen": 564,
"ca": 565,
",\"": 566,
"Ġwhen": 567,
"ty": 568,
"use": 569,
"cause": 570,
"Ġget": 571,
"ally": 572,
"Ġany": 573,
"ucy": 574,
"ĠLucy": 575,
"Ġsw": 576,
"fter": 577,
"oth": 578,
"Ġknow": 579,
"uch": 580,
"Ġtried": 581,
"ĠE": 582,
"nder": 583,
"Ġsmil": 584,
"Ġgot": 585,
"Ġshow": 586,
"Ġwho": 587,
"Ġjump": 588,
"ap": 589,
"Ġab": 590,
"ĠOnce": 591,
"Ġmany": 592,
"pped": 593,
"Ġint": 594,
"Ġpret": 595,
"nn": 596,
"ĠSo": 597,
"ive": 598,
"Ġabout": 599,
"Ġhappen": 600,
"nna": 601,
"ace": 602,
"ous": 603,
"Ġred": 604,
"qu": 605,
"urp": 606,
"Ġun": 607,
"Ġv": 608,
"Ġhug": 609,
"Ġmore": 610,
"ise": 611,
"Ġpo": 612,
"Ġcare": 613,
"king": 614,
"ect": 615,
"Ġwater": 616,
"Ġlearned": 617,
"pen": 618,
"ant": 619,
"Ġbest": 620,
"ara": 621,
"Ġsor": 622,
"Ġgre": 623,
"Ġexc": 624,
"Ġexcit": 625,
"hank": 626,
"Ġta": 627,
"ways": 628,
"ower": 629,
"âĢ": 630,
"Ġoutside": 631,
"Ġpr": 632,
"Ġalways": 633,
"ĠC": 634,
"Ġpe": 635,
"Ġthan": 636,
"fe": 637,
"Ġho": 638,
"Ġroom": 639,
"Ġeat": 640,
"Ġinto": 641,
"Ġopen": 642,
"our": 643,
"imal": 644,
"Ġanimal": 645,
"urpr": 646,
"Ġsurpr": 647,
"Ġboth": 648,
"Ġfeel": 649,
"Ġdad": 650,
"ite": 651,
"Ġke": 652,
"Ġone": 653,
"den": 654,
"Ġnice": 655,
"Ġexcited": 656,
"Ġthis": 657,
"Ġfast": 658,
"Ġmo": 659,
"Ġam": 660,
"Ġlong": 661,
"Ġrun": 662,
"ink": 663,
"Ġsk": 664,
"Ġgra": 665,
"Ġtold": 666,
"Ġrock": 667,
"Ġinside": 668,
"ull": 669,
"Ġpretty": 670,
"iny": 671,
"bb": 672,
"Ġpick": 673,
"Ġtr": 674,
"Ġtake": 675,
"Ġflower": 676,
"Ġeach": 677,
"Ġgave": 678,
"Ġmuch": 679,
"Ġsl": 680,
"here": 681,
"Ġneed": 682,
"Ġhow": 683,
"Ġtow": 684,
"Ġstr": 685,
"ven": 686,
"etter": 687,
"Ġor": 688,
"pl": 689,
"Ġsurpris": 690,
"ĠAs": 691,
"Ġunder": 692,
"more": 693,
"Ġold": 694,
"ĠBut": 695,
"ge": 696,
"his": 697,
"isten": 698,
"Ġlisten": 699,
"Ġtry": 700,
"urt": 701,
"dy": 702,
"and": 703,
"ĠK": 704,
"Ġcle": 705,
"Ġfish": 706,
"pect": 707,
"ĠSue": 708,
"ase": 709,
"Ġclo": 710,
"Ġbear": 711,
"Ġkind": 712,
"Ġhand": 713,
"urn": 714,
"Ġfle": 715,
"ĠWe": 716,
"ged": 717,
"Ġte": 718,
"Ġnear": 719,
"ĠMax": 720,
"lf": 721,
"ine": 722,
"Ġjust": 723,
"Ġfood": 724,
"Ġfi": 725,
"Ġwat": 726,
"Ġhig": 727,
"Ġtw": 728,
"Ġide": 729,
"pected": 730,
"expected": 731,
"ĠIn": 732,
"by": 733,
"Ġcol": 734,
"Ġcolor": 735,
"Ġsky": 736,
"Ġen": 737,
"ess": 738,
"Ġfo": 739,
"ate": 740,
"ving": 741,
"Ġus": 742,
"Ġidea": 743,
"Ġbetter": 744,
"Ġheard": 745,
"Ġbug": 746,
"gry": 747,
"Ġits": 748,
"ff": 749,
"Ġlet": 750,
"Ġdan": 751,
"ĠBen": 752,
"ion": 753,
"ac": 754,
"ream": 755,
"eci": 756,
"Ġcareful": 757,
"Ġshare": 758,
"Ġif": 759,
"Ġgr": 760,
"Ġlove": 761,
"Ġfly": 762,
"Ġstor": 763,
"Ġcom": 764,
"Ġflew": 765,
"ĠSam": 766,
"hy": 767,
"be": 768,
"ber": 769,
"ecial": 770,
"Ġspecial": 771,
"ort": 772,
"Ġnever": 773,
"Ġby": 774,
"Ġwind": 775,
"Ġbu": 776,
"rm": 777,
"Ġdon": 778,
"Ġclim": 779,
"Ġclimb": 780,
"Ġtal": 781,
"Ġclean": 782,
"ĠN": 783,
"ĠP": 784,
"Ġend": 785,
"Ġeven": 786,
"ople": 787,
"Ġmag": 788,
"Ġliked": 789,
"Ġhard": 790,
"Ġover": 791,
"Ġshiny": 792,
"Ġbook": 793,
"Ġcake": 794,
"Ġwait": 795,
"ane": 796,
"Ġjo": 797,
"Ġche": 798,
"Ġhurt": 799,
"Ġfr": 800,
"opped": 801,
"Ġturn": 802,
"Ġproud": 803,
"ady": 804,
"Ġfam": 805,
"Ġbad": 806,
"Ġgl": 807,
"Ġafter": 808,
"Ġsafe": 809,
"Ġcu": 810,
"Ġgive": 811,
"Ġpeople": 812,
"Ġloud": 813,
"iz": 814,
"kay": 815,
"Ġhigh": 816,
"Ġim": 817,
"ock": 818,
"arden": 819,
"Ġgarden": 820,
"Ġcome": 821,
"Ġdoor": 822,
"Ġyum": 823,
"Ġground": 824,
"Ġopened": 825,
"Ġpicked": 826,
"Ġstay": 827,
"ĠMom": 828,
"Ġfore": 829,
"uff": 830,
"Ġbea": 831,
"ild": 832,
"Ġra": 833,
"Ġblue": 834,
"dd": 835,
"Ġway": 836,
"Ġqu": 837,
"'m": 838,
"Ġstill": 839,
"Ġever": 840,
"ip": 841,
"Ġhugged": 842,
"age": 843,
"Ġcall": 844,
"Ġoff": 845,
"Ġfar": 846,
"Ġpic": 847,
"Ġplace": 848,
"ough": 849,
"Ġmagic": 850,
"dded": 851,
"lease": 852,
"Ġshould": 853,
"Ġsmiled": 854,
"rog": 855,
"ture": 856,
"ool": 857,
"Ġwalk": 858,
"Ġfamily": 859,
"Ġkid": 860,
"ary": 861,
"Ġpicture": 862,
"Ġwo": 863,
"em": 864,
"Ġma": 865,
"Ġapp": 866,
"illy": 867,
"Ġnow": 868,
"udden": 869,
"Ġgreat": 870,
"Ġpa": 871,
"self": 872,
"Ġca": 873,
"Ġstrong": 874,
"Ġfrog": 875,
"Ġbra": 876,
"ĠR": 877,
"Ġforest": 878,
"ĠSpot": 879,
"No": 880,
"Ġunt": 881,
"Ġbro": 882,
"Ġstick": 883,
"Ġsqu": 884,
"Ġuntil": 885,
"ct": 886,
"Ġbeaut": 887,
"ning": 888,
"Ġtra": 889,
"Ġnext": 890,
"Ġboat": 891,
"ak": 892,
"pt": 893,
"Ġhat": 894,
"Ġrain": 895,
"Ġcry": 896,
"Ġkids": 897,
"Ġdra": 898,
"Ġbeauti": 899,
"Ġbeautiful": 900,
"ma": 901,
"Ġclos": 902,
"Ġstory": 903,
"rel": 904,
"Ġad": 905,
"Ġwhile": 906,
"ress": 907,
"Ġtown": 908,
"Ġexpl": 909,
"Ġsof": 910,
"ger": 911,
"ĠAt": 912,
"Ġbeing": 913,
"ree": 914,
"Ġimp": 915,
"ĠMia": 916,
"Ġdoll": 917,
"vent": 918,
"Ġmor": 919,
"Ġcalled": 920,
"ello": 921,
"ĠG": 922,
"Ġmet": 923,
"Ġtruck": 924,
"Ġgame": 925,
"Ġpart": 926,
"oon": 927,
"iss": 928,
"Ġsoft": 929,
"Ġangry": 930,
"Ġkeep": 931,
"ear": 932,
"unny": 933,
"Ġbed": 934,
"Ġwarm": 935,
"Ġlost": 936,
"Ġrem": 937,
"Ġbrave": 938,
"Ġmouse": 939,
"Ġate": 940,
"Ġsn": 941,
"Ġhole": 942,
"It": 943,
"fore": 944,
"ĠYou": 945,
"so": 946,
"Ġwatch": 947,
"Ġswing": 948,
"Ġleave": 949,
"Ġcook": 950,
"Ġalso": 951,
"Ġfell": 952,
"oy": 953,
"Ġgreen": 954,
"gan": 955,
"ers": 956,
"Ġface": 957,
"Ġtwo": 958,
"bbit": 959,
"uffy": 960,
"owl": 961,
"Ġthink": 962,
"Ġfin": 963,
"ĠâĢ": 964,
"ush": 965,
"Ġnoise": 966,
"Ġwhere": 967,
"az": 968,
"day": 969,
"Ġde": 970,
"obo": 971,
"Ġrabbit": 972,
"ĠFl": 973,
"irrel": 974,
"Ġsoon": 975,
"irst": 976,
"oh": 977,
"ohn": 978,
"Ġapple": 979,
"able": 980,
"Ġslide": 981,
"Ġsound": 982,
"ft": 983,
"Ġsquirrel": 984,
"Ġask": 985,
"Ġbefore": 986,
"ched": 987,
"Ġcla": 988,
"Ġyell": 989,
"Ġsat": 990,
"joy": 991,
"Ġenjoy": 992,
"ĠFluffy": 993,
"Ġblock": 994,
"Ġuse": 995,
"ught": 996,
"ired": 997,
"Ġkept": 998,
"uit": 999,
"Hi": 1000,
"ĠâĢľ": 1001,
"âĢĿ": 1002,
"leep": 1003,
"ious": 1004,
"Ġcra": 1005,
"Ġpain": 1006,
"Ġstore": 1007,
"Ġhands": 1008,
"Ġbirds": 1009,
"hes": 1010,
"air": 1011,
"Ġgoing": 1012,
"Ġshout": 1013,
"Ġreal": 1014,
"Ġsays": 1015,
"Ġhaving": 1016,
"Ġfunny": 1017,
"Ġhop": 1018,
"Ġey": 1019,
"ĠAnd": 1020,
"Ġcatch": 1021,
"Ġbre": 1022,
"Ġwis": 1023
},
"merges": [
"h e",
"Ġ t",
"Ġ a",
"Ġ s",
"n d",
"Ġ w",
"Ġt he",
"e d",
"Ġ T",
"Ġ b",
"Ġt o",
"Ġa nd",
"Ġ h",
"Ġ f",
"i n",
"Ġw a",
"r e",
"o u",
"i t",
"Ġ l",
"Ġ d",
"Ġ c",
"Ġ p",
"a y",
"e r",
"o m",
"Ġ m",
"Ġwa s",
"i m",
"Ġ S",
"Ġ he",
"i s",
"a r",
"Ġ n",
"o n",
"Ġs a",
"i d",
"l l",
"Ġh a",
"a t",
"Ġ g",
"in g",
"he y",
"o t",
"e n",
"a n",
"l e",
"e nd",
"o r",
"o f",
"a m",
"Ġ \"",
"Ġ H",
"i r",
"e t",
"i l",
"Ġt h",
"Ġ it",
"i g",
"Ġ O",
"ĠH e",
"Ġ in",
"Ġp l",
"o w",
"u t",
"v er",
"r i",
"Ġb e",
"e x",
"Ġ u",
"Ġpl ay",
"Ġsa id",
"p p",
"c e",
"it h",
"Ġw ith",
"Ġd ay",
"Ġ y",
"o o",
"Ġ L",
"Ġ r",
"n e",
"c k",
"Ġ I",
"Ġ B",
"Ġhe r",
"ex t",
"t ext",
"l d",
"Ġh is",
"k e",
"Ġs t",
"ver y",
"Ġ M",
"Ġb ig",
"n t",
"s t",
"Ġy ou",
"il y",
"v e",
"Ġha pp",
"u n",
"Ġ on",
"Ġl i",
"a ll",
"ri end",
"Ġf riend",
"Ġthe y",
"Ġw e",
"Ġha d",
"he r",
"Ġn ot",
"Ġu p",
"Ġwa nt",
"s e",
"Ġ of",
"a d",
"Ġ A",
"Ġ <",
"| >",
"Ġ< |",
"Ġ e",
"Ġd o",
"it t",
"k ed",
"en t",
"Ġhapp y",
"Ġ very",
"ou ld",
"Ġth at",
"Ġsa w",
"' s",
"Ġm om",
"Ġf or",
"Ġs h",
"itt le",
"n ce",
"im e",
"Ġl ittle",
"Ġ k",
"Ġs he",
"c h",
"Ġt ime",
". \"",
"Ġn am",
"ou nd",
"Ġs o",
"Ġthe re",
"u e",
"Ġnam ed",
"Ġb o",
"Ġwe re",
"e s",
"Ġn e",
"ou t",
"Ġb ut",
"Ġwant ed",
"ĠT he",
"u g",
"Ġfriend s",
"! \"",
"Ġa n",
"a l",
"ir d",
"h t",
"a ke",
"Ġb ird",
"om e",
"Ġhe l",
"Ġhel p",
"e l",
"ĠI t",
"Ġto o",
"of text",
"r y",
"Ġ Ċ",
"v ed",
"id e",
"Ġw ent",
"Ġw h",
"Ġ is",
"t er",
"Ġa ll",
"Ġl oo",
"ĠT hey",
"Ġl o",
"Ġup on",
"am e",
"i ll",
"Ġd id",
"o re",
"r a",
"i nd",
"Ġf un",
"l y",
"Ġ re",
"Ġ j",
"Ġto y",
"Ġa s",
"g et",
"u r",
"Ġa t",
"a ck",
"Ġs e",
"Ġs m",
"get her",
"Ġ o",
"Ġto gether",
"Ġt re",
"a x",
"Ġc at",
"oo d",
"Ġc ould",
"e c",
"m y",
"ĠT im",
"Ġdo g",
"ar t",
"Ġc an",
"Ġthe ir",
"ar k",
"ar d",
"Ġ W",
"u m",
"he n",
"Ġr o",
"Ġh im",
"ir l",
"Ġplay ed",
"Ġb all",
"? \"",
"Ġg irl",
"w ay",
"Ġg o",
"r om",
"ĠS he",
"Ġl e",
"Ġa re",
"Ġ out",
"a in",
"Ġthe m",
"' t",
"u l",
"Ġsa d",
"ot her",
"on e",
"Ġc l",
"Ġbo y",
"Ġtre e",
"Ġha ve",
"Ġm an",
"p ot",
"Ġ J",
"Ġl a",
"ou g",
"Ġlo ved",
"Ġloo ked",
"Ġf ound",
"i c",
"Ġb ack",
"Ġli ke",
"Ġs p",
"f ul",
"ow n",
"a re",
"Ġs ay",
"r o",
"i a",
"h ing",
"s ide",
"e ll",
"Ġm e",
"Ġs c",
"ig ht",
"Ġ F",
"Ġp ark",
"on g",
"i ck",
"Ġst art",
"Ġm ake",
"Ġw ould",
"el t",
"Ġc ar",
"Ġn o",
"r ound",
"Ġf a",
"Ġf elt",
"Ġse e",
"Ġ other",
"Ġla ug",
"o p",
"s s",
"a g",
"o b",
"Ġas ked",
"i ce",
"Ġne w",
"ou se",
"om et",
"Ġstart ed",
"Ġc ame",
"end oftext",
"Ġa l",
"Ġwa l",
"Ġs omet",
"Ġa g",
"ar ed",
"Ġg ood",
"Ġsm all",
"oo k",
"oug ht",
"Ġ Y",
"ad e",
"he d",
"ĠL ily",
"u d",
"Ġe very",
"ĠT om",
"Ġc o",
"ĠO ne",
"Ġ ex",
"Ġth ing",
"Ġf ind",
"Ġw or",
"Ġp ut",
"i le",
"Ġa way",
"Ġth ought",
"Ġwh at",
"Ġsomet hing",
"Ġf rom",
"Ġm ade",
"Ġh ome",
"h at",
"Ġplay ing",
"u s",
"i e",
"ri ed",
"n y",
"a ch",
"Ġf l",
"u c",
"ar n",
"Ġr an",
"Ġs ome",
"a ve",
"n ow",
"u st",
"b le",
"an k",
"u re",
"Ġag ain",
"Ġl ot",
"Ġloo k",
"Ġh ouse",
"Ġd own",
"c ame",
"Ġsc ared",
"Ġtoo k",
"Ġb l",
"e p",
"Ġle arn",
"Ġtoy s",
"re t",
"u ck",
"um p",
"Ġw ill",
"i f",
"Ġbo x",
"Ġyou r",
"Ġm y",
"ou d",
"Ġf e",
"Ġthing s",
"Ġa round",
"Ġ D",
"Ġd ec",
"Ġdec id",
"is h",
"is t",
"ne w",
"Ġs un",
"Ġb r",
"Ġli ved",
"Ġc h",
"a s",
"Ġthe n",
"c a",
", \"",
"Ġw hen",
"t y",
"u se",
"ca use",
"Ġg et",
"all y",
"Ġan y",
"uc y",
"ĠL ucy",
"Ġs w",
"f ter",
"ot h",
"Ġk now",
"u ch",
"Ġt ried",
"Ġ E",
"nd er",
"Ġsm il",
"Ġg ot",
"Ġsh ow",
"Ġwh o",
"Ġj ump",
"a p",
"Ġa b",
"ĠO nce",
"Ġman y",
"pp ed",
"Ġin t",
"Ġp ret",
"n n",
"ĠS o",
"i ve",
"Ġab out",
"Ġhapp en",
"nn a",
"a ce",
"ou s",
"Ġr ed",
"q u",
"ur p",
"Ġu n",
"Ġ v",
"Ġh ug",
"Ġm ore",
"is e",
"Ġp o",
"Ġc are",
"k ing",
"ec t",
"Ġwa ter",
"Ġlearn ed",
"p en",
"an t",
"Ġbe st",
"ar a",
"Ġs or",
"Ġg re",
"Ġex c",
"Ġexc it",
"h ank",
"Ġt a",
"way s",
"ow er",
"â Ģ",
"Ġout side",
"Ġp r",
"Ġal ways",
"Ġ C",
"Ġp e",
"Ġth an",
"f e",
"Ġh o",
"Ġro om",
"Ġe at",
"Ġint o",
"Ġo pen",
"ou r",
"im al",
"Ġan imal",
"urp r",
"Ġs urpr",
"Ġb oth",
"Ġfe el",
"Ġd ad",
"it e",
"Ġ ke",
"Ġon e",
"d en",
"Ġn ice",
"Ġexcit ed",
"Ġth is",
"Ġfa st",
"Ġm o",
"Ġa m",
"Ġl ong",
"Ġr un",
"in k",
"Ġs k",
"Ġg ra",
"Ġto ld",
"Ġro ck",
"Ġin side",
"u ll",
"Ġpret ty",
"in y",
"b b",
"Ġp ick",
"Ġt r",
"Ġt ake",
"Ġfl ower",
"Ġe ach",
"Ġg ave",
"Ġm uch",
"Ġs l",
"he re",
"Ġne ed",
"Ġh ow",
"Ġto w",
"Ġst r",
"v en",
"et ter",
"Ġ or",
"p l",
"Ġsurpr is",
"ĠA s",
"Ġu nder",
"m ore",
"Ġo ld",
"ĠB ut",
"g e",
"h is",
"ist en",
"Ġl isten",
"Ġt ry",
"ur t",
"d y",
"a nd",
"Ġ K",
"Ġc le",
"Ġf ish",
"p ect",
"ĠS ue",
"a se",
"Ġcl o",
"Ġbe ar",
"Ġk ind",
"Ġha nd",
"ur n",
"Ġf le",
"ĠW e",
"g ed",
"Ġt e",
"Ġne ar",
"ĠM ax",
"l f",
"in e",
"Ġj ust",
"Ġf ood",
"Ġf i",
"Ġwa t",
"Ġh ig",
"Ġt w",
"Ġ ide",
"pect ed",
"ex pected",
"ĠI n",
"b y",
"Ġco l",
"Ġcol or",
"Ġsk y",
"Ġ en",
"es s",
"Ġf o",
"at e",
"v ing",
"Ġu s",
"Ġide a",
"Ġb etter",
"Ġhe ard",
"Ġb ug",
"g ry",
"Ġit s",
"f f",
"Ġl et",
"Ġd an",
"ĠB en",
"i on",
"a c",
"re am",
"ec i",
"Ġcare ful",
"Ġsh are",
"Ġ if",
"Ġg r",
"Ġlo ve",
"Ġf ly",
"Ġst or",
"Ġc om",
"Ġfle w",
"ĠS am",
"h y",
"b e",
"b er",
"eci al",
"Ġsp ecial",
"or t",
"Ġne ver",
"Ġb y",
"Ġw ind",
"Ġb u",
"r m",
"Ġd on",
"Ġcl im",
"Ġclim b",
"Ġt al",
"Ġcle an",
"Ġ N",
"Ġ P",
"Ġ end",
"Ġe ven",
"op le",
"Ġm ag",
"Ġli ked",
"Ġh ard",
"Ġo ver",
"Ġsh iny",
"Ġb ook",
"Ġc ake",
"Ġwa it",
"an e",
"Ġj o",
"Ġc he",
"Ġh urt",
"Ġf r",
"o pped",
"Ġt urn",
"Ġpr oud",
"ad y",
"Ġf am",
"Ġb ad",
"Ġg l",
"Ġa fter",
"Ġsa fe",
"Ġc u",
"Ġg ive",
"Ġpe ople",
"Ġl oud",
"i z",
"k ay",
"Ġhig h",
"Ġ im",
"o ck",
"ard en",
"Ġg arden",
"Ġc ome",
"Ġdo or",
"Ġy um",
"Ġg round",
"Ġopen ed",
"Ġpick ed",
"Ġst ay",
"ĠM om",
"Ġf ore",
"u ff",
"Ġbe a",
"il d",
"Ġr a",
"Ġbl ue",
"d d",
"Ġwa y",
"Ġ qu",
"' m",
"Ġst ill",
"Ġe ver",
"i p",
"Ġhug ged",
"ag e",
"Ġc all",
"Ġof f",
"Ġf ar",
"Ġp ic",
"Ġpl ace",
"oug h",
"Ġmag ic",
"dd ed",
"le ase",
"Ġsh ould",
"Ġsmil ed",
"ro g",
"t ure",
"oo l",
"Ġwal k",
"Ġfam ily",
"Ġk id",
"ar y",
"Ġpic ture",
"Ġw o",
"e m",
"Ġm a",
"Ġa pp",
"ill y",
"Ġn ow",
"ud den",
"Ġgre at",
"Ġp a",
"se lf",
"Ġc a",
"Ġstr ong",
"Ġf rog",
"Ġb ra",
"Ġ R",
"Ġfore st",
"ĠS pot",
"N o",
"Ġu nt",
"Ġb ro",
"Ġst ick",
"Ġs qu",
"Ġunt il",
"c t",
"Ġbea ut",
"n ing",
"Ġt ra",
"Ġn ext",
"Ġbo at",
"a k",
"p t",
"Ġha t",
"Ġr ain",
"Ġc ry",
"Ġkid s",
"Ġd ra",
"Ġbeaut i",
"Ġbeauti ful",
"m a",
"Ġclo s",
"Ġstor y",
"re l",
"Ġa d",
"Ġwh ile",
"re ss",
"Ġtow n",
"Ġex pl",
"Ġs of",
"g er",
"ĠA t",
"Ġbe ing",
"re e",
"Ġim p",
"ĠM ia",
"Ġdo ll",
"v ent",
"Ġm or",
"Ġcall ed",
"ell o",
"Ġ G",
"Ġm et",
"Ġtr uck",
"Ġg ame",
"Ġp art",
"o on",
"is s",
"Ġsof t",
"Ġan gry",
"Ġke ep",
"e ar",
"un ny",
"Ġb ed",
"Ġwa rm",
"Ġlo st",
"Ġre m",
"Ġbra ve",
"Ġm ouse",
"Ġat e",
"Ġs n",
"Ġho le",
"I t",
"f ore",
"ĠY ou",
"s o",
"Ġwat ch",
"Ġsw ing",
"Ġle ave",
"Ġc ook",
"Ġal so",
"Ġf ell",
"o y",
"Ġgre en",
"g an",
"er s",
"Ġfa ce",
"Ġtw o",
"bb it",
"uff y",
"ow l",
"Ġth ink",
"Ġf in",
"Ġ âĢ",
"us h",
"Ġno ise",
"Ġw here",
"a z",
"d ay",
"Ġd e",
"ob o",
"Ġra bbit",
"ĠF l",
"ir rel",
"Ġso on",
"ir st",
"o h",
"oh n",
"Ġapp le",
"a ble",
"Ġsl ide",
"Ġs ound",
"f t",
"Ġsqu irrel",
"Ġas k",
"Ġbe fore",
"c hed",
"Ġcl a",
"Ġy ell",
"Ġsa t",
"j oy",
"Ġen joy",
"ĠFl uffy",
"Ġbl ock",
"Ġu se",
"ug ht",
"ir ed",
"Ġke pt",
"u it",
"H i",
"ĠâĢ ľ",
"âĢ Ŀ",
"le ep",
"i ous",
"Ġc ra",
"Ġp ain",
"Ġst ore",
"Ġhand s",
"Ġbird s",
"he s",
"a ir",
"Ġgo ing",
"Ġsh out",
"Ġre al",
"Ġsay s",
"Ġha ving",
"Ġfun ny",
"Ġh op",
"Ġe y",
"ĠA nd",
"Ġcat ch",
"Ġb re",
"Ġw is"
]
}
}