gpt2_m080_tiny-stories_1024 / tokenizer.json
jonasknobloch's picture
Upload folder using huggingface_hub
0dbd291 verified
{
"version": "1.0",
"truncation": null,
"padding": null,
"added_tokens": [
{
"id": 1024,
"content": "<|endoftext|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": true,
"special": true
}
],
"normalizer": null,
"pre_tokenizer": {
"type": "ByteLevel",
"add_prefix_space": false,
"trim_offsets": true,
"use_regex": true
},
"post_processor": {
"type": "ByteLevel",
"add_prefix_space": true,
"trim_offsets": false,
"use_regex": true
},
"decoder": {
"type": "ByteLevel",
"add_prefix_space": true,
"trim_offsets": true,
"use_regex": true
},
"model": {
"type": "BPE",
"dropout": null,
"unk_token": null,
"continuing_subword_prefix": null,
"end_of_word_suffix": null,
"fuse_unk": false,
"byte_fallback": false,
"ignore_merges": false,
"vocab": {
"!": 0,
"\"": 1,
"#": 2,
"$": 3,
"%": 4,
"&": 5,
"'": 6,
"(": 7,
")": 8,
"*": 9,
"+": 10,
",": 11,
"-": 12,
".": 13,
"/": 14,
"0": 15,
"1": 16,
"2": 17,
"3": 18,
"4": 19,
"5": 20,
"6": 21,
"7": 22,
"8": 23,
"9": 24,
":": 25,
";": 26,
"<": 27,
"=": 28,
">": 29,
"?": 30,
"@": 31,
"A": 32,
"B": 33,
"C": 34,
"D": 35,
"E": 36,
"F": 37,
"G": 38,
"H": 39,
"I": 40,
"J": 41,
"K": 42,
"L": 43,
"M": 44,
"N": 45,
"O": 46,
"P": 47,
"Q": 48,
"R": 49,
"S": 50,
"T": 51,
"U": 52,
"V": 53,
"W": 54,
"X": 55,
"Y": 56,
"Z": 57,
"[": 58,
"\\": 59,
"]": 60,
"_": 61,
"`": 62,
"a": 63,
"b": 64,
"c": 65,
"d": 66,
"e": 67,
"f": 68,
"g": 69,
"h": 70,
"i": 71,
"j": 72,
"k": 73,
"l": 74,
"m": 75,
"n": 76,
"o": 77,
"p": 78,
"q": 79,
"r": 80,
"s": 81,
"t": 82,
"u": 83,
"v": 84,
"w": 85,
"x": 86,
"y": 87,
"z": 88,
"{": 89,
"|": 90,
"}": 91,
"~": 92,
"¡": 93,
"¢": 94,
"£": 95,
"¤": 96,
"¥": 97,
"¦": 98,
"§": 99,
"¨": 100,
"©": 101,
"ª": 102,
"«": 103,
"¬": 104,
"®": 105,
"¯": 106,
"°": 107,
"±": 108,
"³": 109,
"´": 110,
"µ": 111,
"¶": 112,
"·": 113,
"¸": 114,
"¹": 115,
"º": 116,
"»": 117,
"¼": 118,
"½": 119,
"¾": 120,
"¿": 121,
"Â": 122,
"Ã": 123,
"Ä": 124,
"Å": 125,
"É": 126,
"Ê": 127,
"Ñ": 128,
"Ò": 129,
"á": 130,
"â": 131,
"ã": 132,
"ä": 133,
"å": 134,
"æ": 135,
"ç": 136,
"è": 137,
"é": 138,
"î": 139,
"ï": 140,
"ð": 141,
"ĉ": 142,
"Ċ": 143,
"Ġ": 144,
"Ģ": 145,
"ģ": 146,
"Ĥ": 147,
"ĥ": 148,
"Ħ": 149,
"ħ": 150,
"Ĩ": 151,
"ĩ": 152,
"Ī": 153,
"ī": 154,
"Ĭ": 155,
"ĭ": 156,
"Į": 157,
"į": 158,
"İ": 159,
"ı": 160,
"IJ": 161,
"ij": 162,
"Ĵ": 163,
"ĵ": 164,
"Ķ": 165,
"ķ": 166,
"ĸ": 167,
"ĺ": 168,
"Ļ": 169,
"ļ": 170,
"Ľ": 171,
"ľ": 172,
"Ŀ": 173,
"ŀ": 174,
"Ł": 175,
"ł": 176,
"Ń": 177,
"he": 178,
"Ġt": 179,
"Ġa": 180,
"Ġs": 181,
"nd": 182,
"Ġw": 183,
"Ġthe": 184,
"ed": 185,
"ĠT": 186,
"Ġb": 187,
"Ġto": 188,
"Ġand": 189,
"Ġh": 190,
"Ġf": 191,
"in": 192,
"Ġwa": 193,
"re": 194,
"ou": 195,
"it": 196,
"Ġl": 197,
"Ġd": 198,
"Ġc": 199,
"Ġp": 200,
"ay": 201,
"er": 202,
"om": 203,
"Ġm": 204,
"Ġwas": 205,
"im": 206,
"ĠS": 207,
"Ġhe": 208,
"is": 209,
"on": 210,
"ar": 211,
"Ġn": 212,
"Ġsa": 213,
"id": 214,
"ll": 215,
"Ġha": 216,
"hey": 217,
"at": 218,
"Ġg": 219,
"ing": 220,
"en": 221,
"ot": 222,
"an": 223,
"le": 224,
"end": 225,
"or": 226,
"of": 227,
"am": 228,
"Ġ\"": 229,
"ĠH": 230,
"ir": 231,
"et": 232,
"il": 233,
"Ġth": 234,
"Ġit": 235,
"ĠO": 236,
"ig": 237,
"ĠHe": 238,
"Ġin": 239,
"Ġpl": 240,
"ow": 241,
"ut": 242,
"ver": 243,
"ri": 244,
"Ġbe": 245,
"ex": 246,
"Ġu": 247,
"ce": 248,
"Ġplay": 249,
"pp": 250,
"Ġsaid": 251,
"ith": 252,
"Ġwith": 253,
"Ġday": 254,
"Ġy": 255,
"oo": 256,
"ne": 257,
"ĠL": 258,
"Ġr": 259,
"ĠB": 260,
"ext": 261,
"text": 262,
"ck": 263,
"ĠI": 264,
"Ġher": 265,
"ld": 266,
"Ġhis": 267,
"ke": 268,
"ĠM": 269,
"very": 270,
"Ġst": 271,
"nt": 272,
"Ġbig": 273,
"st": 274,
"ily": 275,
"Ġyou": 276,
"ve": 277,
"Ġhapp": 278,
"un": 279,
"Ġon": 280,
"Ġli": 281,
"all": 282,
"riend": 283,
"Ġfriend": 284,
"Ġthey": 285,
"Ġwe": 286,
"Ġhad": 287,
"her": 288,
"Ġnot": 289,
"Ġwant": 290,
"Ġup": 291,
"se": 292,
"ĠA": 293,
"ad": 294,
"Ġof": 295,
"Ġ<": 296,
"|>": 297,
"Ġ<|": 298,
"Ġe": 299,
"Ġdo": 300,
"itt": 301,
"ent": 302,
"Ġhappy": 303,
"Ġvery": 304,
"ould": 305,
"Ġthat": 306,
"ook": 307,
"Ġsaw": 308,
"nce": 309,
"Ġmom": 310,
"'s": 311,
"Ġfor": 312,
"Ġsh": 313,
"ittle": 314,
"ime": 315,
"Ġlittle": 316,
"Ġk": 317,
"Ġshe": 318,
"ch": 319,
"Ġtime": 320,
"Ġnam": 321,
".\"": 322,
"ound": 323,
"Ġso": 324,
"ue": 325,
"Ġnamed": 326,
"Ġthere": 327,
"Ġbo": 328,
"Ġwere": 329,
"Ġne": 330,
"out": 331,
"Ġbut": 332,
"Ġwanted": 333,
"es": 334,
"ug": 335,
"Ġan": 336,
"Ġfriends": 337,
"!\"": 338,
"al": 339,
"ird": 340,
"ht": 341,
"ake": 342,
"hen": 343,
"Ġbird": 344,
"Ġhel": 345,
"Ġhelp": 346,
"ome": 347,
"ry": 348,
"el": 349,
"ĠIt": 350,
"Ġtoo": 351,
"ĠĊ": 352,
"ide": 353,
"Ġwent": 354,
"Ġwh": 355,
"ved": 356,
"ter": 357,
"Ġis": 358,
"Ġall": 359,
"Ġlook": 360,
"Ġlo": 361,
"oftext": 362,
"ame": 363,
"Ġupon": 364,
"ill": 365,
"Ġdid": 366,
"ra": 367,
"ore": 368,
"ly": 369,
"ind": 370,
"Ġre": 371,
"Ġfun": 372,
"Ġj": 373,
"Ġtoy": 374,
"Ġas": 375,
"ur": 376,
"get": 377,
"Ġat": 378,
"ack": 379,
"Ġse": 380,
"gether": 381,
"Ġo": 382,
"ax": 383,
"Ġtre": 384,
"Ġtogether": 385,
"ked": 386,
"Ġcat": 387,
"Ġsm": 388,
"ood": 389,
"Ġcould": 390,
"my": 391,
"ec": 392,
"Ġdog": 393,
"art": 394,
"Ġcan": 395,
"ĠW": 396,
"Ġtheir": 397,
"ark": 398,
"um": 399,
"ard": 400,
"Ġro": 401,
"Ġhim": 402,
"irl": 403,
"Ġball": 404,
"Ġplayed": 405,
"ĠThe": 406,
"?\"": 407,
"Ġgirl": 408,
"rom": 409,
"way": 410,
"Ġgo": 411,
"Ġle": 412,
"Ġare": 413,
"ain": 414,
"Ġout": 415,
"Ġthem": 416,
"'t": 417,
"ul": 418,
"ĠThey": 419,
"Ġsad": 420,
"other": 421,
"one": 422,
"Ġcl": 423,
"pot": 424,
"Ġboy": 425,
"Ġtree": 426,
"Ġla": 427,
"ĠJ": 428,
"Ġhave": 429,
"Ġman": 430,
"oug": 431,
"Ġloved": 432,
"Ġlooked": 433,
"ic": 434,
"Ġfound": 435,
"Ġback": 436,
"Ġlike": 437,
"Ġsp": 438,
"ful": 439,
"ia": 440,
"Ġsay": 441,
"own": 442,
"are": 443,
"ell": 444,
"ro": 445,
"side": 446,
"Ġme": 447,
"ĠF": 448,
"hing": 449,
"ight": 450,
"Ġsc": 451,
"ong": 452,
"Ġpark": 453,
"ick": 454,
"Ġmake": 455,
"Ġstart": 456,
"Ġwould": 457,
"Ġlaug": 458,
"elt": 459,
"ĠTim": 460,
"Ġno": 461,
"Ġcar": 462,
"ob": 463,
"round": 464,
"Ġfa": 465,
"Ġother": 466,
"Ġfelt": 467,
"Ġsee": 468,
"op": 469,
"ss": 470,
"ag": 471,
"Ġasked": 472,
"ice": 473,
"Ġnew": 474,
"ouse": 475,
"Ġstarted": 476,
"Ġcame": 477,
"omet": 478,
"Ġwal": 479,
"Ġal": 480,
"Ġsomet": 481,
"Ġag": 482,
"ĠShe": 483,
"ĠY": 484,
"Ġgood": 485,
"Ġsmall": 486,
"ared": 487,
"ade": 488,
"ought": 489,
"ud": 490,
"Ġevery": 491,
"Ġco": 492,
"Ġex": 493,
"Ġthing": 494,
"ile": 495,
"Ġfind": 496,
"Ġwor": 497,
"hat": 498,
"Ġput": 499,
"Ġaway": 500,
"Ġthought": 501,
"Ġwhat": 502,
"Ġsomething": 503,
"Ġfrom": 504,
"Ġmade": 505,
"Ġhome": 506,
"us": 507,
"Ġplaying": 508,
"ie": 509,
"ny": 510,
"Ġtri": 511,
"hed": 512,
"Ġfl": 513,
"ach": 514,
"uc": 515,
"arn": 516,
"ank": 517,
"Ġran": 518,
"Ġsome": 519,
"ave": 520,
"ust": 521,
"Ġlot": 522,
"now": 523,
"ble": 524,
"ure": 525,
"came": 526,
"Ġagain": 527,
"Ġhouse": 528,
"Ġdown": 529,
"Ġtook": 530,
"Ġbl": 531,
"Ġscared": 532,
"ump": 533,
"ep": 534,
"Ġlearn": 535,
"uck": 536,
"Ġtoys": 537,
"ret": 538,
"Ġdec": 539,
"Ġdecid": 540,
"new": 541,
"Ġwill": 542,
"Ġbox": 543,
"if": 544,
"ĠD": 545,
"Ġyour": 546,
"Ġmy": 547,
"Ġfe": 548,
"ist": 549,
"oud": 550,
"Ġaround": 551,
"Ġthings": 552,
"ish": 553,
"Ġbr": 554,
"ca": 555,
"Ġsun": 556,
"Ġch": 557,
"Ġlived": 558,
"as": 559,
"Ġthen": 560,
",\"": 561,
"Ġwhen": 562,
"use": 563,
"cause": 564,
"ally": 565,
"ty": 566,
"Ġget": 567,
"Ġany": 568,
"fter": 569,
"endoftext": 570,
"ucy": 571,
"ĠE": 572,
"ĠLucy": 573,
"oth": 574,
"Ġknow": 575,
"Ġshow": 576,
"Ġjump": 577,
"nder": 578,
"uch": 579,
"Ġtried": 580,
"Ġsw": 581,
"Ġgot": 582,
"nn": 583,
"ap": 584,
"Ġwho": 585,
"Ġhappen": 586,
"nna": 587,
"ĠTom": 588,
"Ġab": 589,
"Ġmany": 590,
"Ġint": 591,
"Ġpret": 592,
"ive": 593,
"pped": 594,
"Ġabout": 595,
"ace": 596,
"ĠSo": 597,
"Ġun": 598,
"urp": 599,
"qu": 600,
"ĠLily": 601,
"ous": 602,
"Ġred": 603,
"ĠOne": 604,
"Ġsmil": 605,
"Ġhug": 606,
"Ġv": 607,
"ise": 608,
"Ġmore": 609,
"Ġpo": 610,
"Ġcare": 611,
"hank": 612,
"ara": 613,
"Ġsor": 614,
"ect": 615,
"king": 616,
"Ġwater": 617,
"pen": 618,
"Ġlearned": 619,
"ant": 620,
"Ġbest": 621,
"cit": 622,
"Ġexcit": 623,
"ower": 624,
"Ġgre": 625,
"Ġta": 626,
"ĠC": 627,
"Ġthan": 628,
"ways": 629,
"âĢ": 630,
"Ġoutside": 631,
"Ġpr": 632,
"Ġalways": 633,
"imal": 634,
"Ġanimal": 635,
"Ġpe": 636,
"urpr": 637,
"Ġsurpr": 638,
"fe": 639,
"Ġho": 640,
"Ġroom": 641,
"Ġeat": 642,
"our": 643,
"Ġinto": 644,
"Ġopen": 645,
"den": 646,
"Ġboth": 647,
"Ġfeel": 648,
"ite": 649,
"Ġdad": 650,
"Ġke": 651,
"Ġone": 652,
"Ġnice": 653,
"Ġexcited": 654,
"Ġmo": 655,
"Ġthis": 656,
"Ġam": 657,
"Ġfast": 658,
"Ġlong": 659,
"Ġrun": 660,
"Ġgra": 661,
"ink": 662,
"Ġsk": 663,
"Ġrock": 664,
"Ġtold": 665,
"Ġinside": 666,
"ull": 667,
"Ġpretty": 668,
"bb": 669,
"iny": 670,
"Ġpick": 671,
"Ġflower": 672,
"Ġtr": 673,
"Ġtake": 674,
"here": 675,
"Ġeach": 676,
"Ġgave": 677,
"Ġmuch": 678,
"Ġsurpris": 679,
"Ġsl": 680,
"Ġneed": 681,
"Ġtow": 682,
"Ġhow": 683,
"pl": 684,
"Ġstr": 685,
"ven": 686,
"more": 687,
"etter": 688,
"Ġor": 689,
"his": 690,
"ĠAs": 691,
"Ġunder": 692,
"Ġold": 693,
"isten": 694,
"Ġlisten": 695,
"Ġtry": 696,
"dy": 697,
"ge": 698,
"ĠOnce": 699,
"ĠK": 700,
"urt": 701,
"pect": 702,
"and": 703,
"Ġcle": 704,
"Ġfish": 705,
"ase": 706,
"Ġclo": 707,
"Ġkind": 708,
"Ġbear": 709,
"urn": 710,
"Ġhand": 711,
"Ġfle": 712,
"ĠWe": 713,
"Ġte": 714,
"lf": 715,
"pected": 716,
"expected": 717,
"Ġnear": 718,
"Ġcol": 719,
"Ġcolor": 720,
"ine": 721,
"Ġjust": 722,
"Ġfood": 723,
"Ġfi": 724,
"by": 725,
"Ġtw": 726,
"Ġwat": 727,
"ged": 728,
"Ġhig": 729,
"Ġide": 730,
"Ġen": 731,
"Ġfo": 732,
"ess": 733,
"ĠIn": 734,
"Ġsky": 735,
"ate": 736,
"ving": 737,
"Ġus": 738,
"Ġidea": 739,
"Ġbetter": 740,
"Ġheard": 741,
"Ġbug": 742,
"gry": 743,
"ff": 744,
"Ġits": 745,
"Ġdan": 746,
"ac": 747,
"Ġlet": 748,
"ion": 749,
"ream": 750,
"be": 751,
"Ġgr": 752,
"eci": 753,
"Ġcareful": 754,
"Ġshare": 755,
"Ġlove": 756,
"hy": 757,
"Ġif": 758,
"Ġcom": 759,
"Ġfly": 760,
"Ġstor": 761,
"Ġflew": 762,
"ber": 763,
"ecial": 764,
"Ġspecial": 765,
"ort": 766,
"Ġnever": 767,
"Ġby": 768,
"Ġwind": 769,
"Ġclim": 770,
"Ġclimb": 771,
"Ġbu": 772,
"ĠN": 773,
"rm": 774,
"ĠP": 775,
"Ġdon": 776,
"Ġtal": 777,
"Ġclean": 778,
"Ġend": 779,
"Ġeven": 780,
"ople": 781,
"opped": 782,
"ane": 783,
"Ġwait": 784,
"Ġmag": 785,
"Ġhard": 786,
"Ġjo": 787,
"Ġover": 788,
"Ġshiny": 789,
"Ġbook": 790,
"Ġche": 791,
"Ġfr": 792,
"Ġcake": 793,
"Ġhurt": 794,
"Ġyum": 795,
"Ġturn": 796,
"Ġproud": 797,
"ady": 798,
"Ġgl": 799,
"kay": 800,
"Ġfam": 801,
"Ġcu": 802,
"Ġbad": 803,
"Ġafter": 804,
"ock": 805,
"iz": 806,
"Ġgive": 807,
"Ġsafe": 808,
"Ġloud": 809,
"Ġpeople": 810,
"Ġstay": 811,
"Ġim": 812,
"Ġhigh": 813,
"Ġgard": 814,
"Ġgarden": 815,
"Ġdoor": 816,
"Ġcome": 817,
"Ġground": 818,
"Ġopened": 819,
"Ġpicked": 820,
"dd": 821,
"uff": 822,
"Ġbea": 823,
"ild": 824,
"Ġfore": 825,
"Ġra": 826,
"Ġqu": 827,
"Ġblue": 828,
"Ġway": 829,
"'m": 830,
"dded": 831,
"Ġstill": 832,
"Ġever": 833,
"ip": 834,
"Ġhugged": 835,
"age": 836,
"Ġcall": 837,
"lease": 838,
"Ġpic": 839,
"Ġplace": 840,
"Ġoff": 841,
"Ġfar": 842,
"ough": 843,
"Ġmagic": 844,
"ĠBut": 845,
"Ġshould": 846,
"ture": 847,
"rog": 848,
"ary": 849,
"Ġwo": 850,
"illy": 851,
"Ġpicture": 852,
"Ġwalk": 853,
"ool": 854,
"Ġfamily": 855,
"self": 856,
"Ġkid": 857,
"Ġma": 858,
"Ġapp": 859,
"em": 860,
"Ġnow": 861,
"Ġpa": 862,
"ĠSue": 863,
"Ġgreat": 864,
"Ġca": 865,
"ĠR": 866,
"Ġstrong": 867,
"Ġfrog": 868,
"Ġbra": 869,
"Ġforest": 870,
"No": 871,
"udden": 872,
"Ġunt": 873,
"Ġbro": 874,
"Ġstick": 875,
"Ġsqu": 876,
"ct": 877,
"Ġuntil": 878,
"ĠMax": 879,
"Ġbeaut": 880,
"Ġtra": 881,
"ning": 882,
"ma": 883,
"Ġnext": 884,
"Ġboat": 885,
"ak": 886,
"Ġcry": 887,
"pt": 888,
"Ġhat": 889,
"Ġrain": 890,
"Ġkids": 891,
"Ġdra": 892,
"iful": 893,
"Ġexpl": 894,
"Ġbeautiful": 895,
"ĠMom": 896,
"Ġad": 897,
"Ġclos": 898,
"rel": 899,
"Ġstory": 900,
"ĠBen": 901,
"Ġwhile": 902,
"ello": 903,
"ress": 904,
"Ġtown": 905,
"Ġsof": 906,
"ger": 907,
"ĠAt": 908,
"ree": 909,
"Ġbeing": 910,
"Ġdoll": 911,
"ĠG": 912,
"vent": 913,
"Ġimp": 914,
"Ġcri": 915,
"Ġmor": 916,
"ĠSam": 917,
"Ġcalled": 918,
"Ġmet": 919,
"oon": 920,
"Ġtruck": 921,
"iss": 922,
"Ġgame": 923,
"Ġpart": 924,
"Ġcook": 925,
"Ġsoft": 926,
"Ġangry": 927,
"Ġkeep": 928,
"ear": 929,
"Ġwarm": 930,
"Ġbed": 931,
"Ġlost": 932,
"Ġrem": 933,
"Ġbrave": 934,
"unny": 935,
"Ġmouse": 936,
"Ġswing": 937,
"Ġate": 938,
"Ġsn": 939,
"Ġhole": 940,
"oy": 941,
"It": 942,
"fore": 943,
"so": 944,
"Ġwatch": 945,
"Ġliked": 946,
"Ġleave": 947,
"obo": 948,
"Ġalso": 949,
"Ġfell": 950,
"Ġthink": 951,
"Ġfin": 952,
"Ġgreen": 953,
"gan": 954,
"az": 955,
"Ġface": 956,
"owl": 957,
"Ġtwo": 958,
"bbit": 959,
"day": 960,
"ĠâĢ": 961,
"uffy": 962,
"ush": 963,
"Ġnoise": 964,
"Ġwhere": 965,
"oh": 966,
"ohn": 967,
"Ġde": 968,
"Ġapple": 969,
"Ġsound": 970,
"Ġcla": 971,
"Ġrabbit": 972,
"able": 973,
"Ġblock": 974,
"Ġask": 975,
"irrel": 976,
"Ġsoon": 977,
"ĠFl": 978,
"ers": 979,
"joy": 980,
"Ġenjoy": 981,
"Ġslide": 982,
"ft": 983,
"irst": 984,
"Ġsquirrel": 985,
"Ġyell": 986,
"Ġbefore": 987,
"ught": 988,
"Ġsat": 989,
"ĠFluffy": 990,
"uit": 991,
"ious": 992,
"Ġuse": 993,
"Ġkept": 994,
"ired": 995,
"Ġshout": 996,
"ĠâĢľ": 997,
"Hi": 998,
"âĢĿ": 999,
"leep": 1000,
"Ġcra": 1001,
"Ġpain": 1002,
"ched": 1003,
"Ġstore": 1004,
"Ġreal": 1005,
"Ġwis": 1006,
"Ġhands": 1007,
"air": 1008,
"Ġbirds": 1009,
"Ġhop": 1010,
"Ġgoing": 1011,
"Ġhaving": 1012,
"Ġfunny": 1013,
"Ġey": 1014,
"Ġbre": 1015,
"Ġcatch": 1016,
"Ġmess": 1017,
"Ġpull": 1018,
"Ġcon": 1019,
"Ġsmiled": 1020,
"Ġfix": 1021,
"Ġthr": 1022,
"ember": 1023
},
"merges": [
"h e",
"Ġ t",
"Ġ a",
"Ġ s",
"n d",
"Ġ w",
"Ġt he",
"e d",
"Ġ T",
"Ġ b",
"Ġt o",
"Ġa nd",
"Ġ h",
"Ġ f",
"i n",
"Ġw a",
"r e",
"o u",
"i t",
"Ġ l",
"Ġ d",
"Ġ c",
"Ġ p",
"a y",
"e r",
"o m",
"Ġ m",
"Ġwa s",
"i m",
"Ġ S",
"Ġ he",
"i s",
"o n",
"a r",
"Ġ n",
"Ġs a",
"i d",
"l l",
"Ġh a",
"he y",
"a t",
"Ġ g",
"in g",
"e n",
"o t",
"a n",
"l e",
"e nd",
"o r",
"o f",
"a m",
"Ġ \"",
"Ġ H",
"i r",
"e t",
"i l",
"Ġt h",
"Ġ it",
"Ġ O",
"i g",
"ĠH e",
"Ġ in",
"Ġp l",
"o w",
"u t",
"v er",
"r i",
"Ġb e",
"e x",
"Ġ u",
"c e",
"Ġpl ay",
"p p",
"Ġsa id",
"it h",
"Ġw ith",
"Ġd ay",
"Ġ y",
"o o",
"n e",
"Ġ L",
"Ġ r",
"Ġ B",
"ex t",
"t ext",
"c k",
"Ġ I",
"Ġhe r",
"l d",
"Ġh is",
"k e",
"Ġ M",
"ver y",
"Ġs t",
"n t",
"Ġb ig",
"s t",
"il y",
"Ġy ou",
"v e",
"Ġha pp",
"u n",
"Ġ on",
"Ġl i",
"a ll",
"ri end",
"Ġf riend",
"Ġthe y",
"Ġw e",
"Ġha d",
"he r",
"Ġn ot",
"Ġwa nt",
"Ġu p",
"s e",
"Ġ A",
"a d",
"Ġ of",
"Ġ <",
"| >",
"Ġ< |",
"Ġ e",
"Ġd o",
"it t",
"en t",
"Ġhapp y",
"Ġ very",
"ou ld",
"Ġth at",
"oo k",
"Ġsa w",
"n ce",
"Ġm om",
"' s",
"Ġf or",
"Ġs h",
"itt le",
"im e",
"Ġl ittle",
"Ġ k",
"Ġs he",
"c h",
"Ġt ime",
"Ġn am",
". \"",
"ou nd",
"Ġs o",
"u e",
"Ġnam ed",
"Ġthe re",
"Ġb o",
"Ġwe re",
"Ġn e",
"ou t",
"Ġb ut",
"Ġwant ed",
"e s",
"u g",
"Ġa n",
"Ġfriend s",
"! \"",
"a l",
"ir d",
"h t",
"a ke",
"he n",
"Ġb ird",
"Ġhe l",
"Ġhel p",
"om e",
"r y",
"e l",
"ĠI t",
"Ġto o",
"Ġ Ċ",
"id e",
"Ġw ent",
"Ġw h",
"v ed",
"t er",
"Ġ is",
"Ġa ll",
"Ġl ook",
"Ġl o",
"of text",
"am e",
"Ġup on",
"i ll",
"Ġd id",
"r a",
"o re",
"l y",
"i nd",
"Ġ re",
"Ġf un",
"Ġ j",
"Ġto y",
"Ġa s",
"u r",
"g et",
"Ġa t",
"a ck",
"Ġs e",
"get her",
"Ġ o",
"a x",
"Ġt re",
"Ġto gether",
"k ed",
"Ġc at",
"Ġs m",
"oo d",
"Ġc ould",
"m y",
"e c",
"Ġdo g",
"ar t",
"Ġc an",
"Ġ W",
"Ġthe ir",
"ar k",
"u m",
"ar d",
"Ġr o",
"Ġh im",
"ir l",
"Ġb all",
"Ġplay ed",
"ĠT he",
"? \"",
"Ġg irl",
"r om",
"w ay",
"Ġg o",
"Ġl e",
"Ġa re",
"a in",
"Ġ out",
"Ġthe m",
"' t",
"u l",
"ĠT hey",
"Ġsa d",
"ot her",
"on e",
"Ġc l",
"p ot",
"Ġbo y",
"Ġtre e",
"Ġl a",
"Ġ J",
"Ġha ve",
"Ġm an",
"ou g",
"Ġlo ved",
"Ġlook ed",
"i c",
"Ġf ound",
"Ġb ack",
"Ġli ke",
"Ġs p",
"f ul",
"i a",
"Ġs ay",
"ow n",
"a re",
"e ll",
"r o",
"s ide",
"Ġm e",
"Ġ F",
"h ing",
"ig ht",
"Ġs c",
"on g",
"Ġp ark",
"i ck",
"Ġm ake",
"Ġst art",
"Ġw ould",
"Ġla ug",
"el t",
"ĠT im",
"Ġn o",
"Ġc ar",
"o b",
"r ound",
"Ġf a",
"Ġ other",
"Ġf elt",
"Ġse e",
"o p",
"s s",
"a g",
"Ġas ked",
"i ce",
"Ġne w",
"ou se",
"Ġstart ed",
"Ġc ame",
"om et",
"Ġwa l",
"Ġa l",
"Ġs omet",
"Ġa g",
"ĠS he",
"Ġ Y",
"Ġg ood",
"Ġsm all",
"ar ed",
"ad e",
"oug ht",
"u d",
"Ġe very",
"Ġc o",
"Ġ ex",
"Ġth ing",
"i le",
"Ġf ind",
"Ġw or",
"h at",
"Ġp ut",
"Ġa way",
"Ġth ought",
"Ġwh at",
"Ġsomet hing",
"Ġf rom",
"Ġm ade",
"Ġh ome",
"u s",
"Ġplay ing",
"i e",
"n y",
"Ġt ri",
"he d",
"Ġf l",
"a ch",
"u c",
"ar n",
"an k",
"Ġr an",
"Ġs ome",
"a ve",
"u st",
"Ġl ot",
"n ow",
"b le",
"u re",
"c ame",
"Ġag ain",
"Ġh ouse",
"Ġd own",
"Ġtoo k",
"Ġb l",
"Ġsc ared",
"um p",
"e p",
"Ġle arn",
"u ck",
"Ġtoy s",
"re t",
"Ġd ec",
"Ġdec id",
"ne w",
"Ġw ill",
"Ġbo x",
"i f",
"Ġ D",
"Ġyou r",
"Ġm y",
"Ġf e",
"is t",
"ou d",
"Ġa round",
"Ġthing s",
"is h",
"Ġb r",
"c a",
"Ġs un",
"Ġc h",
"Ġli ved",
"a s",
"Ġthe n",
", \"",
"Ġw hen",
"u se",
"ca use",
"all y",
"t y",
"Ġg et",
"Ġan y",
"f ter",
"end oftext",
"uc y",
"Ġ E",
"ĠL ucy",
"ot h",
"Ġk now",
"Ġsh ow",
"Ġj ump",
"nd er",
"u ch",
"Ġtri ed",
"Ġs w",
"Ġg ot",
"n n",
"a p",
"Ġwh o",
"Ġhapp en",
"nn a",
"ĠT om",
"Ġa b",
"Ġman y",
"Ġin t",
"Ġp ret",
"i ve",
"pp ed",
"Ġab out",
"a ce",
"ĠS o",
"Ġu n",
"ur p",
"q u",
"ĠL ily",
"ou s",
"Ġr ed",
"ĠO ne",
"Ġsm il",
"Ġh ug",
"Ġ v",
"is e",
"Ġm ore",
"Ġp o",
"Ġc are",
"h ank",
"ar a",
"Ġs or",
"ec t",
"k ing",
"Ġwa ter",
"p en",
"Ġlearn ed",
"an t",
"Ġbe st",
"c it",
"Ġex cit",
"ow er",
"Ġg re",
"Ġt a",
"Ġ C",
"Ġth an",
"way s",
"â Ģ",
"Ġout side",
"Ġp r",
"Ġal ways",
"im al",
"Ġan imal",
"Ġp e",
"urp r",
"Ġs urpr",
"f e",
"Ġh o",
"Ġro om",
"Ġe at",
"ou r",
"Ġint o",
"Ġo pen",
"d en",
"Ġb oth",
"Ġfe el",
"it e",
"Ġd ad",
"Ġ ke",
"Ġon e",
"Ġn ice",
"Ġexcit ed",
"Ġm o",
"Ġth is",
"Ġa m",
"Ġfa st",
"Ġl ong",
"Ġr un",
"Ġg ra",
"in k",
"Ġs k",
"Ġro ck",
"Ġto ld",
"Ġin side",
"u ll",
"Ġpret ty",
"b b",
"in y",
"Ġp ick",
"Ġfl ower",
"Ġt r",
"Ġt ake",
"he re",
"Ġe ach",
"Ġg ave",
"Ġm uch",
"Ġsurpr is",
"Ġs l",
"Ġne ed",
"Ġto w",
"Ġh ow",
"p l",
"Ġst r",
"v en",
"m ore",
"et ter",
"Ġ or",
"h is",
"ĠA s",
"Ġu nder",
"Ġo ld",
"ist en",
"Ġl isten",
"Ġt ry",
"d y",
"g e",
"ĠO nce",
"Ġ K",
"ur t",
"p ect",
"a nd",
"Ġc le",
"Ġf ish",
"a se",
"Ġcl o",
"Ġk ind",
"Ġbe ar",
"ur n",
"Ġha nd",
"Ġf le",
"ĠW e",
"Ġt e",
"l f",
"pect ed",
"ex pected",
"Ġne ar",
"Ġco l",
"Ġcol or",
"in e",
"Ġj ust",
"Ġf ood",
"Ġf i",
"b y",
"Ġt w",
"Ġwa t",
"g ed",
"Ġh ig",
"Ġ ide",
"Ġ en",
"Ġf o",
"es s",
"ĠI n",
"Ġsk y",
"at e",
"v ing",
"Ġu s",
"Ġide a",
"Ġb etter",
"Ġhe ard",
"Ġb ug",
"g ry",
"f f",
"Ġit s",
"Ġd an",
"a c",
"Ġl et",
"i on",
"re am",
"b e",
"Ġg r",
"ec i",
"Ġcare ful",
"Ġsh are",
"Ġlo ve",
"h y",
"Ġ if",
"Ġc om",
"Ġf ly",
"Ġst or",
"Ġfle w",
"b er",
"eci al",
"Ġsp ecial",
"or t",
"Ġne ver",
"Ġb y",
"Ġw ind",
"Ġcl im",
"Ġclim b",
"Ġb u",
"Ġ N",
"r m",
"Ġ P",
"Ġd on",
"Ġt al",
"Ġcle an",
"Ġ end",
"Ġe ven",
"op le",
"o pped",
"an e",
"Ġwa it",
"Ġm ag",
"Ġh ard",
"Ġj o",
"Ġo ver",
"Ġsh iny",
"Ġb ook",
"Ġc he",
"Ġf r",
"Ġc ake",
"Ġh urt",
"Ġy um",
"Ġt urn",
"Ġpr oud",
"ad y",
"Ġg l",
"k ay",
"Ġf am",
"Ġc u",
"Ġb ad",
"Ġa fter",
"o ck",
"i z",
"Ġg ive",
"Ġsa fe",
"Ġl oud",
"Ġpe ople",
"Ġst ay",
"Ġ im",
"Ġhig h",
"Ġg ard",
"Ġgard en",
"Ġdo or",
"Ġc ome",
"Ġg round",
"Ġopen ed",
"Ġpick ed",
"d d",
"u ff",
"Ġbe a",
"il d",
"Ġf ore",
"Ġr a",
"Ġ qu",
"Ġbl ue",
"Ġwa y",
"' m",
"dd ed",
"Ġst ill",
"Ġe ver",
"i p",
"Ġhug ged",
"ag e",
"Ġc all",
"le ase",
"Ġp ic",
"Ġpl ace",
"Ġof f",
"Ġf ar",
"oug h",
"Ġmag ic",
"ĠB ut",
"Ġsh ould",
"t ure",
"ro g",
"ar y",
"Ġw o",
"ill y",
"Ġpic ture",
"Ġwal k",
"oo l",
"Ġfam ily",
"se lf",
"Ġk id",
"Ġm a",
"Ġa pp",
"e m",
"Ġn ow",
"Ġp a",
"ĠS ue",
"Ġgre at",
"Ġc a",
"Ġ R",
"Ġstr ong",
"Ġf rog",
"Ġb ra",
"Ġfore st",
"N o",
"ud den",
"Ġu nt",
"Ġb ro",
"Ġst ick",
"Ġs qu",
"c t",
"Ġunt il",
"ĠM ax",
"Ġbea ut",
"Ġt ra",
"n ing",
"m a",
"Ġn ext",
"Ġbo at",
"a k",
"Ġc ry",
"p t",
"Ġha t",
"Ġr ain",
"Ġkid s",
"Ġd ra",
"i ful",
"Ġex pl",
"Ġbeaut iful",
"ĠM om",
"Ġa d",
"Ġclo s",
"re l",
"Ġstor y",
"ĠB en",
"Ġwh ile",
"ell o",
"re ss",
"Ġtow n",
"Ġs of",
"g er",
"ĠA t",
"re e",
"Ġbe ing",
"Ġdo ll",
"Ġ G",
"v ent",
"Ġim p",
"Ġc ri",
"Ġm or",
"ĠS am",
"Ġcall ed",
"Ġm et",
"o on",
"Ġtr uck",
"is s",
"Ġg ame",
"Ġp art",
"Ġc ook",
"Ġsof t",
"Ġan gry",
"Ġke ep",
"e ar",
"Ġwa rm",
"Ġb ed",
"Ġlo st",
"Ġre m",
"Ġbra ve",
"un ny",
"Ġm ouse",
"Ġsw ing",
"Ġat e",
"Ġs n",
"Ġho le",
"o y",
"I t",
"f ore",
"s o",
"Ġwat ch",
"Ġli ked",
"Ġle ave",
"ob o",
"Ġal so",
"Ġf ell",
"Ġth ink",
"Ġf in",
"Ġgre en",
"g an",
"a z",
"Ġfa ce",
"ow l",
"Ġtw o",
"bb it",
"d ay",
"Ġ âĢ",
"uff y",
"us h",
"Ġno ise",
"Ġw here",
"o h",
"oh n",
"Ġd e",
"Ġapp le",
"Ġs ound",
"Ġcl a",
"Ġra bbit",
"a ble",
"Ġbl ock",
"Ġas k",
"ir rel",
"Ġso on",
"ĠF l",
"er s",
"j oy",
"Ġen joy",
"Ġsl ide",
"f t",
"ir st",
"Ġsqu irrel",
"Ġy ell",
"Ġbe fore",
"ug ht",
"Ġsa t",
"ĠFl uffy",
"u it",
"i ous",
"Ġu se",
"Ġke pt",
"ir ed",
"Ġsh out",
"ĠâĢ ľ",
"H i",
"âĢ Ŀ",
"le ep",
"Ġc ra",
"Ġp ain",
"c hed",
"Ġst ore",
"Ġre al",
"Ġw is",
"Ġhand s",
"a ir",
"Ġbird s",
"Ġh op",
"Ġgo ing",
"Ġha ving",
"Ġfun ny",
"Ġe y",
"Ġb re",
"Ġcat ch",
"Ġm ess",
"Ġp ull",
"Ġc on",
"Ġsmil ed",
"Ġfi x",
"Ġth r",
"em ber"
]
}
}