{"speaker_cond": true, "speaker_emb_size": 256, "tokenizer": {"name": "custom", "pat_str": "'s|'t|'re|'ve|'m|'ll|'d| ?\\p{L}+| ?\\p{N}+| ?[^\\s\\p{L}\\p{N}]+|\\s+(?!\\S)|\\s+", "mergeable_ranks": {"\u0000": 0, "\u0001": 1, "\u0002": 2, "\u0003": 3, "\u0004": 4, "\u0005": 5, "\u0006": 6, "\u0007": 7, "\b": 8, "\t": 9, "\n": 10, "\u000b": 11, "\f": 12, "\r": 13, "\u000e": 14, "\u000f": 15, "\u0010": 16, "\u0011": 17, "\u0012": 18, "\u0013": 19, "\u0014": 20, "\u0015": 21, "\u0016": 22, "\u0017": 23, "\u0018": 24, "\u0019": 25, "\u001a": 26, "\u001b": 27, "\u001c": 28, "\u001d": 29, "\u001e": 30, "\u001f": 31, " ": 32, "!": 33, "\"": 34, "#": 35, "$": 36, "%": 37, "&": 38, "'": 39, "(": 40, ")": 41, "*": 42, "+": 43, ",": 44, "-": 45, ".": 46, "/": 47, "0": 48, "1": 49, "2": 50, "3": 51, "4": 52, "5": 53, "6": 54, "7": 55, "8": 56, "9": 57, ":": 58, ";": 59, "<": 60, "=": 61, ">": 62, "?": 63, "@": 64, "A": 65, "B": 66, "C": 67, "D": 68, "E": 69, "F": 70, "G": 71, "H": 72, "I": 73, "J": 74, "K": 75, "L": 76, "M": 77, "N": 78, "O": 79, "P": 80, "Q": 81, "R": 82, "S": 83, "T": 84, "U": 85, "V": 86, "W": 87, "X": 88, "Y": 89, "Z": 90, "[": 91, "\\": 92, "]": 93, "^": 94, "_": 95, "`": 96, "a": 97, "b": 98, "c": 99, "d": 100, "e": 101, "f": 102, "g": 103, "h": 104, "i": 105, "j": 106, "k": 107, "l": 108, "m": 109, "n": 110, "o": 111, "p": 112, "q": 113, "r": 114, "s": 115, "t": 116, "u": 117, "v": 118, "w": 119, "x": 120, "y": 121, "z": 122, "{": 123, "|": 124, "}": 125, "~": 126, "\u007f": 127, "\\x80": 128, "\\x81": 129, "\\x82": 130, "\\x83": 131, "\\x84": 132, "\\x85": 133, "\\x86": 134, "\\x87": 135, "\\x88": 136, "\\x89": 137, "\\x8a": 138, "\\x8b": 139, "\\x8c": 140, "\\x8d": 141, "\\x8e": 142, "\\x8f": 143, "\\x90": 144, "\\x91": 145, "\\x92": 146, "\\x93": 147, "\\x94": 148, "\\x95": 149, "\\x96": 150, "\\x97": 151, "\\x98": 152, "\\x99": 153, "\\x9a": 154, "\\x9b": 155, "\\x9c": 156, "\\x9d": 157, "\\x9e": 158, "\\x9f": 159, "\\xa0": 160, "\\xa1": 161, "\\xa2": 162, "\\xa3": 163, "\\xa4": 164, "\\xa5": 165, "\\xa6": 166, "\\xa7": 167, "\\xa8": 168, "\\xa9": 169, "\\xaa": 170, "\\xab": 171, "\\xac": 172, "\\xad": 173, "\\xae": 174, "\\xaf": 175, "\\xb0": 176, "\\xb1": 177, "\\xb2": 178, "\\xb3": 179, "\\xb4": 180, "\\xb5": 181, "\\xb6": 182, "\\xb7": 183, "\\xb8": 184, "\\xb9": 185, "\\xba": 186, "\\xbb": 187, "\\xbc": 188, "\\xbd": 189, "\\xbe": 190, "\\xbf": 191, "\\xc0": 192, "\\xc1": 193, "\\xc2": 194, "\\xc3": 195, "\\xc4": 196, "\\xc5": 197, "\\xc6": 198, "\\xc7": 199, "\\xc8": 200, "\\xc9": 201, "\\xca": 202, "\\xcb": 203, "\\xcc": 204, "\\xcd": 205, "\\xce": 206, "\\xcf": 207, "\\xd0": 208, "\\xd1": 209, "\\xd2": 210, "\\xd3": 211, "\\xd4": 212, "\\xd5": 213, "\\xd6": 214, "\\xd7": 215, "\\xd8": 216, "\\xd9": 217, "\\xda": 218, "\\xdb": 219, "\\xdc": 220, "\\xdd": 221, "\\xde": 222, "\\xdf": 223, "\\xe0": 224, "\\xe1": 225, "\\xe2": 226, "\\xe3": 227, "\\xe4": 228, "\\xe5": 229, "\\xe6": 230, "\\xe7": 231, "\\xe8": 232, "\\xe9": 233, "\\xea": 234, "\\xeb": 235, "\\xec": 236, "\\xed": 237, "\\xee": 238, "\\xef": 239, "\\xf0": 240, "\\xf1": 241, "\\xf2": 242, "\\xf3": 243, "\\xf4": 244, "\\xf5": 245, "\\xf6": 246, "\\xf7": 247, "\\xf8": 248, "\\xf9": 249, "\\xfa": 250, "\\xfb": 251, "\\xfc": 252, "\\xfd": 253, "\\xfe": 254, "\\xff": 255, " t": 256, "he": 257, " a": 258, "in": 259, " the": 260, " w": 261, " s": 262, "re": 263, " o": 264, "nd": 265, "ha": 266, "er": 267, "ou": 268, " b": 269, "ed": 270, "is": 271, " m": 272, "it": 273, " f": 274, " c": 275, "en": 276, "on": 277, " to": 278, " of": 279, "ing": 280, " and": 281, "or": 282, " d": 283, " p": 284, "ll": 285, "es": 286, "as": 287, " h": 288, " he": 289, " l": 290, " in": 291, "ar": 292, "an": 293, " n": 294, "at": 295, " ha": 296, "om": 297, " g": 298, " be": 299, "hat": 300, "le": 301, "ot": 302, "ow": 303, "ut": 304, " e": 305, "ic": 306, "ve": 307, " was": 308, "id": 309, " y": 310, "ld": 311, "ly": 312, "im": 313, "st": 314, " th": 315, "se": 316, " it": 317, "gh": 318, " that": 319, "ent": 320, " re": 321, " you": 322, " I": 323, " on": 324, "ce": 325, "ver": 326, "ay": 327, "et": 328, " u": 329, "ion": 330, "al": 331, "ir": 332, "ith": 333, " for": 334, "The": 335, " as": 336, " his": 337, " wh": 338, " is": 339, " with": 340, " we": 341, " st": 342, "ur": 343, "ad": 344, "ght": 345, "ro": 346, " not": 347, "ac": 348, " had": 349, " an": 350, "her": 351, "ri": 352, " her": 353, "ould": 354, "oo": 355, " sa": 356, " at": 357, "ill": 358, "ke": 359, "ter": 360, "ain": 361, "am": 362, " me": 363, "if": 364, " se": 365, " him": 366, "ct": 367, "'s": 368, "red": 369, "ch": 370, ".\"": 371, " su": 372, " she": 373, " have": 374, "ess": 375, " so": 376, "il": 377, "--": 378, " M": 379, " r": 380, "ore": 381, "pp": 382, "ome": 383, " k": 384, " de": 385, "all": 386, " my": 387, "ight": 388, " said": 389, " but": 390, " fr": 391, " do": 392, " all": 393, "ul": 394, " ne": 395, ",\"": 396, "and": 397, "ge": 398, "ich": 399, " con": 400, "qu": 401, " sh": 402, " by": 403, "He": 404, " up": 405, "th": 406, "pe": 407, " they": 408, " were": 409, " this": 410, " from": 411, " ex": 412, "us": 413, " which": 414, "ust": 415, " S": 416, "ble": 417, "ant": 418, "est": 419, " whe": 420, "very": 421, "ard": 422, "res": 423, "nt": 424, " C": 425, " or": 426, " are": 427, "It": 428, " one": 429, "ous": 430, " fe": 431, "out": 432, " man": 433, "our": 434, " al": 435, " li": 436, "lf": 437, "ation": 438, "ood": 439, " no": 440, " v": 441, " them": 442, "ind": 443, " kn": 444, " \"": 445, "ers": 446, " int": 447, " would": 448, "'t": 449, "ist": 450, "os": 451, " who": 452, "em": 453, "ra": 454, "ong": 455, " will": 456, "art": 457, "ast": 458, "ked": 459, "ie": 460, " out": 461, "one": 462, "ol": 463, " ab": 464, "ound": 465, "?\"": 466, " A": 467, " there": 468, " go": 469, " wor": 470, " com": 471, " B": 472, " been": 473, " le": 474, "han": 475, "un": 476, "ak": 477, "itt": 478, "ate": 479, "um": 480, "ig": 481, " their": 482, "ell": 483, "ough": 484, "pt": 485, "ive": 486, " P": 487, " j": 488, "own": 489, "ame": 490, "ry": 491, "self": 492, " pl": 493, "ack": 494, "ort": 495, " could": 496, "ven": 497, "ake": 498, " can": 499, "reat": 500, "hed": 501, " pro": 502, "But": 503, "ther": 504, "ide": 505, " when": 506, "ace": 507, " qu": 508, "ure": 509, " ag": 510, " what": 511}, "special_tokens": {"<|endoftext|>": 512}, "offset": 2049}}