goldfish-models
commited on
Commit
•
cd3aed5
1
Parent(s):
45e7f72
Upload ton_latn_10mb tokenizer.
Browse files- added_tokens.json +1 -0
- special_tokens_map.json +1 -0
- spiece.model +3 -0
- tokenizer.json +0 -0
- tokenizer_config.json +1 -0
added_tokens.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"[XXXXX38]": 48122, "[XXXXX181]": 48265, "[XXXXX636]": 48720, "[XXXXX103]": 48187, "[XXXXX664]": 48748, "[XXXXX386]": 48470, "[XXXXX749]": 48833, "[XXXXX168]": 48252, "[XXXXX588]": 48672, "[XXXXX576]": 48660, "[XXXXX78]": 48162, "[XXXXX3]": 48087, "[XXXXX1047]": 49131, "[XXXXX577]": 48661, "[XXXXX453]": 48537, "[XXXXX782]": 48866, "[XXXXX114]": 48198, "[XXXXX353]": 48437, "[XXXXX991]": 49075, "[XXXXX780]": 48864, "[XXXXX845]": 48929, "[XXXXX553]": 48637, "[XXXXX514]": 48598, "[XXXXX689]": 48773, "[XXXXX487]": 48571, "[XXXXX329]": 48413, "[XXXXX207]": 48291, "[XXXXX398]": 48482, "[XXXXX523]": 48607, "[XXXXX656]": 48740, "[XXXXX805]": 48889, "[XXXXX528]": 48612, "[XXXXX789]": 48873, "[XXXXX125]": 48209, "[XXXXX322]": 48406, "[XXXXX548]": 48632, "[XXXXX10]": 48094, "[XXXXX755]": 48839, "[XXXXX408]": 48492, "[XXXXX1060]": 49144, "[XXXXX757]": 48841, "[XXXXX753]": 48837, "[XXXXX874]": 48958, "[XXXXX23]": 48107, "[XXXXX454]": 48538, "[XXXXX306]": 48390, "[XXXXX819]": 48903, "[XXXXX393]": 48477, "[XXXXX519]": 48603, "[XXXXX129]": 48213, "[XXXXX261]": 48345, "[XXXXX171]": 48255, "[XXXXX248]": 48332, "[XXXXX809]": 48893, "[XXXXX909]": 48993, "[XXXXX172]": 48256, "[XXXXX502]": 48586, "[XXXXX6]": 48090, "[XXXXX75]": 48159, "[XXXXX986]": 49070, "[XXXXX571]": 48655, "[XXXXX236]": 48320, "[XXXXX891]": 48975, "[XXXXX151]": 48235, "[XXXXX57]": 48141, "[XXXXX1003]": 49087, "[XXXXX1035]": 49119, "[XXXXX28]": 48112, "[XXXXX124]": 48208, "[XXXXX727]": 48811, "[XXXXX1041]": 49125, "[XXXXX705]": 48789, "[XXXXX354]": 48438, "[XXXXX66]": 48150, "[XXXXX488]": 48572, "[XXXXX1039]": 49123, "[XXXXX794]": 48878, "[XXXXX1043]": 49127, "[XXXXX369]": 48453, "[XXXXX13]": 48097, "[XXXXX128]": 48212, "[XXXXX637]": 48721, "[XXXXX401]": 48485, "[XXXXX544]": 48628, "[XXXXX24]": 48108, "[XXXXX875]": 48959, "[XXXXX942]": 49026, "[XXXXX216]": 48300, "[XXXXX834]": 48918, "[XXXXX535]": 48619, "[XXXXX773]": 48857, "[XXXXX743]": 48827, "[XXXXX902]": 48986, "[XXXXX432]": 48516, "[XXXXX989]": 49073, "[XXXXX205]": 48289, "[XXXXX70]": 48154, "[XXXXX900]": 48984, "[XXXXX880]": 48964, "[XXXXX635]": 48719, "[XXXXX714]": 48798, "[XXXXX478]": 48562, "[XXXXX718]": 48802, "[XXXXX79]": 48163, "[XXXXX670]": 48754, "[XXXXX46]": 48130, "[XXXXX8]": 48092, "[XXXXX45]": 48129, "[XXXXX247]": 48331, "[XXXXX796]": 48880, "[XXXXX225]": 48309, "[XXXXX313]": 48397, "[XXXXX196]": 48280, "[XXXXX638]": 48722, "[XXXXX56]": 48140, "[XXXXX955]": 49039, "[XXXXX611]": 48695, "[XXXXX980]": 49064, "[XXXXX58]": 48142, "[XXXXX933]": 49017, "[XXXXX1004]": 49088, "[XXXXX712]": 48796, "[XXXXX96]": 48180, "[XXXXX982]": 49066, "[XXXXX831]": 48915, "[XXXXX579]": 48663, "[XXXXX16]": 48100, "[XXXXX318]": 48402, "[XXXXX1013]": 49097, "[XXXXX620]": 48704, "[XXXXX556]": 48640, "[XXXXX108]": 48192, "[XXXXX71]": 48155, "[XXXXX258]": 48342, "[XXXXX792]": 48876, "[XXXXX1057]": 49141, "[XXXXX380]": 48464, "[XXXXX690]": 48774, "[XXXXX622]": 48706, "[XXXXX1009]": 49093, "[XXXXX993]": 49077, "[XXXXX901]": 48985, "[XXXXX410]": 48494, "[XXXXX92]": 48176, "[XXXXX1056]": 49140, "[XXXXX0]": 48084, "[XXXXX265]": 48349, "[XXXXX186]": 48270, "[XXXXX274]": 48358, "[XXXXX961]": 49045, "[XXXXX530]": 48614, "[XXXXX467]": 48551, "[XXXXX430]": 48514, "[XXXXX438]": 48522, "[XXXXX551]": 48635, "[XXXXX226]": 48310, "[XXXXX907]": 48991, "[XXXXX138]": 48222, "[XXXXX192]": 48276, "[XXXXX696]": 48780, "[XXXXX529]": 48613, "[XXXXX165]": 48249, "[XXXXX992]": 49076, "[XXXXX698]": 48782, "[XXXXX511]": 48595, "[XXXXX222]": 48306, "[XXXXX489]": 48573, "[XXXXX683]": 48767, "[XXXXX739]": 48823, "[XXXXX374]": 48458, "[XXXXX69]": 48153, "[XXXXX866]": 48950, "[XXXXX632]": 48716, "[XXXXX701]": 48785, "[XXXXX117]": 48201, "[XXXXX568]": 48652, "[XXXXX144]": 48228, "[XXXXX977]": 49061, "[XXXXX719]": 48803, "[XXXXX1025]": 49109, "[XXXXX302]": 48386, "[XXXXX928]": 49012, "[XXXXX623]": 48707, "[XXXXX1033]": 49117, "[XXXXX281]": 48365, "[XXXXX1022]": 49106, "[XXXXX1052]": 49136, "[XXXXX93]": 48177, "[XXXXX842]": 48926, "[XXXXX824]": 48908, "[XXXXX315]": 48399, "[XXXXX290]": 48374, "[XXXXX359]": 48443, "[XXXXX81]": 48165, "[XXXXX716]": 48800, "[XXXXX917]": 49001, "[XXXXX910]": 48994, "[XXXXX296]": 48380, "[XXXXX239]": 48323, "[XXXXX152]": 48236, "[XXXXX521]": 48605, "[XXXXX418]": 48502, "[XXXXX64]": 48148, "[XXXXX777]": 48861, "[XXXXX468]": 48552, "[XXXXX527]": 48611, "[XXXXX693]": 48777, "[XXXXX485]": 48569, "[XXXXX160]": 48244, "[XXXXX257]": 48341, "[XXXXX150]": 48234, "[XXXXX166]": 48250, "[XXXXX590]": 48674, "[XXXXX90]": 48174, "[XXXXX651]": 48735, "[XXXXX976]": 49060, "[XXXXX1023]": 49107, "[XXXXX407]": 48491, "[XXXXX883]": 48967, "[XXXXX649]": 48733, "[XXXXX161]": 48245, "[XXXXX9]": 48093, "[XXXXX688]": 48772, "[XXXXX214]": 48298, "[XXXXX655]": 48739, "[XXXXX801]": 48885, "[XXXXX501]": 48585, "[XXXXX919]": 49003, "[MASK]": 48083, "[XXXXX357]": 48441, "[XXXXX188]": 48272, "[XXXXX774]": 48858, "[XXXXX828]": 48912, "[XXXXX462]": 48546, "[XXXXX284]": 48368, "[XXXXX644]": 48728, "[XXXXX74]": 48158, "[XXXXX1029]": 49113, "[XXXXX256]": 48340, "[XXXXX640]": 48724, "[XXXXX734]": 48818, "[XXXXX599]": 48683, "[XXXXX189]": 48273, "[XXXXX1053]": 49137, "[XXXXX878]": 48962, "[XXXXX710]": 48794, "[XXXXX814]": 48898, "[XXXXX44]": 48128, "[XXXXX465]": 48549, "[XXXXX406]": 48490, "[XXXXX1027]": 49111, "[XXXXX587]": 48671, "[XXXXX299]": 48383, "[XXXXX499]": 48583, "[XXXXX768]": 48852, "[XXXXX413]": 48497, "[XXXXX939]": 49023, "[XXXXX970]": 49054, "[XXXXX201]": 48285, "[XXXXX507]": 48591, "[XXXXX272]": 48356, "[XXXXX440]": 48524, "[XXXXX853]": 48937, "[XXXXX109]": 48193, "[XXXXX370]": 48454, "[XXXXX127]": 48211, "[XXXXX783]": 48867, "[XXXXX235]": 48319, "[XXXXX476]": 48560, "[XXXXX751]": 48835, "[XXXXX470]": 48554, "[XXXXX255]": 48339, "[XXXXX119]": 48203, "[XXXXX889]": 48973, "[XXXXX474]": 48558, "[XXXXX162]": 48246, "[XXXXX55]": 48139, "[XXXXX859]": 48943, "[XXXXX431]": 48515, "[XXXXX263]": 48347, "[XXXXX550]": 48634, "[XXXXX833]": 48917, "[XXXXX307]": 48391, "[XXXXX382]": 48466, "[XXXXX827]": 48911, "[XXXXX18]": 48102, "[XXXXX735]": 48819, "[XXXXX1020]": 49104, "[XXXXX415]": 48499, "[XXXXX1055]": 49139, "[XXXXX368]": 48452, "[XXXXX53]": 48137, "[XXXXX695]": 48779, "[XXXXX524]": 48608, "[XXXXX251]": 48335, "[XXXXX123]": 48207, "[XXXXX402]": 48486, "[XXXXX210]": 48294, "[XXXXX126]": 48210, "[XXXXX145]": 48229, "[XXXXX12]": 48096, "[XXXXX708]": 48792, "[XXXXX958]": 49042, "[XXXXX706]": 48790, "[XXXXX573]": 48657, "[XXXXX973]": 49057, "[XXXXX1066]": 49150, "[XXXXX246]": 48330, "[XXXXX198]": 48282, "[XXXXX229]": 48313, "[XXXXX285]": 48369, "[XXXXX813]": 48897, "[XXXXX532]": 48616, "[XXXXX349]": 48433, "[XXXXX1016]": 49100, "[XXXXX59]": 48143, "[XXXXX469]": 48553, "[XXXXX703]": 48787, "[XXXXX266]": 48350, "[XXXXX327]": 48411, "[XXXXX905]": 48989, "[XXXXX941]": 49025, "[XXXXX887]": 48971, "[XXXXX554]": 48638, "[XXXXX990]": 49074, "[XXXXX1024]": 49108, "[XXXXX301]": 48385, "[XXXXX113]": 48197, "[XXXXX452]": 48536, "[XXXXX549]": 48633, "[XXXXX91]": 48175, "[XXXXX106]": 48190, "[XXXXX574]": 48658, "[XXXXX1000]": 49084, "[XXXXX278]": 48362, "[XXXXX314]": 48398, "[XXXXX311]": 48395, "[XXXXX861]": 48945, "[XXXXX219]": 48303, "[XXXXX450]": 48534, "[XXXXX480]": 48564, "[XXXXX756]": 48840, "[XXXXX444]": 48528, "[XXXXX964]": 49048, "[XXXXX36]": 48120, "[XXXXX100]": 48184, "[XXXXX208]": 48292, "[XXXXX1011]": 49095, "[XXXXX921]": 49005, "[XXXXX1061]": 49145, "[XXXXX581]": 48665, "[XXXXX283]": 48367, "[XXXXX537]": 48621, "[XXXXX112]": 48196, "[XXXXX567]": 48651, "[XXXXX397]": 48481, "[XXXXX601]": 48685, "[XXXXX52]": 48136, "[XXXXX984]": 49068, "[XXXXX822]": 48906, "[XXXXX60]": 48144, "[XXXXX343]": 48427, "[XXXXX20]": 48104, "[XXXXX987]": 49071, "[XXXXX456]": 48540, "[XXXXX436]": 48520, "[XXXXX675]": 48759, "[XXXXX694]": 48778, "[XXXXX625]": 48709, "[XXXXX595]": 48679, "[XXXXX542]": 48626, "[XXXXX557]": 48641, "[XXXXX648]": 48732, "[XXXXX788]": 48872, "[XXXXX918]": 49002, "[XXXXX726]": 48810, "[XXXXX295]": 48379, "[XXXXX215]": 48299, "[XXXXX424]": 48508, "[XXXXX373]": 48457, "[XXXXX839]": 48923, "[XXXXX395]": 48479, "[XXXXX190]": 48274, "[XXXXX183]": 48267, "[XXXXX840]": 48924, "[XXXXX366]": 48450, "[XXXXX913]": 48997, "[XXXXX906]": 48990, "[XXXXX409]": 48493, "[XXXXX463]": 48547, "[XXXXX422]": 48506, "[XXXXX854]": 48938, "[XXXXX570]": 48654, "[XXXXX603]": 48687, "[XXXXX1]": 48085, "[XXXXX602]": 48686, "[XXXXX508]": 48592, "[XXXXX981]": 49065, "[XXXXX968]": 49052, "[XXXXX341]": 48425, "[XXXXX340]": 48424, "[XXXXX885]": 48969, "[XXXXX691]": 48775, "[XXXXX761]": 48845, "[XXXXX459]": 48543, "[XXXXX95]": 48179, "[XXXXX810]": 48894, "[XXXXX652]": 48736, "[XXXXX800]": 48884, "[XXXXX1048]": 49132, "[XXXXX911]": 48995, "[XXXXX969]": 49053, "[XXXXX806]": 48890, "[XXXXX490]": 48574, "[XXXXX67]": 48151, "[XXXXX297]": 48381, "[XXXXX983]": 49067, "[XXXXX195]": 48279, "[XXXXX785]": 48869, "[XXXXX1037]": 49121, "[XXXXX665]": 48749, "[XXXXX178]": 48262, "[XXXXX35]": 48119, "[XXXXX419]": 48503, "[XXXXX231]": 48315, "[XXXXX737]": 48821, "[XXXXX630]": 48714, "[XXXXX730]": 48814, "[XXXXX879]": 48963, "[XXXXX321]": 48405, "[XXXXX812]": 48896, "[XXXXX862]": 48946, "[XXXXX390]": 48474, "[XXXXX575]": 48659, "[XXXXX497]": 48581, "[XXXXX775]": 48859, "[XXXXX1044]": 49128, "[XXXXX927]": 49011, "[XXXXX1002]": 49086, "[XXXXX924]": 49008, "[XXXXX428]": 48512, "[XXXXX473]": 48557, "[XXXXX584]": 48668, "[XXXXX795]": 48879, "[XXXXX358]": 48442, "[XXXXX447]": 48531, "[XXXXX427]": 48511, "[XXXXX140]": 48224, "[XXXXX417]": 48501, "[XXXXX616]": 48700, "[XXXXX80]": 48164, "[XXXXX898]": 48982, "[XXXXX362]": 48446, "[XXXXX960]": 49044, "[XXXXX631]": 48715, "[XXXXX717]": 48801, "[XXXXX61]": 48145, "[XXXXX784]": 48868, "[XXXXX316]": 48400, "[XXXXX118]": 48202, "[XXXXX803]": 48887, "[XXXXX978]": 49062, "[XXXXX199]": 48283, "[XXXXX674]": 48758, "[XXXXX972]": 49056, "[XXXXX858]": 48942, "[XXXXX565]": 48649, "[XXXXX825]": 48909, "[XXXXX389]": 48473, "[XXXXX268]": 48352, "[XXXXX721]": 48805, "[XXXXX915]": 48999, "[XXXXX957]": 49041, "[XXXXX540]": 48624, "[XXXXX948]": 49032, "[XXXXX934]": 49018, "[XXXXX224]": 48308, "[XXXXX197]": 48281, "[XXXXX1008]": 49092, "[XXXXX491]": 48575, "[XXXXX326]": 48410, "[XXXXX139]": 48223, "[XXXXX679]": 48763, "[XXXXX1064]": 49148, "[XXXXX317]": 48401, "[XXXXX1046]": 49130, "[XXXXX745]": 48829, "[XXXXX1058]": 49142, "[XXXXX173]": 48257, "[XXXXX233]": 48317, "[XXXXX1006]": 49090, "[XXXXX288]": 48372, "[SEP]": 48081, "[XXXXX481]": 48565, "[XXXXX912]": 48996, "[XXXXX517]": 48601, "[XXXXX765]": 48849, "[XXXXX741]": 48825, "[XXXXX709]": 48793, "[XXXXX615]": 48699, "[XXXXX882]": 48966, "[XXXXX837]": 48921, "[XXXXX437]": 48521, "[XXXXX48]": 48132, "[XXXXX385]": 48469, "[XXXXX645]": 48729, "[XXXXX888]": 48972, "[XXXXX817]": 48901, "[XXXXX101]": 48185, "[XXXXX759]": 48843, "[XXXXX32]": 48116, "[XXXXX699]": 48783, "[XXXXX42]": 48126, "[XXXXX458]": 48542, "[XXXXX475]": 48559, "[XXXXX253]": 48337, "[XXXXX952]": 49036, "[XXXXX486]": 48570, "[XXXXX135]": 48219, "[XXXXX890]": 48974, "[XXXXX376]": 48460, "[XXXXX818]": 48902, "[XXXXX610]": 48694, "[XXXXX421]": 48505, "[XXXXX663]": 48747, "[XXXXX779]": 48863, "[XXXXX971]": 49055, "[XXXXX107]": 48191, "[XXXXX566]": 48650, "[XXXXX493]": 48577, "[XXXXX72]": 48156, "[XXXXX720]": 48804, "[XXXXX762]": 48846, "[XXXXX484]": 48568, "[XXXXX141]": 48225, "[XXXXX377]": 48461, "[XXXXX1031]": 49115, "[XXXXX851]": 48935, "[XXXXX243]": 48327, "<pad>": 48082, "[XXXXX654]": 48738, "[XXXXX995]": 49079, "[XXXXX954]": 49038, "[XXXXX923]": 49007, "[XXXXX73]": 48157, "[XXXXX68]": 48152, "[XXXXX403]": 48487, "[XXXXX304]": 48388, "[XXXXX732]": 48816, "[XXXXX443]": 48527, "[XXXXX332]": 48416, "[XXXXX686]": 48770, "[XXXXX15]": 48099, "[XXXXX1021]": 49105, "[XXXXX881]": 48965, "[XXXXX692]": 48776, "[XXXXX294]": 48378, "[XXXXX99]": 48183, "[XXXXX598]": 48682, "[XXXXX937]": 49021, "[XXXXX605]": 48689, "[XXXXX1042]": 49126, "[XXXXX559]": 48643, "[XXXXX87]": 48171, "[XXXXX676]": 48760, "[XXXXX920]": 49004, "[XXXXX204]": 48288, "[XXXXX241]": 48325, "[XXXXX797]": 48881, "[XXXXX808]": 48892, "[XXXXX133]": 48217, "[XXXXX661]": 48745, "[XXXXX835]": 48919, "[XXXXX931]": 49015, "[XXXXX34]": 48118, "[XXXXX292]": 48376, "[XXXXX660]": 48744, "[XXXXX672]": 48756, "[XXXXX163]": 48247, "[XXXXX289]": 48373, "[XXXXX121]": 48205, "[XXXXX344]": 48428, "[XXXXX286]": 48370, "[XXXXX849]": 48933, "[XXXXX998]": 49082, "[XXXXX414]": 48498, "[XXXXX405]": 48489, "[XXXXX287]": 48371, "[XXXXX275]": 48359, "[XXXXX1036]": 49120, "[XXXXX767]": 48851, "[XXXXX1063]": 49147, "[XXXXX763]": 48847, "[XXXXX153]": 48237, "[XXXXX227]": 48311, "[XXXXX711]": 48795, "[XXXXX555]": 48639, "[XXXXX678]": 48762, "[XXXXX776]": 48860, "[XXXXX870]": 48954, "[XXXXX646]": 48730, "[XXXXX561]": 48645, "[XXXXX769]": 48853, "[XXXXX979]": 49063, "[XXXXX137]": 48221, "[XXXXX334]": 48418, "[XXXXX170]": 48254, "[XXXXX88]": 48172, "[XXXXX17]": 48101, "[XXXXX738]": 48822, "[XXXXX303]": 48387, "[XXXXX325]": 48409, "[XXXXX606]": 48690, "[XXXXX506]": 48590, "[XXXXX254]": 48338, "[XXXXX671]": 48755, "[XXXXX130]": 48214, "[XXXXX336]": 48420, "[XXXXX1059]": 49143, "[XXXXX182]": 48266, "[XXXXX105]": 48189, "[XXXXX781]": 48865, "[XXXXX22]": 48106, "[XXXXX787]": 48871, "[XXXXX174]": 48258, "[XXXXX659]": 48743, "[XXXXX47]": 48131, "[XXXXX790]": 48874, "[XXXXX209]": 48293, "[XXXXX83]": 48167, "[XXXXX305]": 48389, "[XXXXX592]": 48676, "[XXXXX148]": 48232, "[XXXXX526]": 48610, "[XXXXX355]": 48439, "[XXXXX545]": 48629, "[XXXXX309]": 48393, "[XXXXX37]": 48121, "[XXXXX564]": 48648, "[XXXXX503]": 48587, "[XXXXX310]": 48394, "[XXXXX668]": 48752, "[XXXXX149]": 48233, "[XXXXX850]": 48934, "[XXXXX384]": 48468, "[XXXXX1007]": 49091, "[XXXXX212]": 48296, "[XXXXX496]": 48580, "[XXXXX396]": 48480, "[XXXXX873]": 48957, "[XXXXX848]": 48932, "[XXXXX597]": 48681, "[XXXXX1051]": 49135, "[XXXXX820]": 48904, "[XXXXX1001]": 49085, "[XXXXX841]": 48925, "[XXXXX360]": 48444, "[XXXXX633]": 48717, "[XXXXX930]": 49014, "[XXXXX155]": 48239, "[XXXXX533]": 48617, "[XXXXX846]": 48930, "[XXXXX802]": 48886, "[XXXXX746]": 48830, "[XXXXX791]": 48875, "[XXXXX935]": 49019, "[XXXXX169]": 48253, "[XXXXX903]": 48987, "[XXXXX538]": 48622, "[XXXXX951]": 49035, "[XXXXX520]": 48604, "[XXXXX895]": 48979, "[XXXXX513]": 48597, "[XXXXX847]": 48931, "[XXXXX713]": 48797, "[XXXXX657]": 48741, "[XXXXX541]": 48625, "[XXXXX280]": 48364, "[XXXXX351]": 48435, "[XXXXX423]": 48507, "[XXXXX771]": 48855, "[XXXXX884]": 48968, "[XXXXX722]": 48806, "[XXXXX932]": 49016, "[XXXXX985]": 49069, "[XXXXX411]": 48495, "[XXXXX869]": 48953, "[XXXXX926]": 49010, "[XXXXX76]": 48160, "[XXXXX29]": 48113, "[XXXXX681]": 48765, "[XXXXX449]": 48533, "[XXXXX132]": 48216, "[XXXXX829]": 48913, "[XXXXX856]": 48940, "[XXXXX516]": 48600, "[XXXXX627]": 48711, "[XXXXX894]": 48978, "[XXXXX312]": 48396, "[XXXXX863]": 48947, "[XXXXX426]": 48510, "[XXXXX736]": 48820, "[XXXXX451]": 48535, "[XXXXX772]": 48856, "[XXXXX943]": 49027, "[XXXXX963]": 49047, "[XXXXX175]": 48259, "[XXXXX974]": 49058, "[XXXXX621]": 48705, "[XXXXX1050]": 49134, "[XXXXX383]": 48467, "[XXXXX1010]": 49094, "[XXXXX685]": 48769, "[XXXXX498]": 48582, "[XXXXX994]": 49078, "[XXXXX715]": 48799, "[XXXXX770]": 48854, "[XXXXX617]": 48701, "[XXXXX363]": 48447, "[XXXXX220]": 48304, "[XXXXX997]": 49081, "[XXXXX134]": 48218, "[XXXXX760]": 48844, "[XXXXX270]": 48354, "[XXXXX925]": 49009, "[XXXXX471]": 48555, "[XXXXX494]": 48578, "[XXXXX260]": 48344, "[XXXXX793]": 48877, "[XXXXX872]": 48956, "[XXXXX562]": 48646, "[XXXXX1067]": 49151, "[XXXXX472]": 48556, "[XXXXX558]": 48642, "[XXXXX240]": 48324, "[XXXXX546]": 48630, "[XXXXX764]": 48848, "[XXXXX238]": 48322, "[XXXXX43]": 48127, "[XXXXX877]": 48961, "[XXXXX63]": 48147, "[XXXXX445]": 48529, "[XXXXX110]": 48194, "[XXXXX707]": 48791, "[XXXXX512]": 48596, "[XXXXX504]": 48588, "[XXXXX697]": 48781, "[XXXXX25]": 48109, "[XXXXX589]": 48673, "[XXXXX857]": 48941, "[XXXXX725]": 48809, "[XXXXX429]": 48513, "[XXXXX619]": 48703, "[XXXXX667]": 48751, "[XXXXX585]": 48669, "[XXXXX662]": 48746, "[XXXXX33]": 48117, "[XXXXX111]": 48195, "[XXXXX187]": 48271, "[XXXXX949]": 49033, "[XXXXX563]": 48647, "[XXXXX899]": 48983, "[XXXXX687]": 48771, "[XXXXX387]": 48471, "[XXXXX300]": 48384, "[XXXXX505]": 48589, "[XXXXX823]": 48907, "[XXXXX51]": 48135, "[XXXXX740]": 48824, "[XXXXX1065]": 49149, "[XXXXX85]": 48169, "[XXXXX262]": 48346, "[XXXXX908]": 48992, "[XXXXX778]": 48862, "[XXXXX1062]": 49146, "[XXXXX758]": 48842, "[XXXXX221]": 48305, "[XXXXX947]": 49031, "[XXXXX904]": 48988, "[XXXXX102]": 48186, "[XXXXX929]": 49013, "[XXXXX1026]": 49110, "[XXXXX62]": 48146, "[XXXXX752]": 48836, "[XXXXX98]": 48182, "[XXXXX836]": 48920, "[XXXXX1030]": 49114, "[XXXXX158]": 48242, "[XXXXX868]": 48952, "[XXXXX613]": 48697, "[XXXXX922]": 49006, "[XXXXX798]": 48882, "[XXXXX967]": 49051, "[XXXXX641]": 48725, "[XXXXX180]": 48264, "[XXXXX234]": 48318, "[XXXXX677]": 48761, "[XXXXX164]": 48248, "[XXXXX821]": 48905, "[XXXXX945]": 49029, "[XXXXX946]": 49030, "[XXXXX1005]": 49089, "[XXXXX335]": 48419, "[XXXXX477]": 48561, "[XXXXX531]": 48615, "[XXXXX412]": 48496, "[XXXXX356]": 48440, "[XXXXX893]": 48977, "[XXXXX586]": 48670, "[XXXXX936]": 49020, "[XXXXX522]": 48606, "[XXXXX147]": 48231, "[XXXXX852]": 48936, "[XXXXX1054]": 49138, "[XXXXX457]": 48541, "[XXXXX65]": 48149, "[XXXXX624]": 48708, "[XXXXX394]": 48478, "[XXXXX116]": 48200, "[XXXXX211]": 48295, "[XXXXX136]": 48220, "[XXXXX146]": 48230, "[XXXXX700]": 48784, "[XXXXX1019]": 49103, "[XXXXX1045]": 49129, "[XXXXX543]": 48627, "[XXXXX680]": 48764, "[XXXXX742]": 48826, "[XXXXX728]": 48812, "[XXXXX86]": 48170, "[XXXXX230]": 48314, "[XXXXX855]": 48939, "[XXXXX184]": 48268, "[XXXXX999]": 49083, "[XXXXX217]": 48301, "[XXXXX634]": 48718, "[XXXXX583]": 48667, "[XXXXX237]": 48321, "[XXXXX324]": 48408, "[XXXXX259]": 48343, "[XXXXX607]": 48691, "[XXXXX381]": 48465, "[XXXXX483]": 48567, "[XXXXX826]": 48910, "[XXXXX19]": 48103, "[XXXXX653]": 48737, "[XXXXX264]": 48348, "[XXXXX277]": 48361, "[XXXXX319]": 48403, "[XXXXX194]": 48278, "[XXXXX267]": 48351, "[XXXXX425]": 48509, "[XXXXX213]": 48297, "[XXXXX509]": 48593, "[XXXXX5]": 48089, "[XXXXX876]": 48960, "[XXXXX156]": 48240, "[XXXXX626]": 48710, "[XXXXX400]": 48484, "[XXXXX534]": 48618, "[XXXXX282]": 48366, "[XXXXX293]": 48377, "[XXXXX724]": 48808, "[XXXXX77]": 48161, "[XXXXX492]": 48576, "[XXXXX89]": 48173, "[XXXXX269]": 48353, "[XXXXX442]": 48526, "[XXXXX916]": 49000, "[XXXXX580]": 48664, "[XXXXX14]": 48098, "[XXXXX30]": 48114, "[XXXXX330]": 48414, "[XXXXX897]": 48981, "[XXXXX838]": 48922, "[XXXXX704]": 48788, "[XXXXX867]": 48951, "[XXXXX206]": 48290, "[XXXXX40]": 48124, "[CLS]": 48080, "[XXXXX629]": 48713, "[XXXXX748]": 48832, "[XXXXX747]": 48831, "[XXXXX466]": 48550, "[XXXXX525]": 48609, "[XXXXX320]": 48404, "[XXXXX799]": 48883, "[XXXXX500]": 48584, "[XXXXX811]": 48895, "[XXXXX950]": 49034, "[XXXXX966]": 49050, "[XXXXX1017]": 49101, "[XXXXX346]": 48430, "[XXXXX27]": 48111, "[XXXXX120]": 48204, "[XXXXX975]": 49059, "[XXXXX1012]": 49096, "[XXXXX956]": 49040, "[XXXXX159]": 48243, "[XXXXX642]": 48726, "[XXXXX218]": 48302, "[XXXXX142]": 48226, "[XXXXX578]": 48662, "[XXXXX223]": 48307, "[XXXXX391]": 48475, "[XXXXX252]": 48336, "[XXXXX388]": 48472, "[XXXXX953]": 49037, "[XXXXX539]": 48623, "[XXXXX446]": 48530, "[XXXXX378]": 48462, "[XXXXX245]": 48329, "[XXXXX1040]": 49124, "[XXXXX639]": 48723, "[XXXXX342]": 48426, "[XXXXX21]": 48105, "[XXXXX104]": 48188, "[XXXXX815]": 48899, "[XXXXX844]": 48928, "[XXXXX1015]": 49099, "[XXXXX702]": 48786, "[XXXXX865]": 48949, "[XXXXX434]": 48518, "[XXXXX372]": 48456, "[XXXXX914]": 48998, "[XXXXX31]": 48115, "[XXXXX1032]": 49116, "[XXXXX448]": 48532, "[XXXXX593]": 48677, "[XXXXX547]": 48631, "[XXXXX2]": 48086, "[XXXXX41]": 48125, "[XXXXX365]": 48449, "[XXXXX871]": 48955, "[XXXXX276]": 48360, "[XXXXX392]": 48476, "[XXXXX273]": 48357, "[XXXXX843]": 48927, "[XXXXX435]": 48519, "[XXXXX896]": 48980, "[XXXXX464]": 48548, "[XXXXX786]": 48870, "[XXXXX279]": 48363, "[XXXXX669]": 48753, "[XXXXX333]": 48417, "[XXXXX1018]": 49102, "[XXXXX244]": 48328, "[XXXXX455]": 48539, "[XXXXX193]": 48277, "[XXXXX495]": 48579, "[XXXXX345]": 48429, "[XXXXX404]": 48488, "[XXXXX250]": 48334, "[XXXXX518]": 48602, "[XXXXX608]": 48692, "[XXXXX643]": 48727, "[XXXXX682]": 48766, "[XXXXX232]": 48316, "[XXXXX988]": 49072, "[XXXXX959]": 49043, "[XXXXX886]": 48970, "[XXXXX536]": 48620, "[XXXXX614]": 48698, "[XXXXX371]": 48455, "[XXXXX122]": 48206, "[XXXXX673]": 48757, "[XXXXX944]": 49028, "[XXXXX1038]": 49122, "[XXXXX461]": 48545, "[XXXXX143]": 48227, "[XXXXX308]": 48392, "[XXXXX552]": 48636, "[XXXXX750]": 48834, "[XXXXX830]": 48914, "[XXXXX892]": 48976, "[XXXXX816]": 48900, "[XXXXX433]": 48517, "[XXXXX600]": 48684, "[XXXXX367]": 48451, "[XXXXX271]": 48355, "[XXXXX200]": 48284, "[XXXXX154]": 48238, "[XXXXX938]": 49022, "[XXXXX832]": 48916, "[XXXXX291]": 48375, "[XXXXX439]": 48523, "[XXXXX1049]": 49133, "[XXXXX754]": 48838, "[XXXXX569]": 48653, "[XXXXX7]": 48091, "[XXXXX364]": 48448, "[XXXXX731]": 48815, "[XXXXX337]": 48421, "[XXXXX328]": 48412, "[XXXXX647]": 48731, "[XXXXX684]": 48768, "[XXXXX420]": 48504, "[XXXXX1028]": 49112, "[XXXXX191]": 48275, "[XXXXX375]": 48459, "[XXXXX11]": 48095, "[XXXXX658]": 48742, "[XXXXX1034]": 49118, "[XXXXX582]": 48666, "[XXXXX515]": 48599, "[XXXXX996]": 49080, "[XXXXX609]": 48693, "[XXXXX131]": 48215, "[XXXXX203]": 48287, "[XXXXX185]": 48269, "[XXXXX723]": 48807, "[XXXXX167]": 48251, "[XXXXX594]": 48678, "[XXXXX510]": 48594, "[XXXXX399]": 48483, "[XXXXX331]": 48415, "[XXXXX50]": 48134, "[XXXXX591]": 48675, "[XXXXX962]": 49046, "[XXXXX864]": 48948, "[XXXXX650]": 48734, "[XXXXX361]": 48445, "[XXXXX733]": 48817, "[XXXXX352]": 48436, "[XXXXX379]": 48463, "[XXXXX228]": 48312, "[XXXXX350]": 48434, "[XXXXX4]": 48088, "[XXXXX618]": 48702, "[XXXXX97]": 48181, "[XXXXX347]": 48431, "[XXXXX628]": 48712, "[XXXXX202]": 48286, "[XXXXX744]": 48828, "[XXXXX1014]": 49098, "[XXXXX339]": 48423, "[XXXXX460]": 48544, "[XXXXX26]": 48110, "[XXXXX416]": 48500, "[XXXXX54]": 48138, "[XXXXX479]": 48563, "[XXXXX157]": 48241, "[XXXXX177]": 48261, "[XXXXX179]": 48263, "[XXXXX84]": 48168, "[XXXXX115]": 48199, "[XXXXX94]": 48178, "[XXXXX249]": 48333, "[XXXXX242]": 48326, "[XXXXX604]": 48688, "[XXXXX39]": 48123, "[XXXXX572]": 48656, "[XXXXX766]": 48850, "[XXXXX729]": 48813, "[XXXXX482]": 48566, "[XXXXX49]": 48133, "[XXXXX82]": 48166, "[XXXXX612]": 48696, "[XXXXX348]": 48432, "[XXXXX323]": 48407, "[XXXXX441]": 48525, "[XXXXX804]": 48888, "[XXXXX666]": 48750, "[XXXXX338]": 48422, "[XXXXX940]": 49024, "[XXXXX860]": 48944, "[XXXXX560]": 48644, "[XXXXX596]": 48680, "[XXXXX176]": 48260, "[XXXXX965]": 49049, "[XXXXX807]": 48891, "[XXXXX298]": 48382}
|
special_tokens_map.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"bos_token": "[CLS]", "eos_token": "[SEP]", "unk_token": "<unk>", "sep_token": "[SEP]", "pad_token": "<pad>", "cls_token": "[CLS]", "mask_token": {"content": "[MASK]", "single_word": false, "lstrip": true, "rstrip": false, "normalized": false}, "additional_special_tokens": ["[XXXXX0]", "[XXXXX1]", "[XXXXX2]", "[XXXXX3]", "[XXXXX4]", "[XXXXX5]", "[XXXXX6]", "[XXXXX7]", "[XXXXX8]", "[XXXXX9]", "[XXXXX10]", "[XXXXX11]", "[XXXXX12]", "[XXXXX13]", "[XXXXX14]", "[XXXXX15]", "[XXXXX16]", "[XXXXX17]", "[XXXXX18]", "[XXXXX19]", "[XXXXX20]", "[XXXXX21]", "[XXXXX22]", "[XXXXX23]", "[XXXXX24]", "[XXXXX25]", "[XXXXX26]", "[XXXXX27]", "[XXXXX28]", "[XXXXX29]", "[XXXXX30]", "[XXXXX31]", "[XXXXX32]", "[XXXXX33]", "[XXXXX34]", "[XXXXX35]", "[XXXXX36]", "[XXXXX37]", "[XXXXX38]", "[XXXXX39]", "[XXXXX40]", "[XXXXX41]", "[XXXXX42]", "[XXXXX43]", "[XXXXX44]", "[XXXXX45]", "[XXXXX46]", "[XXXXX47]", "[XXXXX48]", "[XXXXX49]", "[XXXXX50]", "[XXXXX51]", "[XXXXX52]", "[XXXXX53]", "[XXXXX54]", "[XXXXX55]", "[XXXXX56]", "[XXXXX57]", "[XXXXX58]", "[XXXXX59]", "[XXXXX60]", "[XXXXX61]", "[XXXXX62]", "[XXXXX63]", "[XXXXX64]", "[XXXXX65]", "[XXXXX66]", "[XXXXX67]", "[XXXXX68]", "[XXXXX69]", "[XXXXX70]", "[XXXXX71]", "[XXXXX72]", "[XXXXX73]", "[XXXXX74]", "[XXXXX75]", "[XXXXX76]", "[XXXXX77]", "[XXXXX78]", "[XXXXX79]", "[XXXXX80]", "[XXXXX81]", "[XXXXX82]", "[XXXXX83]", "[XXXXX84]", "[XXXXX85]", "[XXXXX86]", "[XXXXX87]", "[XXXXX88]", "[XXXXX89]", "[XXXXX90]", "[XXXXX91]", "[XXXXX92]", "[XXXXX93]", "[XXXXX94]", "[XXXXX95]", "[XXXXX96]", "[XXXXX97]", "[XXXXX98]", "[XXXXX99]", "[XXXXX100]", "[XXXXX101]", "[XXXXX102]", "[XXXXX103]", "[XXXXX104]", "[XXXXX105]", "[XXXXX106]", "[XXXXX107]", "[XXXXX108]", "[XXXXX109]", "[XXXXX110]", "[XXXXX111]", "[XXXXX112]", "[XXXXX113]", "[XXXXX114]", "[XXXXX115]", "[XXXXX116]", "[XXXXX117]", "[XXXXX118]", "[XXXXX119]", "[XXXXX120]", "[XXXXX121]", "[XXXXX122]", "[XXXXX123]", "[XXXXX124]", "[XXXXX125]", "[XXXXX126]", "[XXXXX127]", "[XXXXX128]", "[XXXXX129]", "[XXXXX130]", "[XXXXX131]", "[XXXXX132]", "[XXXXX133]", "[XXXXX134]", "[XXXXX135]", "[XXXXX136]", "[XXXXX137]", "[XXXXX138]", "[XXXXX139]", "[XXXXX140]", "[XXXXX141]", "[XXXXX142]", "[XXXXX143]", "[XXXXX144]", "[XXXXX145]", "[XXXXX146]", "[XXXXX147]", "[XXXXX148]", "[XXXXX149]", "[XXXXX150]", "[XXXXX151]", "[XXXXX152]", "[XXXXX153]", "[XXXXX154]", "[XXXXX155]", "[XXXXX156]", "[XXXXX157]", "[XXXXX158]", "[XXXXX159]", "[XXXXX160]", "[XXXXX161]", "[XXXXX162]", "[XXXXX163]", "[XXXXX164]", "[XXXXX165]", "[XXXXX166]", "[XXXXX167]", "[XXXXX168]", "[XXXXX169]", "[XXXXX170]", "[XXXXX171]", "[XXXXX172]", "[XXXXX173]", "[XXXXX174]", "[XXXXX175]", "[XXXXX176]", "[XXXXX177]", "[XXXXX178]", "[XXXXX179]", "[XXXXX180]", "[XXXXX181]", "[XXXXX182]", "[XXXXX183]", "[XXXXX184]", "[XXXXX185]", "[XXXXX186]", "[XXXXX187]", "[XXXXX188]", "[XXXXX189]", "[XXXXX190]", "[XXXXX191]", "[XXXXX192]", "[XXXXX193]", "[XXXXX194]", "[XXXXX195]", "[XXXXX196]", "[XXXXX197]", "[XXXXX198]", "[XXXXX199]", "[XXXXX200]", "[XXXXX201]", "[XXXXX202]", "[XXXXX203]", "[XXXXX204]", "[XXXXX205]", "[XXXXX206]", "[XXXXX207]", "[XXXXX208]", "[XXXXX209]", "[XXXXX210]", "[XXXXX211]", "[XXXXX212]", "[XXXXX213]", "[XXXXX214]", "[XXXXX215]", "[XXXXX216]", "[XXXXX217]", "[XXXXX218]", "[XXXXX219]", "[XXXXX220]", "[XXXXX221]", "[XXXXX222]", "[XXXXX223]", "[XXXXX224]", "[XXXXX225]", "[XXXXX226]", "[XXXXX227]", "[XXXXX228]", "[XXXXX229]", "[XXXXX230]", "[XXXXX231]", "[XXXXX232]", "[XXXXX233]", "[XXXXX234]", "[XXXXX235]", "[XXXXX236]", "[XXXXX237]", "[XXXXX238]", "[XXXXX239]", "[XXXXX240]", "[XXXXX241]", "[XXXXX242]", "[XXXXX243]", "[XXXXX244]", "[XXXXX245]", "[XXXXX246]", "[XXXXX247]", "[XXXXX248]", "[XXXXX249]", "[XXXXX250]", "[XXXXX251]", "[XXXXX252]", "[XXXXX253]", "[XXXXX254]", "[XXXXX255]", "[XXXXX256]", "[XXXXX257]", "[XXXXX258]", "[XXXXX259]", "[XXXXX260]", "[XXXXX261]", "[XXXXX262]", "[XXXXX263]", "[XXXXX264]", "[XXXXX265]", "[XXXXX266]", "[XXXXX267]", "[XXXXX268]", "[XXXXX269]", "[XXXXX270]", "[XXXXX271]", "[XXXXX272]", "[XXXXX273]", "[XXXXX274]", "[XXXXX275]", "[XXXXX276]", "[XXXXX277]", "[XXXXX278]", "[XXXXX279]", "[XXXXX280]", "[XXXXX281]", "[XXXXX282]", "[XXXXX283]", "[XXXXX284]", "[XXXXX285]", "[XXXXX286]", "[XXXXX287]", "[XXXXX288]", "[XXXXX289]", "[XXXXX290]", "[XXXXX291]", "[XXXXX292]", "[XXXXX293]", "[XXXXX294]", "[XXXXX295]", "[XXXXX296]", "[XXXXX297]", "[XXXXX298]", "[XXXXX299]", "[XXXXX300]", "[XXXXX301]", "[XXXXX302]", "[XXXXX303]", "[XXXXX304]", "[XXXXX305]", "[XXXXX306]", "[XXXXX307]", "[XXXXX308]", "[XXXXX309]", "[XXXXX310]", "[XXXXX311]", "[XXXXX312]", "[XXXXX313]", "[XXXXX314]", "[XXXXX315]", "[XXXXX316]", "[XXXXX317]", "[XXXXX318]", "[XXXXX319]", "[XXXXX320]", "[XXXXX321]", "[XXXXX322]", "[XXXXX323]", "[XXXXX324]", "[XXXXX325]", "[XXXXX326]", "[XXXXX327]", "[XXXXX328]", "[XXXXX329]", "[XXXXX330]", "[XXXXX331]", "[XXXXX332]", "[XXXXX333]", "[XXXXX334]", "[XXXXX335]", "[XXXXX336]", "[XXXXX337]", "[XXXXX338]", "[XXXXX339]", "[XXXXX340]", "[XXXXX341]", "[XXXXX342]", "[XXXXX343]", "[XXXXX344]", "[XXXXX345]", "[XXXXX346]", "[XXXXX347]", "[XXXXX348]", "[XXXXX349]", "[XXXXX350]", "[XXXXX351]", "[XXXXX352]", "[XXXXX353]", "[XXXXX354]", "[XXXXX355]", "[XXXXX356]", "[XXXXX357]", "[XXXXX358]", "[XXXXX359]", "[XXXXX360]", "[XXXXX361]", "[XXXXX362]", "[XXXXX363]", "[XXXXX364]", "[XXXXX365]", "[XXXXX366]", "[XXXXX367]", "[XXXXX368]", "[XXXXX369]", "[XXXXX370]", "[XXXXX371]", "[XXXXX372]", "[XXXXX373]", "[XXXXX374]", "[XXXXX375]", "[XXXXX376]", "[XXXXX377]", "[XXXXX378]", "[XXXXX379]", "[XXXXX380]", "[XXXXX381]", "[XXXXX382]", "[XXXXX383]", "[XXXXX384]", "[XXXXX385]", "[XXXXX386]", "[XXXXX387]", "[XXXXX388]", "[XXXXX389]", "[XXXXX390]", "[XXXXX391]", "[XXXXX392]", "[XXXXX393]", "[XXXXX394]", "[XXXXX395]", "[XXXXX396]", "[XXXXX397]", "[XXXXX398]", "[XXXXX399]", "[XXXXX400]", "[XXXXX401]", "[XXXXX402]", "[XXXXX403]", "[XXXXX404]", "[XXXXX405]", "[XXXXX406]", "[XXXXX407]", "[XXXXX408]", "[XXXXX409]", "[XXXXX410]", "[XXXXX411]", "[XXXXX412]", "[XXXXX413]", "[XXXXX414]", "[XXXXX415]", "[XXXXX416]", "[XXXXX417]", "[XXXXX418]", "[XXXXX419]", "[XXXXX420]", "[XXXXX421]", "[XXXXX422]", "[XXXXX423]", "[XXXXX424]", "[XXXXX425]", "[XXXXX426]", "[XXXXX427]", "[XXXXX428]", "[XXXXX429]", "[XXXXX430]", "[XXXXX431]", "[XXXXX432]", "[XXXXX433]", "[XXXXX434]", "[XXXXX435]", "[XXXXX436]", "[XXXXX437]", "[XXXXX438]", "[XXXXX439]", "[XXXXX440]", "[XXXXX441]", "[XXXXX442]", "[XXXXX443]", "[XXXXX444]", "[XXXXX445]", "[XXXXX446]", "[XXXXX447]", "[XXXXX448]", "[XXXXX449]", "[XXXXX450]", "[XXXXX451]", "[XXXXX452]", "[XXXXX453]", "[XXXXX454]", "[XXXXX455]", "[XXXXX456]", "[XXXXX457]", "[XXXXX458]", "[XXXXX459]", "[XXXXX460]", "[XXXXX461]", "[XXXXX462]", "[XXXXX463]", "[XXXXX464]", "[XXXXX465]", "[XXXXX466]", "[XXXXX467]", "[XXXXX468]", "[XXXXX469]", "[XXXXX470]", "[XXXXX471]", "[XXXXX472]", "[XXXXX473]", "[XXXXX474]", "[XXXXX475]", "[XXXXX476]", "[XXXXX477]", "[XXXXX478]", "[XXXXX479]", "[XXXXX480]", "[XXXXX481]", "[XXXXX482]", "[XXXXX483]", "[XXXXX484]", "[XXXXX485]", "[XXXXX486]", "[XXXXX487]", "[XXXXX488]", "[XXXXX489]", "[XXXXX490]", "[XXXXX491]", "[XXXXX492]", "[XXXXX493]", "[XXXXX494]", "[XXXXX495]", "[XXXXX496]", "[XXXXX497]", "[XXXXX498]", "[XXXXX499]", "[XXXXX500]", "[XXXXX501]", "[XXXXX502]", "[XXXXX503]", "[XXXXX504]", "[XXXXX505]", "[XXXXX506]", "[XXXXX507]", "[XXXXX508]", "[XXXXX509]", "[XXXXX510]", "[XXXXX511]", "[XXXXX512]", "[XXXXX513]", "[XXXXX514]", "[XXXXX515]", "[XXXXX516]", "[XXXXX517]", "[XXXXX518]", "[XXXXX519]", "[XXXXX520]", "[XXXXX521]", "[XXXXX522]", "[XXXXX523]", "[XXXXX524]", "[XXXXX525]", "[XXXXX526]", "[XXXXX527]", "[XXXXX528]", "[XXXXX529]", "[XXXXX530]", "[XXXXX531]", "[XXXXX532]", "[XXXXX533]", "[XXXXX534]", "[XXXXX535]", "[XXXXX536]", "[XXXXX537]", "[XXXXX538]", "[XXXXX539]", "[XXXXX540]", "[XXXXX541]", "[XXXXX542]", "[XXXXX543]", "[XXXXX544]", "[XXXXX545]", "[XXXXX546]", "[XXXXX547]", "[XXXXX548]", "[XXXXX549]", "[XXXXX550]", "[XXXXX551]", "[XXXXX552]", "[XXXXX553]", "[XXXXX554]", "[XXXXX555]", "[XXXXX556]", "[XXXXX557]", "[XXXXX558]", "[XXXXX559]", "[XXXXX560]", "[XXXXX561]", "[XXXXX562]", "[XXXXX563]", "[XXXXX564]", "[XXXXX565]", "[XXXXX566]", "[XXXXX567]", "[XXXXX568]", "[XXXXX569]", "[XXXXX570]", "[XXXXX571]", "[XXXXX572]", "[XXXXX573]", "[XXXXX574]", "[XXXXX575]", "[XXXXX576]", "[XXXXX577]", "[XXXXX578]", "[XXXXX579]", "[XXXXX580]", "[XXXXX581]", "[XXXXX582]", "[XXXXX583]", "[XXXXX584]", "[XXXXX585]", "[XXXXX586]", "[XXXXX587]", "[XXXXX588]", "[XXXXX589]", "[XXXXX590]", "[XXXXX591]", "[XXXXX592]", "[XXXXX593]", "[XXXXX594]", "[XXXXX595]", "[XXXXX596]", "[XXXXX597]", "[XXXXX598]", "[XXXXX599]", "[XXXXX600]", "[XXXXX601]", "[XXXXX602]", "[XXXXX603]", "[XXXXX604]", "[XXXXX605]", "[XXXXX606]", "[XXXXX607]", "[XXXXX608]", "[XXXXX609]", "[XXXXX610]", "[XXXXX611]", "[XXXXX612]", "[XXXXX613]", "[XXXXX614]", "[XXXXX615]", "[XXXXX616]", "[XXXXX617]", "[XXXXX618]", "[XXXXX619]", "[XXXXX620]", "[XXXXX621]", "[XXXXX622]", "[XXXXX623]", "[XXXXX624]", "[XXXXX625]", "[XXXXX626]", "[XXXXX627]", "[XXXXX628]", "[XXXXX629]", "[XXXXX630]", "[XXXXX631]", "[XXXXX632]", "[XXXXX633]", "[XXXXX634]", "[XXXXX635]", "[XXXXX636]", "[XXXXX637]", "[XXXXX638]", "[XXXXX639]", "[XXXXX640]", "[XXXXX641]", "[XXXXX642]", "[XXXXX643]", "[XXXXX644]", "[XXXXX645]", "[XXXXX646]", "[XXXXX647]", "[XXXXX648]", "[XXXXX649]", "[XXXXX650]", "[XXXXX651]", "[XXXXX652]", "[XXXXX653]", "[XXXXX654]", "[XXXXX655]", "[XXXXX656]", "[XXXXX657]", "[XXXXX658]", "[XXXXX659]", "[XXXXX660]", "[XXXXX661]", "[XXXXX662]", "[XXXXX663]", "[XXXXX664]", "[XXXXX665]", "[XXXXX666]", "[XXXXX667]", "[XXXXX668]", "[XXXXX669]", "[XXXXX670]", "[XXXXX671]", "[XXXXX672]", "[XXXXX673]", "[XXXXX674]", "[XXXXX675]", "[XXXXX676]", "[XXXXX677]", "[XXXXX678]", "[XXXXX679]", "[XXXXX680]", "[XXXXX681]", "[XXXXX682]", "[XXXXX683]", "[XXXXX684]", "[XXXXX685]", "[XXXXX686]", "[XXXXX687]", "[XXXXX688]", "[XXXXX689]", "[XXXXX690]", "[XXXXX691]", "[XXXXX692]", "[XXXXX693]", "[XXXXX694]", "[XXXXX695]", "[XXXXX696]", "[XXXXX697]", "[XXXXX698]", "[XXXXX699]", "[XXXXX700]", "[XXXXX701]", "[XXXXX702]", "[XXXXX703]", "[XXXXX704]", "[XXXXX705]", "[XXXXX706]", "[XXXXX707]", "[XXXXX708]", "[XXXXX709]", "[XXXXX710]", "[XXXXX711]", "[XXXXX712]", "[XXXXX713]", "[XXXXX714]", "[XXXXX715]", "[XXXXX716]", "[XXXXX717]", "[XXXXX718]", "[XXXXX719]", "[XXXXX720]", "[XXXXX721]", "[XXXXX722]", "[XXXXX723]", "[XXXXX724]", "[XXXXX725]", "[XXXXX726]", "[XXXXX727]", "[XXXXX728]", "[XXXXX729]", "[XXXXX730]", "[XXXXX731]", "[XXXXX732]", "[XXXXX733]", "[XXXXX734]", "[XXXXX735]", "[XXXXX736]", "[XXXXX737]", "[XXXXX738]", "[XXXXX739]", "[XXXXX740]", "[XXXXX741]", "[XXXXX742]", "[XXXXX743]", "[XXXXX744]", "[XXXXX745]", "[XXXXX746]", "[XXXXX747]", "[XXXXX748]", "[XXXXX749]", "[XXXXX750]", "[XXXXX751]", "[XXXXX752]", "[XXXXX753]", "[XXXXX754]", "[XXXXX755]", "[XXXXX756]", "[XXXXX757]", "[XXXXX758]", "[XXXXX759]", "[XXXXX760]", "[XXXXX761]", "[XXXXX762]", "[XXXXX763]", "[XXXXX764]", "[XXXXX765]", "[XXXXX766]", "[XXXXX767]", "[XXXXX768]", "[XXXXX769]", "[XXXXX770]", "[XXXXX771]", "[XXXXX772]", "[XXXXX773]", "[XXXXX774]", "[XXXXX775]", "[XXXXX776]", "[XXXXX777]", "[XXXXX778]", "[XXXXX779]", "[XXXXX780]", "[XXXXX781]", "[XXXXX782]", "[XXXXX783]", "[XXXXX784]", "[XXXXX785]", "[XXXXX786]", "[XXXXX787]", "[XXXXX788]", "[XXXXX789]", "[XXXXX790]", "[XXXXX791]", "[XXXXX792]", "[XXXXX793]", "[XXXXX794]", "[XXXXX795]", "[XXXXX796]", "[XXXXX797]", "[XXXXX798]", "[XXXXX799]", "[XXXXX800]", "[XXXXX801]", "[XXXXX802]", "[XXXXX803]", "[XXXXX804]", "[XXXXX805]", "[XXXXX806]", "[XXXXX807]", "[XXXXX808]", "[XXXXX809]", "[XXXXX810]", "[XXXXX811]", "[XXXXX812]", "[XXXXX813]", "[XXXXX814]", "[XXXXX815]", "[XXXXX816]", "[XXXXX817]", "[XXXXX818]", "[XXXXX819]", "[XXXXX820]", "[XXXXX821]", "[XXXXX822]", "[XXXXX823]", "[XXXXX824]", "[XXXXX825]", "[XXXXX826]", "[XXXXX827]", "[XXXXX828]", "[XXXXX829]", "[XXXXX830]", "[XXXXX831]", "[XXXXX832]", "[XXXXX833]", "[XXXXX834]", "[XXXXX835]", "[XXXXX836]", "[XXXXX837]", "[XXXXX838]", "[XXXXX839]", "[XXXXX840]", "[XXXXX841]", "[XXXXX842]", "[XXXXX843]", "[XXXXX844]", "[XXXXX845]", "[XXXXX846]", "[XXXXX847]", "[XXXXX848]", "[XXXXX849]", "[XXXXX850]", "[XXXXX851]", "[XXXXX852]", "[XXXXX853]", "[XXXXX854]", "[XXXXX855]", "[XXXXX856]", "[XXXXX857]", "[XXXXX858]", "[XXXXX859]", "[XXXXX860]", "[XXXXX861]", "[XXXXX862]", "[XXXXX863]", "[XXXXX864]", "[XXXXX865]", "[XXXXX866]", "[XXXXX867]", "[XXXXX868]", "[XXXXX869]", "[XXXXX870]", "[XXXXX871]", "[XXXXX872]", "[XXXXX873]", "[XXXXX874]", "[XXXXX875]", "[XXXXX876]", "[XXXXX877]", "[XXXXX878]", "[XXXXX879]", "[XXXXX880]", "[XXXXX881]", "[XXXXX882]", "[XXXXX883]", "[XXXXX884]", "[XXXXX885]", "[XXXXX886]", "[XXXXX887]", "[XXXXX888]", "[XXXXX889]", "[XXXXX890]", "[XXXXX891]", "[XXXXX892]", "[XXXXX893]", "[XXXXX894]", "[XXXXX895]", "[XXXXX896]", "[XXXXX897]", "[XXXXX898]", "[XXXXX899]", "[XXXXX900]", "[XXXXX901]", "[XXXXX902]", "[XXXXX903]", "[XXXXX904]", "[XXXXX905]", "[XXXXX906]", "[XXXXX907]", "[XXXXX908]", "[XXXXX909]", "[XXXXX910]", "[XXXXX911]", "[XXXXX912]", "[XXXXX913]", "[XXXXX914]", "[XXXXX915]", "[XXXXX916]", "[XXXXX917]", "[XXXXX918]", "[XXXXX919]", "[XXXXX920]", "[XXXXX921]", "[XXXXX922]", "[XXXXX923]", "[XXXXX924]", "[XXXXX925]", "[XXXXX926]", "[XXXXX927]", "[XXXXX928]", "[XXXXX929]", "[XXXXX930]", "[XXXXX931]", "[XXXXX932]", "[XXXXX933]", "[XXXXX934]", "[XXXXX935]", "[XXXXX936]", "[XXXXX937]", "[XXXXX938]", "[XXXXX939]", "[XXXXX940]", "[XXXXX941]", "[XXXXX942]", "[XXXXX943]", "[XXXXX944]", "[XXXXX945]", "[XXXXX946]", "[XXXXX947]", "[XXXXX948]", "[XXXXX949]", "[XXXXX950]", "[XXXXX951]", "[XXXXX952]", "[XXXXX953]", "[XXXXX954]", "[XXXXX955]", "[XXXXX956]", "[XXXXX957]", "[XXXXX958]", "[XXXXX959]", "[XXXXX960]", "[XXXXX961]", "[XXXXX962]", "[XXXXX963]", "[XXXXX964]", "[XXXXX965]", "[XXXXX966]", "[XXXXX967]", "[XXXXX968]", "[XXXXX969]", "[XXXXX970]", "[XXXXX971]", "[XXXXX972]", "[XXXXX973]", "[XXXXX974]", "[XXXXX975]", "[XXXXX976]", "[XXXXX977]", "[XXXXX978]", "[XXXXX979]", "[XXXXX980]", "[XXXXX981]", "[XXXXX982]", "[XXXXX983]", "[XXXXX984]", "[XXXXX985]", "[XXXXX986]", "[XXXXX987]", "[XXXXX988]", "[XXXXX989]", "[XXXXX990]", "[XXXXX991]", "[XXXXX992]", "[XXXXX993]", "[XXXXX994]", "[XXXXX995]", "[XXXXX996]", "[XXXXX997]", "[XXXXX998]", "[XXXXX999]", "[XXXXX1000]", "[XXXXX1001]", "[XXXXX1002]", "[XXXXX1003]", "[XXXXX1004]", "[XXXXX1005]", "[XXXXX1006]", "[XXXXX1007]", "[XXXXX1008]", "[XXXXX1009]", "[XXXXX1010]", "[XXXXX1011]", "[XXXXX1012]", "[XXXXX1013]", "[XXXXX1014]", "[XXXXX1015]", "[XXXXX1016]", "[XXXXX1017]", "[XXXXX1018]", "[XXXXX1019]", "[XXXXX1020]", "[XXXXX1021]", "[XXXXX1022]", "[XXXXX1023]", "[XXXXX1024]", "[XXXXX1025]", "[XXXXX1026]", "[XXXXX1027]", "[XXXXX1028]", "[XXXXX1029]", "[XXXXX1030]", "[XXXXX1031]", "[XXXXX1032]", "[XXXXX1033]", "[XXXXX1034]", "[XXXXX1035]", "[XXXXX1036]", "[XXXXX1037]", "[XXXXX1038]", "[XXXXX1039]", "[XXXXX1040]", "[XXXXX1041]", "[XXXXX1042]", "[XXXXX1043]", "[XXXXX1044]", "[XXXXX1045]", "[XXXXX1046]", "[XXXXX1047]", "[XXXXX1048]", "[XXXXX1049]", "[XXXXX1050]", "[XXXXX1051]", "[XXXXX1052]", "[XXXXX1053]", "[XXXXX1054]", "[XXXXX1055]", "[XXXXX1056]", "[XXXXX1057]", "[XXXXX1058]", "[XXXXX1059]", "[XXXXX1060]", "[XXXXX1061]", "[XXXXX1062]", "[XXXXX1063]", "[XXXXX1064]", "[XXXXX1065]", "[XXXXX1066]", "[XXXXX1067]"]}
|
spiece.model
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3078c0a57f7cad63a8c415df0607ce6b0389cf0346899d034504cca74ab73494
|
3 |
+
size 1027832
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"do_lower_case": false, "remove_space": true, "keep_accents": true, "bos_token": "[CLS]", "eos_token": "[SEP]", "unk_token": "<unk>", "sep_token": "[SEP]", "pad_token": "<pad>", "cls_token": "[CLS]", "mask_token": {"content": "[MASK]", "single_word": false, "lstrip": true, "rstrip": false, "normalized": false, "__type": "AddedToken"}, "sp_model_kwargs": {}, "name_or_path": "models/10mb/ton_latn_10mb", "model_input_names": ["input_ids", "attention_mask"], "special_tokens_map_file": "models/10mb/ton_latn_10mb/special_tokens_map.json", "tokenizer_class": "AlbertTokenizer"}
|