goldfish-models
commited on
Commit
•
f302c09
1
Parent(s):
d180375
Upload lus_latn_5mb tokenizer.
Browse files- added_tokens.json +1 -0
- special_tokens_map.json +1 -0
- spiece.model +3 -0
- tokenizer.json +0 -0
- tokenizer_config.json +1 -0
added_tokens.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"[XXXXX701]": 48661, "[XXXXX283]": 48243, "[XXXXX344]": 48304, "[XXXXX882]": 48842, "[XXXXX359]": 48319, "[XXXXX440]": 48400, "[XXXXX951]": 48911, "[XXXXX146]": 48106, "[XXXXX593]": 48553, "[XXXXX1035]": 48995, "[XXXXX917]": 48877, "[XXXXX1026]": 48986, "[XXXXX245]": 48205, "[XXXXX812]": 48772, "[XXXXX1070]": 49030, "[XXXXX709]": 48669, "[XXXXX827]": 48787, "[XXXXX615]": 48575, "[XXXXX472]": 48432, "[XXXXX860]": 48820, "[XXXXX1073]": 49033, "[XXXXX366]": 48326, "[XXXXX581]": 48541, "[XXXXX179]": 48139, "[XXXXX670]": 48630, "[XXXXX1173]": 49133, "[XXXXX1166]": 49126, "[XXXXX741]": 48701, "[XXXXX427]": 48387, "[XXXXX656]": 48616, "[XXXXX1179]": 49139, "[XXXXX829]": 48789, "[XXXXX31]": 47991, "[XXXXX541]": 48501, "[XXXXX415]": 48375, "[XXXXX537]": 48497, "[XXXXX1109]": 49069, "[XXXXX641]": 48601, "[XXXXX964]": 48924, "[XXXXX121]": 48081, "[XXXXX1012]": 48972, "[XXXXX787]": 48747, "[XXXXX608]": 48568, "[XXXXX10]": 47970, "[XXXXX213]": 48173, "[XXXXX70]": 48030, "[XXXXX1008]": 48968, "[XXXXX164]": 48124, "[XXXXX675]": 48635, "[XXXXX79]": 48039, "[XXXXX1094]": 49054, "[XXXXX861]": 48821, "[XXXXX57]": 48017, "[XXXXX1097]": 49057, "[XXXXX247]": 48207, "[XXXXX341]": 48301, "[XXXXX51]": 48011, "[XXXXX1049]": 49009, "[XXXXX64]": 48024, "[XXXXX391]": 48351, "[XXXXX198]": 48158, "[XXXXX798]": 48758, "[XXXXX187]": 48147, "[XXXXX319]": 48279, "[XXXXX749]": 48709, "[XXXXX874]": 48834, "[XXXXX851]": 48811, "[XXXXX922]": 48882, "[XXXXX71]": 48031, "[XXXXX417]": 48377, "[XXXXX281]": 48241, "[XXXXX419]": 48379, "[XXXXX989]": 48949, "[XXXXX943]": 48903, "[XXXXX1055]": 49015, "[XXXXX1077]": 49037, "[XXXXX474]": 48434, "[XXXXX508]": 48468, "[XXXXX1123]": 49083, "[XXXXX1131]": 49091, "[XXXXX949]": 48909, "[XXXXX982]": 48942, "[XXXXX1112]": 49072, "[XXXXX555]": 48515, "[XXXXX274]": 48234, "[XXXXX425]": 48385, "[XXXXX1148]": 49108, "[XXXXX408]": 48368, "[XXXXX673]": 48633, "[XXXXX309]": 48269, "[XXXXX1188]": 49148, "[XXXXX799]": 48759, "[XXXXX328]": 48288, "[XXXXX316]": 48276, "[XXXXX1158]": 49118, "[XXXXX773]": 48733, "[XXXXX758]": 48718, "[XXXXX814]": 48774, "[XXXXX920]": 48880, "[XXXXX618]": 48578, "[XXXXX191]": 48151, "[XXXXX575]": 48535, "[XXXXX1127]": 49087, "[XXXXX357]": 48317, "[XXXXX844]": 48804, "[XXXXX312]": 48272, "[XXXXX862]": 48822, "[XXXXX984]": 48944, "[XXXXX921]": 48881, "[XXXXX307]": 48267, "[XXXXX409]": 48369, "[XXXXX499]": 48459, "[XXXXX630]": 48590, "[XXXXX1184]": 49144, "[XXXXX763]": 48723, "[XXXXX434]": 48394, "[XXXXX39]": 47999, "[XXXXX783]": 48743, "[XXXXX255]": 48215, "[XXXXX150]": 48110, "[XXXXX1024]": 48984, "[XXXXX1023]": 48983, "[XXXXX744]": 48704, "[XXXXX1031]": 48991, "[XXXXX546]": 48506, "[XXXXX708]": 48668, "[SEP]": 47957, "[XXXXX990]": 48950, "[XXXXX210]": 48170, "[XXXXX1029]": 48989, "[XXXXX377]": 48337, "[XXXXX102]": 48062, "[XXXXX770]": 48730, "[XXXXX1102]": 49062, "[XXXXX204]": 48164, "[XXXXX711]": 48671, "[XXXXX67]": 48027, "[XXXXX105]": 48065, "[XXXXX1107]": 49067, "[XXXXX1155]": 49115, "[XXXXX317]": 48277, "[XXXXX88]": 48048, "[XXXXX617]": 48577, "[XXXXX451]": 48411, "[XXXXX1132]": 49092, "[XXXXX351]": 48311, "[XXXXX1153]": 49113, "[XXXXX1126]": 49086, "[XXXXX591]": 48551, "[XXXXX535]": 48495, "[XXXXX321]": 48281, "[XXXXX804]": 48764, "[XXXXX110]": 48070, "[XXXXX487]": 48447, "[XXXXX209]": 48169, "[XXXXX9]": 47969, "[XXXXX445]": 48405, "[XXXXX158]": 48118, "[XXXXX721]": 48681, "[XXXXX757]": 48717, "[XXXXX864]": 48824, "[XXXXX231]": 48191, "[XXXXX594]": 48554, "[XXXXX863]": 48823, "[XXXXX781]": 48741, "[XXXXX1160]": 49120, "[XXXXX948]": 48908, "[XXXXX477]": 48437, "[XXXXX697]": 48657, "[XXXXX601]": 48561, "[XXXXX1089]": 49049, "[XXXXX934]": 48894, "[XXXXX343]": 48303, "[XXXXX22]": 47982, "[XXXXX251]": 48211, "[XXXXX392]": 48352, "[XXXXX965]": 48925, "[XXXXX509]": 48469, "[XXXXX199]": 48159, "[XXXXX893]": 48853, "[XXXXX999]": 48959, "[XXXXX908]": 48868, "[XXXXX1013]": 48973, "[XXXXX777]": 48737, "[XXXXX219]": 48179, "[XXXXX262]": 48222, "[XXXXX745]": 48705, "[XXXXX1038]": 48998, "[XXXXX897]": 48857, "[XXXXX237]": 48197, "[XXXXX884]": 48844, "[XXXXX667]": 48627, "[XXXXX968]": 48928, "[XXXXX683]": 48643, "[XXXXX569]": 48529, "[XXXXX382]": 48342, "[XXXXX739]": 48699, "[XXXXX295]": 48255, "[XXXXX866]": 48826, "[XXXXX665]": 48625, "[XXXXX223]": 48183, "[XXXXX742]": 48702, "[XXXXX93]": 48053, "[XXXXX857]": 48817, "[XXXXX926]": 48886, "[XXXXX269]": 48229, "[XXXXX871]": 48831, "[XXXXX294]": 48254, "[XXXXX700]": 48660, "[XXXXX205]": 48165, "[XXXXX376]": 48336, "[XXXXX1144]": 49104, "[XXXXX914]": 48874, "[XXXXX132]": 48092, "[XXXXX886]": 48846, "[XXXXX439]": 48399, "[XXXXX839]": 48799, "[XXXXX923]": 48883, "[XXXXX494]": 48454, "[XXXXX642]": 48602, "[XXXXX1092]": 49052, "[XXXXX435]": 48395, "[XXXXX1108]": 49068, "[XXXXX717]": 48677, "[XXXXX1111]": 49071, "[XXXXX188]": 48148, "[XXXXX831]": 48791, "[XXXXX590]": 48550, "[XXXXX62]": 48022, "[XXXXX994]": 48954, "[XXXXX901]": 48861, "[XXXXX734]": 48694, "[XXXXX136]": 48096, "[XXXXX819]": 48779, "[XXXXX695]": 48655, "[XXXXX998]": 48958, "[XXXXX682]": 48642, "[XXXXX443]": 48403, "[XXXXX599]": 48559, "[XXXXX389]": 48349, "[XXXXX413]": 48373, "[XXXXX1122]": 49082, "[XXXXX872]": 48832, "[XXXXX123]": 48083, "[XXXXX297]": 48257, "[XXXXX230]": 48190, "[XXXXX1079]": 49039, "[XXXXX378]": 48338, "[XXXXX502]": 48462, "[XXXXX671]": 48631, "[XXXXX75]": 48035, "[XXXXX730]": 48690, "[XXXXX761]": 48721, "[XXXXX766]": 48726, "[XXXXX597]": 48557, "[XXXXX315]": 48275, "[XXXXX803]": 48763, "[XXXXX291]": 48251, "[XXXXX566]": 48526, "[XXXXX1147]": 49107, "[XXXXX1064]": 49024, "[XXXXX1116]": 49076, "[XXXXX372]": 48332, "[XXXXX148]": 48108, "[XXXXX881]": 48841, "[XXXXX704]": 48664, "[XXXXX631]": 48591, "[XXXXX313]": 48273, "[XXXXX4]": 47964, "[XXXXX1083]": 49043, "[XXXXX311]": 48271, "[XXXXX49]": 48009, "[XXXXX1135]": 49095, "[XXXXX55]": 48015, "[XXXXX813]": 48773, "[XXXXX459]": 48419, "[XXXXX310]": 48270, "[XXXXX510]": 48470, "[XXXXX1171]": 49131, "[XXXXX693]": 48653, "[XXXXX27]": 47987, "[XXXXX1002]": 48962, "[XXXXX298]": 48258, "[XXXXX1000]": 48960, "[XXXXX1051]": 49011, "[XXXXX623]": 48583, "[XXXXX8]": 47968, "[XXXXX784]": 48744, "[XXXXX756]": 48716, "[XXXXX292]": 48252, "[XXXXX3]": 47963, "[XXXXX14]": 47974, "[XXXXX258]": 48218, "[XXXXX1115]": 49075, "[XXXXX475]": 48435, "[XXXXX547]": 48507, "[XXXXX645]": 48605, "[XXXXX662]": 48622, "[XXXXX760]": 48720, "[XXXXX265]": 48225, "[XXXXX222]": 48182, "[XXXXX1072]": 49032, "[XXXXX373]": 48333, "[XXXXX833]": 48793, "[XXXXX558]": 48518, "[XXXXX651]": 48611, "[XXXXX464]": 48424, "[XXXXX215]": 48175, "[XXXXX648]": 48608, "[XXXXX549]": 48509, "[XXXXX116]": 48076, "[XXXXX1174]": 49134, "[XXXXX43]": 48003, "[XXXXX952]": 48912, "[XXXXX227]": 48187, "[XXXXX559]": 48519, "[XXXXX1142]": 49102, "[XXXXX542]": 48502, "[XXXXX36]": 47996, "[XXXXX753]": 48713, "[XXXXX992]": 48952, "[XXXXX24]": 47984, "[XXXXX548]": 48508, "[XXXXX793]": 48753, "[XXXXX523]": 48483, "[XXXXX1060]": 49020, "[XXXXX365]": 48325, "[XXXXX520]": 48480, "[XXXXX107]": 48067, "[XXXXX511]": 48471, "[XXXXX963]": 48923, "[XXXXX1190]": 49150, "[XXXXX196]": 48156, "[XXXXX299]": 48259, "[XXXXX1161]": 49121, "[XXXXX186]": 48146, "[XXXXX737]": 48697, "[XXXXX73]": 48033, "[XXXXX1061]": 49021, "[XXXXX143]": 48103, "[XXXXX325]": 48285, "[XXXXX1071]": 49031, "[XXXXX501]": 48461, "[XXXXX462]": 48422, "[XXXXX1017]": 48977, "[XXXXX104]": 48064, "[XXXXX395]": 48355, "[XXXXX126]": 48086, "[XXXXX119]": 48079, "[XXXXX38]": 47998, "[XXXXX21]": 47981, "[XXXXX1169]": 49129, "[XXXXX473]": 48433, "[XXXXX939]": 48899, "[XXXXX221]": 48181, "[XXXXX853]": 48813, "[XXXXX644]": 48604, "[XXXXX1176]": 49136, "[XXXXX1156]": 49116, "[XXXXX484]": 48444, "[XXXXX907]": 48867, "[XXXXX1004]": 48964, "[XXXXX691]": 48651, "[XXXXX397]": 48357, "[XXXXX167]": 48127, "[XXXXX412]": 48372, "[XXXXX1011]": 48971, "[XXXXX837]": 48797, "[XXXXX129]": 48089, "[XXXXX895]": 48855, "[XXXXX988]": 48948, "[XXXXX301]": 48261, "[XXXXX266]": 48226, "[XXXXX1134]": 49094, "[XXXXX257]": 48217, "[XXXXX746]": 48706, "[XXXXX87]": 48047, "[XXXXX446]": 48406, "[XXXXX416]": 48376, "[XXXXX707]": 48667, "[XXXXX337]": 48297, "[XXXXX18]": 47978, "[XXXXX528]": 48488, "[XXXXX979]": 48939, "[XXXXX82]": 48042, "[XXXXX128]": 48088, "[XXXXX211]": 48171, "[XXXXX563]": 48523, "[XXXXX386]": 48346, "[XXXXX12]": 47972, "[XXXXX1048]": 49008, "[XXXXX141]": 48101, "[XXXXX894]": 48854, "[XXXXX720]": 48680, "[XXXXX676]": 48636, "[XXXXX889]": 48849, "[XXXXX928]": 48888, "[XXXXX117]": 48077, "[XXXXX1014]": 48974, "[XXXXX267]": 48227, "[XXXXX790]": 48750, "[XXXXX666]": 48626, "[XXXXX333]": 48293, "[XXXXX873]": 48833, "[XXXXX969]": 48929, "[XXXXX677]": 48637, "[XXXXX66]": 48026, "[XXXXX256]": 48216, "[XXXXX290]": 48250, "[XXXXX30]": 47990, "[XXXXX406]": 48366, "[XXXXX856]": 48816, "[XXXXX491]": 48451, "[XXXXX498]": 48458, "[XXXXX868]": 48828, "[XXXXX483]": 48443, "[XXXXX1007]": 48967, "[XXXXX525]": 48485, "[XXXXX275]": 48235, "[XXXXX1034]": 48994, "[XXXXX605]": 48565, "[XXXXX111]": 48071, "[XXXXX930]": 48890, "[XXXXX169]": 48129, "[XXXXX437]": 48397, "[XXXXX940]": 48900, "[XXXXX1124]": 49084, "[XXXXX273]": 48233, "[XXXXX975]": 48935, "[XXXXX385]": 48345, "[XXXXX465]": 48425, "[XXXXX879]": 48839, "[XXXXX1133]": 49093, "[XXXXX330]": 48290, "[XXXXX114]": 48074, "[XXXXX1099]": 49059, "[XXXXX152]": 48112, "[XXXXX429]": 48389, "[XXXXX654]": 48614, "[XXXXX767]": 48727, "[XXXXX775]": 48735, "[XXXXX61]": 48021, "[XXXXX194]": 48154, "[XXXXX936]": 48896, "[XXXXX1015]": 48975, "[XXXXX805]": 48765, "[XXXXX183]": 48143, "[XXXXX561]": 48521, "[XXXXX125]": 48085, "[XXXXX13]": 47973, "[XXXXX348]": 48308, "[XXXXX1086]": 49046, "[XXXXX1054]": 49014, "[XXXXX903]": 48863, "[XXXXX138]": 48098, "[XXXXX56]": 48016, "[XXXXX115]": 48075, "[XXXXX137]": 48097, "[XXXXX101]": 48061, "[XXXXX867]": 48827, "[XXXXX620]": 48580, "[XXXXX974]": 48934, "[XXXXX240]": 48200, "[XXXXX1120]": 49080, "[XXXXX692]": 48652, "[XXXXX828]": 48788, "[XXXXX241]": 48201, "[XXXXX99]": 48059, "[XXXXX282]": 48242, "[XXXXX966]": 48926, "[XXXXX1163]": 49123, "[XXXXX685]": 48645, "[XXXXX1046]": 49006, "[XXXXX398]": 48358, "[XXXXX752]": 48712, "[XXXXX582]": 48542, "[XXXXX96]": 48056, "[XXXXX503]": 48463, "[XXXXX1052]": 49012, "[XXXXX1080]": 49040, "[XXXXX1044]": 49004, "[XXXXX471]": 48431, "[XXXXX98]": 48058, "[XXXXX214]": 48174, "[XXXXX1189]": 49149, "[XXXXX1130]": 49090, "[XXXXX1033]": 48993, "[XXXXX250]": 48210, "[XXXXX259]": 48219, "[XXXXX538]": 48498, "[XXXXX589]": 48549, "[XXXXX16]": 47976, "[XXXXX1047]": 49007, "[XXXXX140]": 48100, "[XXXXX680]": 48640, "[XXXXX1152]": 49112, "[XXXXX248]": 48208, "[XXXXX20]": 47980, "[XXXXX595]": 48555, "[XXXXX405]": 48365, "[XXXXX944]": 48904, "[XXXXX192]": 48152, "[XXXXX946]": 48906, "[XXXXX699]": 48659, "[XXXXX529]": 48489, "[XXXXX1006]": 48966, "[XXXXX479]": 48439, "[XXXXX801]": 48761, "[XXXXX514]": 48474, "[XXXXX202]": 48162, "[XXXXX714]": 48674, "[XXXXX627]": 48587, "[XXXXX463]": 48423, "[XXXXX170]": 48130, "[XXXXX1018]": 48978, "[XXXXX834]": 48794, "[XXXXX849]": 48809, "[XXXXX380]": 48340, "[XXXXX736]": 48696, "[XXXXX347]": 48307, "[XXXXX573]": 48533, "[XXXXX840]": 48800, "[XXXXX168]": 48128, "[XXXXX242]": 48202, "[XXXXX955]": 48915, "[XXXXX1039]": 48999, "[XXXXX878]": 48838, "[XXXXX1100]": 49060, "[XXXXX776]": 48736, "[XXXXX63]": 48023, "[XXXXX600]": 48560, "[XXXXX550]": 48510, "[XXXXX6]": 47966, "[XXXXX1050]": 49010, "[XXXXX534]": 48494, "[XXXXX500]": 48460, "[XXXXX836]": 48796, "[XXXXX228]": 48188, "[XXXXX41]": 48001, "[XXXXX108]": 48068, "[XXXXX835]": 48795, "[XXXXX68]": 48028, "[XXXXX1098]": 49058, "[XXXXX904]": 48864, "[XXXXX587]": 48547, "[XXXXX628]": 48588, "[XXXXX820]": 48780, "[XXXXX1154]": 49114, "[XXXXX48]": 48008, "[XXXXX157]": 48117, "[XXXXX133]": 48093, "[XXXXX778]": 48738, "[XXXXX622]": 48582, "[XXXXX272]": 48232, "[XXXXX431]": 48391, "[XXXXX1125]": 49085, "[XXXXX551]": 48511, "[XXXXX669]": 48629, "[XXXXX1030]": 48990, "[XXXXX512]": 48472, "[XXXXX482]": 48442, "[XXXXX388]": 48348, "[XXXXX1040]": 49000, "[XXXXX225]": 48185, "[XXXXX824]": 48784, "[XXXXX588]": 48548, "[MASK]": 47959, "[XXXXX1025]": 48985, "[XXXXX1053]": 49013, "[XXXXX1010]": 48970, "[XXXXX553]": 48513, "[XXXXX702]": 48662, "[XXXXX637]": 48597, "[XXXXX1181]": 49141, "[XXXXX972]": 48932, "[XXXXX1062]": 49022, "[XXXXX496]": 48456, "[XXXXX72]": 48032, "[XXXXX792]": 48752, "[XXXXX270]": 48230, "[XXXXX592]": 48552, "[XXXXX339]": 48299, "[XXXXX46]": 48006, "[XXXXX754]": 48714, "[XXXXX185]": 48145, "[XXXXX539]": 48499, "[XXXXX854]": 48814, "[XXXXX687]": 48647, "[XXXXX340]": 48300, "[XXXXX109]": 48069, "[XXXXX100]": 48060, "[XXXXX355]": 48315, "[XXXXX650]": 48610, "[XXXXX870]": 48830, "[XXXXX80]": 48040, "[XXXXX1121]": 49081, "[XXXXX28]": 47988, "[XXXXX172]": 48132, "[XXXXX454]": 48414, "[XXXXX815]": 48775, "[XXXXX774]": 48734, "[XXXXX134]": 48094, "[XXXXX1074]": 49034, "[XXXXX271]": 48231, "[XXXXX604]": 48564, "[XXXXX438]": 48398, "[XXXXX956]": 48916, "[XXXXX441]": 48401, "[XXXXX1043]": 49003, "[XXXXX155]": 48115, "[XXXXX830]": 48790, "[XXXXX180]": 48140, "[XXXXX342]": 48302, "[XXXXX296]": 48256, "[XXXXX1182]": 49142, "[XXXXX794]": 48754, "[XXXXX329]": 48289, "[XXXXX243]": 48203, "[XXXXX876]": 48836, "[XXXXX1085]": 49045, "[XXXXX327]": 48287, "[XXXXX679]": 48639, "[XXXXX207]": 48167, "[XXXXX633]": 48593, "[XXXXX476]": 48436, "[XXXXX779]": 48739, "[XXXXX738]": 48698, "[XXXXX1068]": 49028, "[XXXXX1065]": 49025, "[XXXXX703]": 48663, "[XXXXX995]": 48955, "[XXXXX1145]": 49105, "[XXXXX276]": 48236, "[XXXXX806]": 48766, "[XXXXX401]": 48361, "[XXXXX1081]": 49041, "[XXXXX334]": 48294, "[XXXXX1022]": 48982, "[XXXXX156]": 48116, "[XXXXX1082]": 49042, "[XXXXX909]": 48869, "[XXXXX846]": 48806, "[XXXXX203]": 48163, "[XXXXX800]": 48760, "[XXXXX1151]": 49111, "[XXXXX896]": 48856, "[XXXXX678]": 48638, "[XXXXX103]": 48063, "[XXXXX460]": 48420, "[XXXXX808]": 48768, "[XXXXX200]": 48160, "[XXXXX807]": 48767, "[XXXXX751]": 48711, "[XXXXX733]": 48693, "[XXXXX40]": 48000, "[XXXXX354]": 48314, "[XXXXX127]": 48087, "[XXXXX458]": 48418, "[XXXXX411]": 48371, "[XXXXX381]": 48341, "[XXXXX1137]": 49097, "[XXXXX90]": 48050, "[XXXXX931]": 48891, "[XXXXX176]": 48136, "[XXXXX953]": 48913, "[XXXXX580]": 48540, "[XXXXX782]": 48742, "[XXXXX394]": 48354, "[XXXXX11]": 47971, "[XXXXX924]": 48884, "[XXXXX619]": 48579, "[XXXXX765]": 48725, "[XXXXX1093]": 49053, "[XXXXX364]": 48324, "[XXXXX706]": 48666, "[XXXXX436]": 48396, "[XXXXX399]": 48359, "[XXXXX331]": 48291, "[XXXXX913]": 48873, "[XXXXX314]": 48274, "[XXXXX869]": 48829, "[XXXXX1087]": 49047, "[XXXXX453]": 48413, "[XXXXX91]": 48051, "[XXXXX577]": 48537, "[XXXXX838]": 48798, "[XXXXX625]": 48585, "[XXXXX404]": 48364, "[XXXXX74]": 48034, "[XXXXX448]": 48408, "[XXXXX694]": 48654, "[XXXXX507]": 48467, "[XXXXX217]": 48177, "[XXXXX361]": 48321, "[XXXXX578]": 48538, "[XXXXX363]": 48323, "[XXXXX602]": 48562, "[XXXXX379]": 48339, "[XXXXX771]": 48731, "[XXXXX710]": 48670, "[XXXXX466]": 48426, "[XXXXX570]": 48530, "[XXXXX1021]": 48981, "[XXXXX855]": 48815, "[XXXXX420]": 48380, "[XXXXX318]": 48278, "[XXXXX832]": 48792, "[XXXXX175]": 48135, "[XXXXX336]": 48296, "[XXXXX950]": 48910, "[XXXXX705]": 48665, "[XXXXX865]": 48825, "[XXXXX1139]": 49099, "[XXXXX1067]": 49027, "[XXXXX37]": 47997, "[XXXXX489]": 48449, "[XXXXX544]": 48504, "[XXXXX957]": 48917, "[XXXXX764]": 48724, "[XXXXX960]": 48920, "[XXXXX430]": 48390, "[XXXXX941]": 48901, "[XXXXX1183]": 49143, "[XXXXX748]": 48708, "[XXXXX1057]": 49017, "[XXXXX154]": 48114, "[XXXXX1129]": 49089, "[XXXXX246]": 48206, "[XXXXX352]": 48312, "[XXXXX987]": 48947, "[XXXXX452]": 48412, "[XXXXX585]": 48545, "[XXXXX153]": 48113, "[XXXXX1157]": 49117, "[XXXXX178]": 48138, "[XXXXX636]": 48596, "[XXXXX47]": 48007, "[XXXXX190]": 48150, "[XXXXX526]": 48486, "[XXXXX1003]": 48963, "[XXXXX1149]": 49109, "[XXXXX522]": 48482, "[XXXXX345]": 48305, "[XXXXX983]": 48943, "[XXXXX959]": 48919, "[XXXXX15]": 47975, "[XXXXX1177]": 49137, "[XXXXX712]": 48672, "[XXXXX26]": 47986, "[XXXXX113]": 48073, "[XXXXX1119]": 49079, "[XXXXX568]": 48528, "[XXXXX493]": 48453, "[XXXXX77]": 48037, "[XXXXX788]": 48748, "[XXXXX5]": 47965, "[XXXXX915]": 48875, "[XXXXX289]": 48249, "[XXXXX905]": 48865, "[XXXXX576]": 48536, "[XXXXX826]": 48786, "[XXXXX610]": 48570, "[XXXXX1045]": 49005, "[XXXXX643]": 48603, "[XXXXX370]": 48330, "[XXXXX579]": 48539, "[XXXXX338]": 48298, "[XXXXX1168]": 49128, "[XXXXX518]": 48478, "[XXXXX421]": 48381, "[XXXXX562]": 48522, "[XXXXX609]": 48569, "[XXXXX967]": 48927, "[XXXXX303]": 48263, "[XXXXX407]": 48367, "[XXXXX1066]": 49026, "[XXXXX400]": 48360, "[XXXXX23]": 47983, "[XXXXX962]": 48922, "[XXXXX980]": 48940, "[XXXXX1076]": 49036, "[XXXXX360]": 48320, "[XXXXX358]": 48318, "[XXXXX664]": 48624, "[XXXXX725]": 48685, "[XXXXX743]": 48703, "[XXXXX574]": 48534, "[XXXXX981]": 48941, "[XXXXX640]": 48600, "[XXXXX332]": 48292, "[XXXXX147]": 48107, "[XXXXX606]": 48566, "[XXXXX478]": 48438, "[XXXXX54]": 48014, "[XXXXX424]": 48384, "[XXXXX490]": 48450, "[XXXXX719]": 48679, "[XXXXX1140]": 49100, "[XXXXX390]": 48350, "[XXXXX750]": 48710, "[XXXXX686]": 48646, "[XXXXX1187]": 49147, "[XXXXX891]": 48851, "[XXXXX193]": 48153, "[XXXXX842]": 48802, "[XXXXX120]": 48080, "[XXXXX253]": 48213, "[XXXXX450]": 48410, "[XXXXX696]": 48656, "[XXXXX583]": 48543, "[XXXXX791]": 48751, "[XXXXX718]": 48678, "<pad>": 47958, "[XXXXX727]": 48687, "[XXXXX403]": 48363, "[XXXXX728]": 48688, "[XXXXX106]": 48066, "[XXXXX444]": 48404, "[XXXXX455]": 48415, "[XXXXX65]": 48025, "[XXXXX1143]": 49103, "[XXXXX822]": 48782, "[XXXXX552]": 48512, "[XXXXX252]": 48212, "[XXXXX25]": 47985, "[XXXXX286]": 48246, "[XXXXX85]": 48045, "[XXXXX492]": 48452, "[XXXXX60]": 48020, "[XXXXX368]": 48328, "[XXXXX89]": 48049, "[XXXXX384]": 48344, "[XXXXX263]": 48223, "[XXXXX571]": 48531, "[XXXXX954]": 48914, "[XXXXX638]": 48598, "[XXXXX1056]": 49016, "[XXXXX621]": 48581, "[XXXXX724]": 48684, "[XXXXX130]": 48090, "[XXXXX335]": 48295, "[XXXXX488]": 48448, "[XXXXX260]": 48220, "[XXXXX1128]": 49088, "[XXXXX1075]": 49035, "[XXXXX306]": 48266, "[XXXXX906]": 48866, "[XXXXX433]": 48393, "[XXXXX1180]": 49140, "[XXXXX536]": 48496, "[XXXXX516]": 48476, "[XXXXX461]": 48421, "[XXXXX698]": 48658, "[XXXXX1110]": 49070, "[XXXXX1159]": 49119, "[XXXXX369]": 48329, "[XXXXX324]": 48284, "[XXXXX32]": 47992, "[XXXXX495]": 48455, "[XXXXX802]": 48762, "[XXXXX504]": 48464, "[XXXXX50]": 48010, "[XXXXX689]": 48649, "[XXXXX1042]": 49002, "[XXXXX229]": 48189, "[XXXXX280]": 48240, "[XXXXX755]": 48715, "[XXXXX1104]": 49064, "[XXXXX887]": 48847, "[XXXXX163]": 48123, "[XXXXX442]": 48402, "[XXXXX818]": 48778, "[XXXXX174]": 48134, "[XXXXX937]": 48897, "[XXXXX1020]": 48980, "[XXXXX249]": 48209, "[XXXXX557]": 48517, "[XXXXX1164]": 49124, "[XXXXX236]": 48196, "[XXXXX467]": 48427, "[XXXXX42]": 48002, "[XXXXX238]": 48198, "[XXXXX612]": 48572, "[XXXXX233]": 48193, "[XXXXX632]": 48592, "[XXXXX367]": 48327, "[XXXXX1146]": 49106, "[XXXXX607]": 48567, "[XXXXX976]": 48936, "[XXXXX899]": 48859, "[XXXXX614]": 48574, "[XXXXX160]": 48120, "[XXXXX978]": 48938, "[XXXXX1001]": 48961, "[XXXXX29]": 47989, "[XXXXX1191]": 49151, "[XXXXX1059]": 49019, "[XXXXX1016]": 48976, "[XXXXX785]": 48745, "[XXXXX118]": 48078, "[XXXXX418]": 48378, "[XXXXX929]": 48889, "[XXXXX19]": 47979, "[XXXXX985]": 48945, "[XXXXX1106]": 49066, "[XXXXX1088]": 49048, "[XXXXX858]": 48818, "[XXXXX1118]": 49078, "[XXXXX112]": 48072, "[XXXXX244]": 48204, "[XXXXX346]": 48306, "[XXXXX716]": 48676, "[XXXXX497]": 48457, "[XXXXX942]": 48902, "[XXXXX362]": 48322, "[XXXXX457]": 48417, "[XXXXX688]": 48648, "[XXXXX293]": 48253, "[XXXXX224]": 48184, "[XXXXX584]": 48544, "[XXXXX649]": 48609, "[XXXXX300]": 48260, "[XXXXX305]": 48265, "[XXXXX135]": 48095, "[XXXXX59]": 48019, "[XXXXX17]": 47977, "[XXXXX33]": 47993, "[XXXXX277]": 48237, "[XXXXX387]": 48347, "[XXXXX997]": 48957, "[XXXXX811]": 48771, "[XXXXX786]": 48746, "[XXXXX145]": 48105, "[XXXXX986]": 48946, "[XXXXX1032]": 48992, "[XXXXX506]": 48466, "[XXXXX892]": 48852, "[XXXXX423]": 48383, "[XXXXX208]": 48168, "[XXXXX486]": 48446, "[XXXXX220]": 48180, "[XXXXX795]": 48755, "[XXXXX84]": 48044, "[XXXXX1090]": 49050, "[XXXXX747]": 48707, "[XXXXX769]": 48729, "[XXXXX422]": 48382, "[XXXXX759]": 48719, "[XXXXX564]": 48524, "[XXXXX481]": 48441, "[XXXXX1150]": 49110, "[XXXXX254]": 48214, "[XXXXX635]": 48595, "[XXXXX95]": 48055, "[XXXXX910]": 48870, "[XXXXX1063]": 49023, "[XXXXX216]": 48176, "[XXXXX624]": 48584, "[XXXXX1069]": 49029, "[XXXXX888]": 48848, "[XXXXX684]": 48644, "[XXXXX517]": 48477, "[XXXXX816]": 48776, "[XXXXX396]": 48356, "[XXXXX659]": 48619, "[XXXXX166]": 48126, "[XXXXX1091]": 49051, "[XXXXX94]": 48054, "[XXXXX810]": 48770, "[XXXXX613]": 48573, "[XXXXX1105]": 49065, "[XXXXX181]": 48141, "[XXXXX58]": 48018, "[XXXXX308]": 48268, "[XXXXX78]": 48038, "[XXXXX690]": 48650, "[XXXXX349]": 48309, "[XXXXX189]": 48149, "[XXXXX825]": 48785, "[XXXXX918]": 48878, "[XXXXX912]": 48872, "[XXXXX817]": 48777, "[XXXXX268]": 48228, "[XXXXX674]": 48634, "[XXXXX184]": 48144, "[XXXXX519]": 48479, "[XXXXX235]": 48195, "[XXXXX898]": 48858, "[XXXXX197]": 48157, "[XXXXX515]": 48475, "[XXXXX232]": 48192, "[XXXXX1186]": 49146, "[XXXXX970]": 48930, "[XXXXX657]": 48617, "[XXXXX151]": 48111, "[XXXXX672]": 48632, "[XXXXX841]": 48801, "[XXXXX470]": 48430, "[XXXXX34]": 47994, "[XXXXX182]": 48142, "[XXXXX797]": 48757, "[XXXXX521]": 48481, "[XXXXX726]": 48686, "[XXXXX1019]": 48979, "[XXXXX165]": 48125, "[XXXXX1058]": 49018, "[XXXXX530]": 48490, "[XXXXX572]": 48532, "[XXXXX402]": 48362, "[XXXXX524]": 48484, "[XXXXX845]": 48805, "[XXXXX159]": 48119, "[XXXXX239]": 48199, "[XXXXX206]": 48166, "[XXXXX611]": 48571, "[XXXXX731]": 48691, "[XXXXX1138]": 49098, "[XXXXX663]": 48623, "[XXXXX261]": 48221, "[XXXXX505]": 48465, "[XXXXX53]": 48013, "[XXXXX426]": 48386, "[XXXXX288]": 48248, "[XXXXX821]": 48781, "[XXXXX284]": 48244, "[XXXXX932]": 48892, "[XXXXX850]": 48810, "[XXXXX375]": 48335, "[XXXXX859]": 48819, "[XXXXX639]": 48599, "[XXXXX768]": 48728, "[XXXXX1185]": 49145, "[XXXXX772]": 48732, "[XXXXX780]": 48740, "[XXXXX533]": 48493, "[XXXXX1096]": 49056, "[XXXXX1095]": 49055, "[XXXXX647]": 48607, "[XXXXX938]": 48898, "[XXXXX139]": 48099, "[XXXXX911]": 48871, "[XXXXX1037]": 48997, "[XXXXX902]": 48862, "[XXXXX848]": 48808, "[XXXXX356]": 48316, "[XXXXX634]": 48594, "[XXXXX540]": 48500, "[XXXXX1005]": 48965, "[XXXXX847]": 48807, "[XXXXX449]": 48409, "[XXXXX973]": 48933, "[XXXXX852]": 48812, "[XXXXX1165]": 49125, "[XXXXX69]": 48029, "[XXXXX371]": 48331, "[XXXXX468]": 48428, "[XXXXX142]": 48102, "[XXXXX596]": 48556, "[XXXXX1172]": 49132, "[XXXXX131]": 48091, "[XXXXX2]": 47962, "[XXXXX234]": 48194, "[XXXXX432]": 48392, "[XXXXX586]": 48546, "[XXXXX278]": 48238, "[XXXXX1113]": 49073, "[XXXXX616]": 48576, "[XXXXX565]": 48525, "[XXXXX264]": 48224, "[XXXXX531]": 48491, "[XXXXX958]": 48918, "[XXXXX480]": 48440, "[XXXXX1103]": 49063, "[XXXXX1101]": 49061, "[XXXXX374]": 48334, "[XXXXX428]": 48388, "[XXXXX161]": 48121, "[XXXXX173]": 48133, "[XXXXX933]": 48893, "[XXXXX1028]": 48988, "[XXXXX527]": 48487, "[XXXXX567]": 48527, "[XXXXX661]": 48621, "[XXXXX900]": 48860, "[XXXXX713]": 48673, "[XXXXX823]": 48783, "[XXXXX1078]": 49038, "[XXXXX740]": 48700, "[XXXXX554]": 48514, "[XXXXX883]": 48843, "[XXXXX383]": 48343, "[XXXXX653]": 48613, "[XXXXX149]": 48109, "[XXXXX660]": 48620, "[XXXXX171]": 48131, "[XXXXX890]": 48850, "[XXXXX81]": 48041, "[XXXXX212]": 48172, "[XXXXX789]": 48749, "[XXXXX545]": 48505, "[XXXXX885]": 48845, "[XXXXX414]": 48374, "[XXXXX927]": 48887, "[XXXXX843]": 48803, "[XXXXX919]": 48879, "[XXXXX122]": 48082, "[XXXXX320]": 48280, "[XXXXX556]": 48516, "[XXXXX285]": 48245, "[XXXXX1178]": 49138, "[XXXXX729]": 48689, "[XXXXX195]": 48155, "[XXXXX877]": 48837, "[XXXXX456]": 48416, "[XXXXX1136]": 49096, "[XXXXX1114]": 49074, "[XXXXX945]": 48905, "[XXXXX1141]": 49101, "[XXXXX993]": 48953, "[XXXXX1041]": 49001, "[XXXXX1167]": 49127, "[XXXXX393]": 48353, "[XXXXX875]": 48835, "[XXXXX732]": 48692, "[XXXXX1170]": 49130, "[XXXXX162]": 48122, "[XXXXX947]": 48907, "[XXXXX668]": 48628, "[XXXXX762]": 48722, "[XXXXX86]": 48046, "[XXXXX469]": 48429, "[XXXXX809]": 48769, "[XXXXX655]": 48615, "[CLS]": 47956, "[XXXXX44]": 48004, "[XXXXX35]": 47995, "[XXXXX201]": 48161, "[XXXXX410]": 48370, "[XXXXX350]": 48310, "[XXXXX1027]": 48987, "[XXXXX1]": 47961, "[XXXXX560]": 48520, "[XXXXX646]": 48606, "[XXXXX485]": 48445, "[XXXXX723]": 48683, "[XXXXX977]": 48937, "[XXXXX52]": 48012, "[XXXXX1084]": 49044, "[XXXXX124]": 48084, "[XXXXX598]": 48558, "[XXXXX629]": 48589, "[XXXXX513]": 48473, "[XXXXX83]": 48043, "[XXXXX991]": 48951, "[XXXXX658]": 48618, "[XXXXX1009]": 48969, "[XXXXX1117]": 49077, "[XXXXX652]": 48612, "[XXXXX287]": 48247, "[XXXXX935]": 48895, "[XXXXX722]": 48682, "[XXXXX543]": 48503, "[XXXXX92]": 48052, "[XXXXX304]": 48264, "[XXXXX925]": 48885, "[XXXXX532]": 48492, "[XXXXX735]": 48695, "[XXXXX1162]": 49122, "[XXXXX279]": 48239, "[XXXXX45]": 48005, "[XXXXX302]": 48262, "[XXXXX916]": 48876, "[XXXXX971]": 48931, "[XXXXX0]": 47960, "[XXXXX323]": 48283, "[XXXXX1036]": 48996, "[XXXXX880]": 48840, "[XXXXX796]": 48756, "[XXXXX7]": 47967, "[XXXXX681]": 48641, "[XXXXX626]": 48586, "[XXXXX144]": 48104, "[XXXXX218]": 48178, "[XXXXX226]": 48186, "[XXXXX326]": 48286, "[XXXXX177]": 48137, "[XXXXX996]": 48956, "[XXXXX97]": 48057, "[XXXXX447]": 48407, "[XXXXX1175]": 49135, "[XXXXX715]": 48675, "[XXXXX961]": 48921, "[XXXXX322]": 48282, "[XXXXX353]": 48313, "[XXXXX603]": 48563, "[XXXXX76]": 48036}
|
special_tokens_map.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"bos_token": "[CLS]", "eos_token": "[SEP]", "unk_token": "<unk>", "sep_token": "[SEP]", "pad_token": "<pad>", "cls_token": "[CLS]", "mask_token": {"content": "[MASK]", "single_word": false, "lstrip": true, "rstrip": false, "normalized": false}, "additional_special_tokens": ["[XXXXX0]", "[XXXXX1]", "[XXXXX2]", "[XXXXX3]", "[XXXXX4]", "[XXXXX5]", "[XXXXX6]", "[XXXXX7]", "[XXXXX8]", "[XXXXX9]", "[XXXXX10]", "[XXXXX11]", "[XXXXX12]", "[XXXXX13]", "[XXXXX14]", "[XXXXX15]", "[XXXXX16]", "[XXXXX17]", "[XXXXX18]", "[XXXXX19]", "[XXXXX20]", "[XXXXX21]", "[XXXXX22]", "[XXXXX23]", "[XXXXX24]", "[XXXXX25]", "[XXXXX26]", "[XXXXX27]", "[XXXXX28]", "[XXXXX29]", "[XXXXX30]", "[XXXXX31]", "[XXXXX32]", "[XXXXX33]", "[XXXXX34]", "[XXXXX35]", "[XXXXX36]", "[XXXXX37]", "[XXXXX38]", "[XXXXX39]", "[XXXXX40]", "[XXXXX41]", "[XXXXX42]", "[XXXXX43]", "[XXXXX44]", "[XXXXX45]", "[XXXXX46]", "[XXXXX47]", "[XXXXX48]", "[XXXXX49]", "[XXXXX50]", "[XXXXX51]", "[XXXXX52]", "[XXXXX53]", "[XXXXX54]", "[XXXXX55]", "[XXXXX56]", "[XXXXX57]", "[XXXXX58]", "[XXXXX59]", "[XXXXX60]", "[XXXXX61]", "[XXXXX62]", "[XXXXX63]", "[XXXXX64]", "[XXXXX65]", "[XXXXX66]", "[XXXXX67]", "[XXXXX68]", "[XXXXX69]", "[XXXXX70]", "[XXXXX71]", "[XXXXX72]", "[XXXXX73]", "[XXXXX74]", "[XXXXX75]", "[XXXXX76]", "[XXXXX77]", "[XXXXX78]", "[XXXXX79]", "[XXXXX80]", "[XXXXX81]", "[XXXXX82]", "[XXXXX83]", "[XXXXX84]", "[XXXXX85]", "[XXXXX86]", "[XXXXX87]", "[XXXXX88]", "[XXXXX89]", "[XXXXX90]", "[XXXXX91]", "[XXXXX92]", "[XXXXX93]", "[XXXXX94]", "[XXXXX95]", "[XXXXX96]", "[XXXXX97]", "[XXXXX98]", "[XXXXX99]", "[XXXXX100]", "[XXXXX101]", "[XXXXX102]", "[XXXXX103]", "[XXXXX104]", "[XXXXX105]", "[XXXXX106]", "[XXXXX107]", "[XXXXX108]", "[XXXXX109]", "[XXXXX110]", "[XXXXX111]", "[XXXXX112]", "[XXXXX113]", "[XXXXX114]", "[XXXXX115]", "[XXXXX116]", "[XXXXX117]", "[XXXXX118]", "[XXXXX119]", "[XXXXX120]", "[XXXXX121]", "[XXXXX122]", "[XXXXX123]", "[XXXXX124]", "[XXXXX125]", "[XXXXX126]", "[XXXXX127]", "[XXXXX128]", "[XXXXX129]", "[XXXXX130]", "[XXXXX131]", "[XXXXX132]", "[XXXXX133]", "[XXXXX134]", "[XXXXX135]", "[XXXXX136]", "[XXXXX137]", "[XXXXX138]", "[XXXXX139]", "[XXXXX140]", "[XXXXX141]", "[XXXXX142]", "[XXXXX143]", "[XXXXX144]", "[XXXXX145]", "[XXXXX146]", "[XXXXX147]", "[XXXXX148]", "[XXXXX149]", "[XXXXX150]", "[XXXXX151]", "[XXXXX152]", "[XXXXX153]", "[XXXXX154]", "[XXXXX155]", "[XXXXX156]", "[XXXXX157]", "[XXXXX158]", "[XXXXX159]", "[XXXXX160]", "[XXXXX161]", "[XXXXX162]", "[XXXXX163]", "[XXXXX164]", "[XXXXX165]", "[XXXXX166]", "[XXXXX167]", "[XXXXX168]", "[XXXXX169]", "[XXXXX170]", "[XXXXX171]", "[XXXXX172]", "[XXXXX173]", "[XXXXX174]", "[XXXXX175]", "[XXXXX176]", "[XXXXX177]", "[XXXXX178]", "[XXXXX179]", "[XXXXX180]", "[XXXXX181]", "[XXXXX182]", "[XXXXX183]", "[XXXXX184]", "[XXXXX185]", "[XXXXX186]", "[XXXXX187]", "[XXXXX188]", "[XXXXX189]", "[XXXXX190]", "[XXXXX191]", "[XXXXX192]", "[XXXXX193]", "[XXXXX194]", "[XXXXX195]", "[XXXXX196]", "[XXXXX197]", "[XXXXX198]", "[XXXXX199]", "[XXXXX200]", "[XXXXX201]", "[XXXXX202]", "[XXXXX203]", "[XXXXX204]", "[XXXXX205]", "[XXXXX206]", "[XXXXX207]", "[XXXXX208]", "[XXXXX209]", "[XXXXX210]", "[XXXXX211]", "[XXXXX212]", "[XXXXX213]", "[XXXXX214]", "[XXXXX215]", "[XXXXX216]", "[XXXXX217]", "[XXXXX218]", "[XXXXX219]", "[XXXXX220]", "[XXXXX221]", "[XXXXX222]", "[XXXXX223]", "[XXXXX224]", "[XXXXX225]", "[XXXXX226]", "[XXXXX227]", "[XXXXX228]", "[XXXXX229]", "[XXXXX230]", "[XXXXX231]", "[XXXXX232]", "[XXXXX233]", "[XXXXX234]", "[XXXXX235]", "[XXXXX236]", "[XXXXX237]", "[XXXXX238]", "[XXXXX239]", "[XXXXX240]", "[XXXXX241]", "[XXXXX242]", "[XXXXX243]", "[XXXXX244]", "[XXXXX245]", "[XXXXX246]", "[XXXXX247]", "[XXXXX248]", "[XXXXX249]", "[XXXXX250]", "[XXXXX251]", "[XXXXX252]", "[XXXXX253]", "[XXXXX254]", "[XXXXX255]", "[XXXXX256]", "[XXXXX257]", "[XXXXX258]", "[XXXXX259]", "[XXXXX260]", "[XXXXX261]", "[XXXXX262]", "[XXXXX263]", "[XXXXX264]", "[XXXXX265]", "[XXXXX266]", "[XXXXX267]", "[XXXXX268]", "[XXXXX269]", "[XXXXX270]", "[XXXXX271]", "[XXXXX272]", "[XXXXX273]", "[XXXXX274]", "[XXXXX275]", "[XXXXX276]", "[XXXXX277]", "[XXXXX278]", "[XXXXX279]", "[XXXXX280]", "[XXXXX281]", "[XXXXX282]", "[XXXXX283]", "[XXXXX284]", "[XXXXX285]", "[XXXXX286]", "[XXXXX287]", "[XXXXX288]", "[XXXXX289]", "[XXXXX290]", "[XXXXX291]", "[XXXXX292]", "[XXXXX293]", "[XXXXX294]", "[XXXXX295]", "[XXXXX296]", "[XXXXX297]", "[XXXXX298]", "[XXXXX299]", "[XXXXX300]", "[XXXXX301]", "[XXXXX302]", "[XXXXX303]", "[XXXXX304]", "[XXXXX305]", "[XXXXX306]", "[XXXXX307]", "[XXXXX308]", "[XXXXX309]", "[XXXXX310]", "[XXXXX311]", "[XXXXX312]", "[XXXXX313]", "[XXXXX314]", "[XXXXX315]", "[XXXXX316]", "[XXXXX317]", "[XXXXX318]", "[XXXXX319]", "[XXXXX320]", "[XXXXX321]", "[XXXXX322]", "[XXXXX323]", "[XXXXX324]", "[XXXXX325]", "[XXXXX326]", "[XXXXX327]", "[XXXXX328]", "[XXXXX329]", "[XXXXX330]", "[XXXXX331]", "[XXXXX332]", "[XXXXX333]", "[XXXXX334]", "[XXXXX335]", "[XXXXX336]", "[XXXXX337]", "[XXXXX338]", "[XXXXX339]", "[XXXXX340]", "[XXXXX341]", "[XXXXX342]", "[XXXXX343]", "[XXXXX344]", "[XXXXX345]", "[XXXXX346]", "[XXXXX347]", "[XXXXX348]", "[XXXXX349]", "[XXXXX350]", "[XXXXX351]", "[XXXXX352]", "[XXXXX353]", "[XXXXX354]", "[XXXXX355]", "[XXXXX356]", "[XXXXX357]", "[XXXXX358]", "[XXXXX359]", "[XXXXX360]", "[XXXXX361]", "[XXXXX362]", "[XXXXX363]", "[XXXXX364]", "[XXXXX365]", "[XXXXX366]", "[XXXXX367]", "[XXXXX368]", "[XXXXX369]", "[XXXXX370]", "[XXXXX371]", "[XXXXX372]", "[XXXXX373]", "[XXXXX374]", "[XXXXX375]", "[XXXXX376]", "[XXXXX377]", "[XXXXX378]", "[XXXXX379]", "[XXXXX380]", "[XXXXX381]", "[XXXXX382]", "[XXXXX383]", "[XXXXX384]", "[XXXXX385]", "[XXXXX386]", "[XXXXX387]", "[XXXXX388]", "[XXXXX389]", "[XXXXX390]", "[XXXXX391]", "[XXXXX392]", "[XXXXX393]", "[XXXXX394]", "[XXXXX395]", "[XXXXX396]", "[XXXXX397]", "[XXXXX398]", "[XXXXX399]", "[XXXXX400]", "[XXXXX401]", "[XXXXX402]", "[XXXXX403]", "[XXXXX404]", "[XXXXX405]", "[XXXXX406]", "[XXXXX407]", "[XXXXX408]", "[XXXXX409]", "[XXXXX410]", "[XXXXX411]", "[XXXXX412]", "[XXXXX413]", "[XXXXX414]", "[XXXXX415]", "[XXXXX416]", "[XXXXX417]", "[XXXXX418]", "[XXXXX419]", "[XXXXX420]", "[XXXXX421]", "[XXXXX422]", "[XXXXX423]", "[XXXXX424]", "[XXXXX425]", "[XXXXX426]", "[XXXXX427]", "[XXXXX428]", "[XXXXX429]", "[XXXXX430]", "[XXXXX431]", "[XXXXX432]", "[XXXXX433]", "[XXXXX434]", "[XXXXX435]", "[XXXXX436]", "[XXXXX437]", "[XXXXX438]", "[XXXXX439]", "[XXXXX440]", "[XXXXX441]", "[XXXXX442]", "[XXXXX443]", "[XXXXX444]", "[XXXXX445]", "[XXXXX446]", "[XXXXX447]", "[XXXXX448]", "[XXXXX449]", "[XXXXX450]", "[XXXXX451]", "[XXXXX452]", "[XXXXX453]", "[XXXXX454]", "[XXXXX455]", "[XXXXX456]", "[XXXXX457]", "[XXXXX458]", "[XXXXX459]", "[XXXXX460]", "[XXXXX461]", "[XXXXX462]", "[XXXXX463]", "[XXXXX464]", "[XXXXX465]", "[XXXXX466]", "[XXXXX467]", "[XXXXX468]", "[XXXXX469]", "[XXXXX470]", "[XXXXX471]", "[XXXXX472]", "[XXXXX473]", "[XXXXX474]", "[XXXXX475]", "[XXXXX476]", "[XXXXX477]", "[XXXXX478]", "[XXXXX479]", "[XXXXX480]", "[XXXXX481]", "[XXXXX482]", "[XXXXX483]", "[XXXXX484]", "[XXXXX485]", "[XXXXX486]", "[XXXXX487]", "[XXXXX488]", "[XXXXX489]", "[XXXXX490]", "[XXXXX491]", "[XXXXX492]", "[XXXXX493]", "[XXXXX494]", "[XXXXX495]", "[XXXXX496]", "[XXXXX497]", "[XXXXX498]", "[XXXXX499]", "[XXXXX500]", "[XXXXX501]", "[XXXXX502]", "[XXXXX503]", "[XXXXX504]", "[XXXXX505]", "[XXXXX506]", "[XXXXX507]", "[XXXXX508]", "[XXXXX509]", "[XXXXX510]", "[XXXXX511]", "[XXXXX512]", "[XXXXX513]", "[XXXXX514]", "[XXXXX515]", "[XXXXX516]", "[XXXXX517]", "[XXXXX518]", "[XXXXX519]", "[XXXXX520]", "[XXXXX521]", "[XXXXX522]", "[XXXXX523]", "[XXXXX524]", "[XXXXX525]", "[XXXXX526]", "[XXXXX527]", "[XXXXX528]", "[XXXXX529]", "[XXXXX530]", "[XXXXX531]", "[XXXXX532]", "[XXXXX533]", "[XXXXX534]", "[XXXXX535]", "[XXXXX536]", "[XXXXX537]", "[XXXXX538]", "[XXXXX539]", "[XXXXX540]", "[XXXXX541]", "[XXXXX542]", "[XXXXX543]", "[XXXXX544]", "[XXXXX545]", "[XXXXX546]", "[XXXXX547]", "[XXXXX548]", "[XXXXX549]", "[XXXXX550]", "[XXXXX551]", "[XXXXX552]", "[XXXXX553]", "[XXXXX554]", "[XXXXX555]", "[XXXXX556]", "[XXXXX557]", "[XXXXX558]", "[XXXXX559]", "[XXXXX560]", "[XXXXX561]", "[XXXXX562]", "[XXXXX563]", "[XXXXX564]", "[XXXXX565]", "[XXXXX566]", "[XXXXX567]", "[XXXXX568]", "[XXXXX569]", "[XXXXX570]", "[XXXXX571]", "[XXXXX572]", "[XXXXX573]", "[XXXXX574]", "[XXXXX575]", "[XXXXX576]", "[XXXXX577]", "[XXXXX578]", "[XXXXX579]", "[XXXXX580]", "[XXXXX581]", "[XXXXX582]", "[XXXXX583]", "[XXXXX584]", "[XXXXX585]", "[XXXXX586]", "[XXXXX587]", "[XXXXX588]", "[XXXXX589]", "[XXXXX590]", "[XXXXX591]", "[XXXXX592]", "[XXXXX593]", "[XXXXX594]", "[XXXXX595]", "[XXXXX596]", "[XXXXX597]", "[XXXXX598]", "[XXXXX599]", "[XXXXX600]", "[XXXXX601]", "[XXXXX602]", "[XXXXX603]", "[XXXXX604]", "[XXXXX605]", "[XXXXX606]", "[XXXXX607]", "[XXXXX608]", "[XXXXX609]", "[XXXXX610]", "[XXXXX611]", "[XXXXX612]", "[XXXXX613]", "[XXXXX614]", "[XXXXX615]", "[XXXXX616]", "[XXXXX617]", "[XXXXX618]", "[XXXXX619]", "[XXXXX620]", "[XXXXX621]", "[XXXXX622]", "[XXXXX623]", "[XXXXX624]", "[XXXXX625]", "[XXXXX626]", "[XXXXX627]", "[XXXXX628]", "[XXXXX629]", "[XXXXX630]", "[XXXXX631]", "[XXXXX632]", "[XXXXX633]", "[XXXXX634]", "[XXXXX635]", "[XXXXX636]", "[XXXXX637]", "[XXXXX638]", "[XXXXX639]", "[XXXXX640]", "[XXXXX641]", "[XXXXX642]", "[XXXXX643]", "[XXXXX644]", "[XXXXX645]", "[XXXXX646]", "[XXXXX647]", "[XXXXX648]", "[XXXXX649]", "[XXXXX650]", "[XXXXX651]", "[XXXXX652]", "[XXXXX653]", "[XXXXX654]", "[XXXXX655]", "[XXXXX656]", "[XXXXX657]", "[XXXXX658]", "[XXXXX659]", "[XXXXX660]", "[XXXXX661]", "[XXXXX662]", "[XXXXX663]", "[XXXXX664]", "[XXXXX665]", "[XXXXX666]", "[XXXXX667]", "[XXXXX668]", "[XXXXX669]", "[XXXXX670]", "[XXXXX671]", "[XXXXX672]", "[XXXXX673]", "[XXXXX674]", "[XXXXX675]", "[XXXXX676]", "[XXXXX677]", "[XXXXX678]", "[XXXXX679]", "[XXXXX680]", "[XXXXX681]", "[XXXXX682]", "[XXXXX683]", "[XXXXX684]", "[XXXXX685]", "[XXXXX686]", "[XXXXX687]", "[XXXXX688]", "[XXXXX689]", "[XXXXX690]", "[XXXXX691]", "[XXXXX692]", "[XXXXX693]", "[XXXXX694]", "[XXXXX695]", "[XXXXX696]", "[XXXXX697]", "[XXXXX698]", "[XXXXX699]", "[XXXXX700]", "[XXXXX701]", "[XXXXX702]", "[XXXXX703]", "[XXXXX704]", "[XXXXX705]", "[XXXXX706]", "[XXXXX707]", "[XXXXX708]", "[XXXXX709]", "[XXXXX710]", "[XXXXX711]", "[XXXXX712]", "[XXXXX713]", "[XXXXX714]", "[XXXXX715]", "[XXXXX716]", "[XXXXX717]", "[XXXXX718]", "[XXXXX719]", "[XXXXX720]", "[XXXXX721]", "[XXXXX722]", "[XXXXX723]", "[XXXXX724]", "[XXXXX725]", "[XXXXX726]", "[XXXXX727]", "[XXXXX728]", "[XXXXX729]", "[XXXXX730]", "[XXXXX731]", "[XXXXX732]", "[XXXXX733]", "[XXXXX734]", "[XXXXX735]", "[XXXXX736]", "[XXXXX737]", "[XXXXX738]", "[XXXXX739]", "[XXXXX740]", "[XXXXX741]", "[XXXXX742]", "[XXXXX743]", "[XXXXX744]", "[XXXXX745]", "[XXXXX746]", "[XXXXX747]", "[XXXXX748]", "[XXXXX749]", "[XXXXX750]", "[XXXXX751]", "[XXXXX752]", "[XXXXX753]", "[XXXXX754]", "[XXXXX755]", "[XXXXX756]", "[XXXXX757]", "[XXXXX758]", "[XXXXX759]", "[XXXXX760]", "[XXXXX761]", "[XXXXX762]", "[XXXXX763]", "[XXXXX764]", "[XXXXX765]", "[XXXXX766]", "[XXXXX767]", "[XXXXX768]", "[XXXXX769]", "[XXXXX770]", "[XXXXX771]", "[XXXXX772]", "[XXXXX773]", "[XXXXX774]", "[XXXXX775]", "[XXXXX776]", "[XXXXX777]", "[XXXXX778]", "[XXXXX779]", "[XXXXX780]", "[XXXXX781]", "[XXXXX782]", "[XXXXX783]", "[XXXXX784]", "[XXXXX785]", "[XXXXX786]", "[XXXXX787]", "[XXXXX788]", "[XXXXX789]", "[XXXXX790]", "[XXXXX791]", "[XXXXX792]", "[XXXXX793]", "[XXXXX794]", "[XXXXX795]", "[XXXXX796]", "[XXXXX797]", "[XXXXX798]", "[XXXXX799]", "[XXXXX800]", "[XXXXX801]", "[XXXXX802]", "[XXXXX803]", "[XXXXX804]", "[XXXXX805]", "[XXXXX806]", "[XXXXX807]", "[XXXXX808]", "[XXXXX809]", "[XXXXX810]", "[XXXXX811]", "[XXXXX812]", "[XXXXX813]", "[XXXXX814]", "[XXXXX815]", "[XXXXX816]", "[XXXXX817]", "[XXXXX818]", "[XXXXX819]", "[XXXXX820]", "[XXXXX821]", "[XXXXX822]", "[XXXXX823]", "[XXXXX824]", "[XXXXX825]", "[XXXXX826]", "[XXXXX827]", "[XXXXX828]", "[XXXXX829]", "[XXXXX830]", "[XXXXX831]", "[XXXXX832]", "[XXXXX833]", "[XXXXX834]", "[XXXXX835]", "[XXXXX836]", "[XXXXX837]", "[XXXXX838]", "[XXXXX839]", "[XXXXX840]", "[XXXXX841]", "[XXXXX842]", "[XXXXX843]", "[XXXXX844]", "[XXXXX845]", "[XXXXX846]", "[XXXXX847]", "[XXXXX848]", "[XXXXX849]", "[XXXXX850]", "[XXXXX851]", "[XXXXX852]", "[XXXXX853]", "[XXXXX854]", "[XXXXX855]", "[XXXXX856]", "[XXXXX857]", "[XXXXX858]", "[XXXXX859]", "[XXXXX860]", "[XXXXX861]", "[XXXXX862]", "[XXXXX863]", "[XXXXX864]", "[XXXXX865]", "[XXXXX866]", "[XXXXX867]", "[XXXXX868]", "[XXXXX869]", "[XXXXX870]", "[XXXXX871]", "[XXXXX872]", "[XXXXX873]", "[XXXXX874]", "[XXXXX875]", "[XXXXX876]", "[XXXXX877]", "[XXXXX878]", "[XXXXX879]", "[XXXXX880]", "[XXXXX881]", "[XXXXX882]", "[XXXXX883]", "[XXXXX884]", "[XXXXX885]", "[XXXXX886]", "[XXXXX887]", "[XXXXX888]", "[XXXXX889]", "[XXXXX890]", "[XXXXX891]", "[XXXXX892]", "[XXXXX893]", "[XXXXX894]", "[XXXXX895]", "[XXXXX896]", "[XXXXX897]", "[XXXXX898]", "[XXXXX899]", "[XXXXX900]", "[XXXXX901]", "[XXXXX902]", "[XXXXX903]", "[XXXXX904]", "[XXXXX905]", "[XXXXX906]", "[XXXXX907]", "[XXXXX908]", "[XXXXX909]", "[XXXXX910]", "[XXXXX911]", "[XXXXX912]", "[XXXXX913]", "[XXXXX914]", "[XXXXX915]", "[XXXXX916]", "[XXXXX917]", "[XXXXX918]", "[XXXXX919]", "[XXXXX920]", "[XXXXX921]", "[XXXXX922]", "[XXXXX923]", "[XXXXX924]", "[XXXXX925]", "[XXXXX926]", "[XXXXX927]", "[XXXXX928]", "[XXXXX929]", "[XXXXX930]", "[XXXXX931]", "[XXXXX932]", "[XXXXX933]", "[XXXXX934]", "[XXXXX935]", "[XXXXX936]", "[XXXXX937]", "[XXXXX938]", "[XXXXX939]", "[XXXXX940]", "[XXXXX941]", "[XXXXX942]", "[XXXXX943]", "[XXXXX944]", "[XXXXX945]", "[XXXXX946]", "[XXXXX947]", "[XXXXX948]", "[XXXXX949]", "[XXXXX950]", "[XXXXX951]", "[XXXXX952]", "[XXXXX953]", "[XXXXX954]", "[XXXXX955]", "[XXXXX956]", "[XXXXX957]", "[XXXXX958]", "[XXXXX959]", "[XXXXX960]", "[XXXXX961]", "[XXXXX962]", "[XXXXX963]", "[XXXXX964]", "[XXXXX965]", "[XXXXX966]", "[XXXXX967]", "[XXXXX968]", "[XXXXX969]", "[XXXXX970]", "[XXXXX971]", "[XXXXX972]", "[XXXXX973]", "[XXXXX974]", "[XXXXX975]", "[XXXXX976]", "[XXXXX977]", "[XXXXX978]", "[XXXXX979]", "[XXXXX980]", "[XXXXX981]", "[XXXXX982]", "[XXXXX983]", "[XXXXX984]", "[XXXXX985]", "[XXXXX986]", "[XXXXX987]", "[XXXXX988]", "[XXXXX989]", "[XXXXX990]", "[XXXXX991]", "[XXXXX992]", "[XXXXX993]", "[XXXXX994]", "[XXXXX995]", "[XXXXX996]", "[XXXXX997]", "[XXXXX998]", "[XXXXX999]", "[XXXXX1000]", "[XXXXX1001]", "[XXXXX1002]", "[XXXXX1003]", "[XXXXX1004]", "[XXXXX1005]", "[XXXXX1006]", "[XXXXX1007]", "[XXXXX1008]", "[XXXXX1009]", "[XXXXX1010]", "[XXXXX1011]", "[XXXXX1012]", "[XXXXX1013]", "[XXXXX1014]", "[XXXXX1015]", "[XXXXX1016]", "[XXXXX1017]", "[XXXXX1018]", "[XXXXX1019]", "[XXXXX1020]", "[XXXXX1021]", "[XXXXX1022]", "[XXXXX1023]", "[XXXXX1024]", "[XXXXX1025]", "[XXXXX1026]", "[XXXXX1027]", "[XXXXX1028]", "[XXXXX1029]", "[XXXXX1030]", "[XXXXX1031]", "[XXXXX1032]", "[XXXXX1033]", "[XXXXX1034]", "[XXXXX1035]", "[XXXXX1036]", "[XXXXX1037]", "[XXXXX1038]", "[XXXXX1039]", "[XXXXX1040]", "[XXXXX1041]", "[XXXXX1042]", "[XXXXX1043]", "[XXXXX1044]", "[XXXXX1045]", "[XXXXX1046]", "[XXXXX1047]", "[XXXXX1048]", "[XXXXX1049]", "[XXXXX1050]", "[XXXXX1051]", "[XXXXX1052]", "[XXXXX1053]", "[XXXXX1054]", "[XXXXX1055]", "[XXXXX1056]", "[XXXXX1057]", "[XXXXX1058]", "[XXXXX1059]", "[XXXXX1060]", "[XXXXX1061]", "[XXXXX1062]", "[XXXXX1063]", "[XXXXX1064]", "[XXXXX1065]", "[XXXXX1066]", "[XXXXX1067]", "[XXXXX1068]", "[XXXXX1069]", "[XXXXX1070]", "[XXXXX1071]", "[XXXXX1072]", "[XXXXX1073]", "[XXXXX1074]", "[XXXXX1075]", "[XXXXX1076]", "[XXXXX1077]", "[XXXXX1078]", "[XXXXX1079]", "[XXXXX1080]", "[XXXXX1081]", "[XXXXX1082]", "[XXXXX1083]", "[XXXXX1084]", "[XXXXX1085]", "[XXXXX1086]", "[XXXXX1087]", "[XXXXX1088]", "[XXXXX1089]", "[XXXXX1090]", "[XXXXX1091]", "[XXXXX1092]", "[XXXXX1093]", "[XXXXX1094]", "[XXXXX1095]", "[XXXXX1096]", "[XXXXX1097]", "[XXXXX1098]", "[XXXXX1099]", "[XXXXX1100]", "[XXXXX1101]", "[XXXXX1102]", "[XXXXX1103]", "[XXXXX1104]", "[XXXXX1105]", "[XXXXX1106]", "[XXXXX1107]", "[XXXXX1108]", "[XXXXX1109]", "[XXXXX1110]", "[XXXXX1111]", "[XXXXX1112]", "[XXXXX1113]", "[XXXXX1114]", "[XXXXX1115]", "[XXXXX1116]", "[XXXXX1117]", "[XXXXX1118]", "[XXXXX1119]", "[XXXXX1120]", "[XXXXX1121]", "[XXXXX1122]", "[XXXXX1123]", "[XXXXX1124]", "[XXXXX1125]", "[XXXXX1126]", "[XXXXX1127]", "[XXXXX1128]", "[XXXXX1129]", "[XXXXX1130]", "[XXXXX1131]", "[XXXXX1132]", "[XXXXX1133]", "[XXXXX1134]", "[XXXXX1135]", "[XXXXX1136]", "[XXXXX1137]", "[XXXXX1138]", "[XXXXX1139]", "[XXXXX1140]", "[XXXXX1141]", "[XXXXX1142]", "[XXXXX1143]", "[XXXXX1144]", "[XXXXX1145]", "[XXXXX1146]", "[XXXXX1147]", "[XXXXX1148]", "[XXXXX1149]", "[XXXXX1150]", "[XXXXX1151]", "[XXXXX1152]", "[XXXXX1153]", "[XXXXX1154]", "[XXXXX1155]", "[XXXXX1156]", "[XXXXX1157]", "[XXXXX1158]", "[XXXXX1159]", "[XXXXX1160]", "[XXXXX1161]", "[XXXXX1162]", "[XXXXX1163]", "[XXXXX1164]", "[XXXXX1165]", "[XXXXX1166]", "[XXXXX1167]", "[XXXXX1168]", "[XXXXX1169]", "[XXXXX1170]", "[XXXXX1171]", "[XXXXX1172]", "[XXXXX1173]", "[XXXXX1174]", "[XXXXX1175]", "[XXXXX1176]", "[XXXXX1177]", "[XXXXX1178]", "[XXXXX1179]", "[XXXXX1180]", "[XXXXX1181]", "[XXXXX1182]", "[XXXXX1183]", "[XXXXX1184]", "[XXXXX1185]", "[XXXXX1186]", "[XXXXX1187]", "[XXXXX1188]", "[XXXXX1189]", "[XXXXX1190]", "[XXXXX1191]"]}
|
spiece.model
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ddfd2a48e4f24841f1b5e926357c751dbce7bc28fc3feeb18cd69ad1cf44b6c
|
3 |
+
size 1003082
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"do_lower_case": false, "remove_space": true, "keep_accents": true, "bos_token": "[CLS]", "eos_token": "[SEP]", "unk_token": "<unk>", "sep_token": "[SEP]", "pad_token": "<pad>", "cls_token": "[CLS]", "mask_token": {"content": "[MASK]", "single_word": false, "lstrip": true, "rstrip": false, "normalized": false, "__type": "AddedToken"}, "sp_model_kwargs": {}, "name_or_path": "models/5mb/lus_latn_5mb", "model_input_names": ["input_ids", "attention_mask"], "special_tokens_map_file": "models/5mb/lus_latn_5mb/special_tokens_map.json", "tokenizer_class": "AlbertTokenizer"}
|