goldfish-models committed on
Commit
978f4be
1 Parent(s): 546af3c

Upload gla_latn_5mb tokenizer.

Browse files
added_tokens.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"[XXXXX139]": 44407, "[XXXXX760]": 45028, "[XXXXX530]": 44798, "[XXXXX57]": 44325, "[XXXXX577]": 44845, "[XXXXX299]": 44567, "[XXXXX290]": 44558, "[XXXXX772]": 45040, "[XXXXX641]": 44909, "[XXXXX441]": 44709, "[XXXXX39]": 44307, "[XXXXX592]": 44860, "[XXXXX134]": 44402, "[XXXXX684]": 44952, "[XXXXX748]": 45016, "[XXXXX121]": 44389, "[XXXXX462]": 44730, "[XXXXX525]": 44793, "[XXXXX156]": 44424, "[XXXXX22]": 44290, "[XXXXX693]": 44961, "[XXXXX447]": 44715, "[XXXXX28]": 44296, "[XXXXX374]": 44642, "[XXXXX40]": 44308, "[XXXXX250]": 44518, "[XXXXX72]": 44340, "[XXXXX239]": 44507, "[XXXXX209]": 44477, "[XXXXX278]": 44546, "[XXXXX305]": 44573, "[XXXXX274]": 44542, "[XXXXX476]": 44744, "[XXXXX233]": 44501, "[XXXXX380]": 44648, "[XXXXX133]": 44401, "[XXXXX344]": 44612, "[XXXXX467]": 44735, "[XXXXX249]": 44517, "[XXXXX228]": 44496, "[XXXXX398]": 44666, "[XXXXX332]": 44600, "[XXXXX595]": 44863, "[XXXXX759]": 45027, "[XXXXX23]": 44291, "[XXXXX393]": 44661, "[XXXXX786]": 45054, "[XXXXX433]": 44701, "[XXXXX626]": 44894, "[XXXXX391]": 44659, "[XXXXX14]": 44282, "[XXXXX140]": 44408, "[XXXXX81]": 44349, "[XXXXX312]": 44580, "[XXXXX434]": 44702, "[XXXXX569]": 44837, "[XXXXX219]": 44487, "[XXXXX500]": 44768, "[XXXXX317]": 44585, "[XXXXX682]": 44950, "[XXXXX783]": 45051, "[XXXXX590]": 44858, "[XXXXX258]": 44526, "[XXXXX311]": 44579, "[XXXXX657]": 44925, "[XXXXX784]": 45052, "[XXXXX245]": 44513, "[XXXXX323]": 44591, "[XXXXX293]": 44561, "[XXXXX544]": 44812, "[XXXXX309]": 44577, "[XXXXX663]": 44931, "[XXXXX679]": 44947, "[XXXXX80]": 44348, "[XXXXX279]": 44547, "[XXXXX362]": 44630, "[XXXXX98]": 44366, "[XXXXX639]": 44907, "[XXXXX29]": 44297, "[XXXXX107]": 44375, "[XXXXX63]": 44331, "[XXXXX708]": 44976, "[XXXXX777]": 45045, "[XXXXX633]": 44901, "[XXXXX625]": 44893, "[XXXXX92]": 44360, "[XXXXX628]": 44896, "[XXXXX375]": 44643, "[XXXXX766]": 45034, "[XXXXX472]": 44740, "[XXXXX518]": 44786, "[XXXXX495]": 44763, "[XXXXX778]": 45046, "[XXXXX207]": 44475, "[XXXXX193]": 44461, "[XXXXX519]": 
44787, "[XXXXX771]": 45039, "[XXXXX171]": 44439, "[XXXXX162]": 44430, "[XXXXX59]": 44327, "[XXXXX357]": 44625, "[XXXXX428]": 44696, "[XXXXX340]": 44608, "[XXXXX443]": 44711, "[XXXXX707]": 44975, "[XXXXX510]": 44778, "[XXXXX654]": 44922, "[XXXXX11]": 44279, "[XXXXX560]": 44828, "[XXXXX16]": 44284, "[XXXXX352]": 44620, "[XXXXX117]": 44385, "[XXXXX264]": 44532, "[XXXXX736]": 45004, "[XXXXX295]": 44563, "[XXXXX128]": 44396, "[XXXXX383]": 44651, "[XXXXX549]": 44817, "[XXXXX719]": 44987, "[XXXXX547]": 44815, "[XXXXX427]": 44695, "[XXXXX619]": 44887, "[XXXXX738]": 45006, "[XXXXX252]": 44520, "[XXXXX4]": 44272, "[XXXXX726]": 44994, "[XXXXX504]": 44772, "[XXXXX99]": 44367, "[XXXXX575]": 44843, "[XXXXX681]": 44949, "[XXXXX589]": 44857, "[XXXXX79]": 44347, "[XXXXX284]": 44552, "[MASK]": 44267, "[XXXXX552]": 44820, "[XXXXX20]": 44288, "[XXXXX8]": 44276, "[XXXXX337]": 44605, "[XXXXX710]": 44978, "[XXXXX497]": 44765, "[XXXXX588]": 44856, "[XXXXX740]": 45008, "[XXXXX265]": 44533, "[XXXXX415]": 44683, "[XXXXX603]": 44871, "[XXXXX257]": 44525, "[XXXXX787]": 45055, "[XXXXX470]": 44738, "[XXXXX648]": 44916, "[XXXXX701]": 44969, "[XXXXX213]": 44481, "[XXXXX555]": 44823, "[XXXXX382]": 44650, "[XXXXX259]": 44527, "[XXXXX703]": 44971, "[XXXXX298]": 44566, "[XXXXX260]": 44528, "[XXXXX379]": 44647, "[XXXXX769]": 45037, "[XXXXX183]": 44451, "[XXXXX471]": 44739, "[XXXXX407]": 44675, "[XXXXX481]": 44749, "[XXXXX114]": 44382, "[XXXXX509]": 44777, "[XXXXX444]": 44712, "[XXXXX150]": 44418, "[XXXXX541]": 44809, "[XXXXX757]": 45025, "[XXXXX770]": 45038, "[XXXXX253]": 44521, "[XXXXX706]": 44974, "[XXXXX477]": 44745, "[XXXXX674]": 44942, "[XXXXX466]": 44734, "[XXXXX271]": 44539, "[XXXXX205]": 44473, "[XXXXX538]": 44806, "[XXXXX775]": 45043, "[XXXXX616]": 44884, "[XXXXX355]": 44623, "[XXXXX629]": 44897, "[XXXXX696]": 44964, "[XXXXX152]": 44420, "[XXXXX488]": 44756, "[XXXXX119]": 44387, "[XXXXX514]": 44782, "[XXXXX33]": 44301, "[XXXXX64]": 44332, "[XXXXX607]": 44875, "[XXXXX191]": 44459, "[XXXXX754]": 
45022, "[XXXXX330]": 44598, "[XXXXX409]": 44677, "[XXXXX277]": 44545, "[XXXXX418]": 44686, "[XXXXX214]": 44482, "[XXXXX532]": 44800, "[XXXXX776]": 45044, "[XXXXX655]": 44923, "[XXXXX586]": 44854, "[XXXXX300]": 44568, "[XXXXX185]": 44453, "[XXXXX136]": 44404, "[XXXXX143]": 44411, "[XXXXX513]": 44781, "[XXXXX306]": 44574, "[XXXXX144]": 44412, "[XXXXX773]": 45041, "[XXXXX376]": 44644, "[XXXXX354]": 44622, "[XXXXX739]": 45007, "[XXXXX141]": 44409, "[XXXXX372]": 44640, "<pad>": 44266, "[XXXXX55]": 44323, "[XXXXX501]": 44769, "[XXXXX559]": 44827, "[XXXXX334]": 44602, "[XXXXX526]": 44794, "[XXXXX669]": 44937, "[XXXXX381]": 44649, "[XXXXX712]": 44980, "[XXXXX225]": 44493, "[XXXXX287]": 44555, "[XXXXX123]": 44391, "[XXXXX26]": 44294, "[XXXXX406]": 44674, "[XXXXX715]": 44983, "[XXXXX709]": 44977, "[XXXXX743]": 45011, "[XXXXX479]": 44747, "[XXXXX46]": 44314, "[XXXXX154]": 44422, "[XXXXX714]": 44982, "[XXXXX647]": 44915, "[XXXXX767]": 45035, "[XXXXX166]": 44434, "[XXXXX487]": 44755, "[XXXXX746]": 45014, "[XXXXX593]": 44861, "[XXXXX335]": 44603, "[XXXXX673]": 44941, "[XXXXX373]": 44641, "[XXXXX248]": 44516, "[XXXXX727]": 44995, "[XXXXX73]": 44341, "[XXXXX402]": 44670, "[XXXXX774]": 45042, "[XXXXX503]": 44771, "[XXXXX780]": 45048, "[XXXXX704]": 44972, "[XXXXX112]": 44380, "[XXXXX677]": 44945, "[XXXXX246]": 44514, "[XXXXX531]": 44799, "[XXXXX720]": 44988, "[XXXXX448]": 44716, "[XXXXX169]": 44437, "[XXXXX493]": 44761, "[XXXXX280]": 44548, "[XXXXX498]": 44766, "[XXXXX192]": 44460, "[XXXXX604]": 44872, "[XXXXX656]": 44924, "[XXXXX308]": 44576, "[XXXXX502]": 44770, "[XXXXX3]": 44271, "[XXXXX365]": 44633, "[XXXXX515]": 44783, "[XXXXX644]": 44912, "[XXXXX218]": 44486, "[XXXXX256]": 44524, "[XXXXX43]": 44311, "[XXXXX572]": 44840, "[XXXXX730]": 44998, "[XXXXX282]": 44550, "[XXXXX237]": 44505, "[XXXXX545]": 44813, "[XXXXX148]": 44416, "[XXXXX310]": 44578, "[XXXXX106]": 44374, "[XXXXX781]": 45049, "[XXXXX489]": 44757, "[XXXXX386]": 44654, "[XXXXX689]": 44957, "[XXXXX69]": 44337, 
"[XXXXX349]": 44617, "[XXXXX289]": 44557, "[XXXXX120]": 44388, "[XXXXX142]": 44410, "[XXXXX53]": 44321, "[XXXXX158]": 44426, "[XXXXX58]": 44326, "[CLS]": 44264, "[XXXXX198]": 44466, "[XXXXX612]": 44880, "[XXXXX101]": 44369, "[XXXXX578]": 44846, "[XXXXX370]": 44638, "[XXXXX82]": 44350, "[XXXXX697]": 44965, "[XXXXX473]": 44741, "[XXXXX614]": 44882, "[XXXXX267]": 44535, "[XXXXX167]": 44435, "[XXXXX621]": 44889, "[XXXXX108]": 44376, "[XXXXX496]": 44764, "[XXXXX285]": 44553, "[XXXXX451]": 44719, "[XXXXX567]": 44835, "[XXXXX718]": 44986, "[XXXXX782]": 45050, "[XXXXX528]": 44796, "[XXXXX576]": 44844, "[XXXXX423]": 44691, "[XXXXX749]": 45017, "[XXXXX5]": 44273, "[XXXXX364]": 44632, "[XXXXX464]": 44732, "[XXXXX288]": 44556, "[XXXXX100]": 44368, "[XXXXX270]": 44538, "[XXXXX220]": 44488, "[XXXXX50]": 44318, "[XXXXX658]": 44926, "[XXXXX401]": 44669, "[XXXXX733]": 45001, "[XXXXX768]": 45036, "[XXXXX688]": 44956, "[XXXXX361]": 44629, "[XXXXX403]": 44671, "[XXXXX232]": 44500, "[XXXXX554]": 44822, "[XXXXX9]": 44277, "[XXXXX521]": 44789, "[XXXXX262]": 44530, "[XXXXX667]": 44935, "[XXXXX238]": 44506, "[XXXXX408]": 44676, "[XXXXX678]": 44946, "[XXXXX195]": 44463, "[XXXXX725]": 44993, "[XXXXX649]": 44917, "[SEP]": 44265, "[XXXXX363]": 44631, "[XXXXX331]": 44599, "[XXXXX236]": 44504, "[XXXXX429]": 44697, "[XXXXX617]": 44885, "[XXXXX35]": 44303, "[XXXXX126]": 44394, "[XXXXX129]": 44397, "[XXXXX85]": 44353, "[XXXXX457]": 44725, "[XXXXX540]": 44808, "[XXXXX465]": 44733, "[XXXXX546]": 44814, "[XXXXX437]": 44705, "[XXXXX97]": 44365, "[XXXXX329]": 44597, "[XXXXX2]": 44270, "[XXXXX206]": 44474, "[XXXXX338]": 44606, "[XXXXX151]": 44419, "[XXXXX286]": 44554, "[XXXXX74]": 44342, "[XXXXX118]": 44386, "[XXXXX698]": 44966, "[XXXXX17]": 44285, "[XXXXX634]": 44902, "[XXXXX652]": 44920, "[XXXXX41]": 44309, "[XXXXX342]": 44610, "[XXXXX77]": 44345, "[XXXXX387]": 44655, "[XXXXX78]": 44346, "[XXXXX138]": 44406, "[XXXXX666]": 44934, "[XXXXX553]": 44821, "[XXXXX446]": 44714, "[XXXXX469]": 44737, 
"[XXXXX19]": 44287, "[XXXXX61]": 44329, "[XXXXX587]": 44855, "[XXXXX0]": 44268, "[XXXXX508]": 44776, "[XXXXX328]": 44596, "[XXXXX351]": 44619, "[XXXXX411]": 44679, "[XXXXX606]": 44874, "[XXXXX146]": 44414, "[XXXXX86]": 44354, "[XXXXX190]": 44458, "[XXXXX378]": 44646, "[XXXXX608]": 44876, "[XXXXX202]": 44470, "[XXXXX638]": 44906, "[XXXXX131]": 44399, "[XXXXX659]": 44927, "[XXXXX292]": 44560, "[XXXXX700]": 44968, "[XXXXX651]": 44919, "[XXXXX37]": 44305, "[XXXXX210]": 44478, "[XXXXX671]": 44939, "[XXXXX87]": 44355, "[XXXXX557]": 44825, "[XXXXX668]": 44936, "[XXXXX675]": 44943, "[XXXXX442]": 44710, "[XXXXX636]": 44904, "[XXXXX492]": 44760, "[XXXXX159]": 44427, "[XXXXX683]": 44951, "[XXXXX66]": 44334, "[XXXXX600]": 44868, "[XXXXX304]": 44572, "[XXXXX122]": 44390, "[XXXXX550]": 44818, "[XXXXX109]": 44377, "[XXXXX635]": 44903, "[XXXXX672]": 44940, "[XXXXX240]": 44508, "[XXXXX105]": 44373, "[XXXXX90]": 44358, "[XXXXX145]": 44413, "[XXXXX223]": 44491, "[XXXXX694]": 44962, "[XXXXX70]": 44338, "[XXXXX38]": 44306, "[XXXXX764]": 45032, "[XXXXX624]": 44892, "[XXXXX642]": 44910, "[XXXXX15]": 44283, "[XXXXX454]": 44722, "[XXXXX314]": 44582, "[XXXXX692]": 44960, "[XXXXX630]": 44898, "[XXXXX385]": 44653, "[XXXXX346]": 44614, "[XXXXX480]": 44748, "[XXXXX21]": 44289, "[XXXXX52]": 44320, "[XXXXX318]": 44586, "[XXXXX10]": 44278, "[XXXXX756]": 45024, "[XXXXX234]": 44502, "[XXXXX263]": 44531, "[XXXXX691]": 44959, "[XXXXX247]": 44515, "[XXXXX91]": 44359, "[XXXXX735]": 45003, "[XXXXX215]": 44483, "[XXXXX313]": 44581, "[XXXXX660]": 44928, "[XXXXX520]": 44788, "[XXXXX478]": 44746, "[XXXXX643]": 44911, "[XXXXX180]": 44448, "[XXXXX178]": 44446, "[XXXXX27]": 44295, "[XXXXX455]": 44723, "[XXXXX537]": 44805, "[XXXXX397]": 44665, "[XXXXX25]": 44293, "[XXXXX369]": 44637, "[XXXXX724]": 44992, "[XXXXX96]": 44364, "[XXXXX570]": 44838, "[XXXXX745]": 45013, "[XXXXX717]": 44985, "[XXXXX251]": 44519, "[XXXXX711]": 44979, "[XXXXX297]": 44565, "[XXXXX302]": 44570, "[XXXXX201]": 44469, "[XXXXX690]": 44958, 
"[XXXXX664]": 44932, "[XXXXX135]": 44403, "[XXXXX273]": 44541, "[XXXXX212]": 44480, "[XXXXX62]": 44330, "[XXXXX618]": 44886, "[XXXXX562]": 44830, "[XXXXX137]": 44405, "[XXXXX348]": 44616, "[XXXXX44]": 44312, "[XXXXX631]": 44899, "[XXXXX613]": 44881, "[XXXXX490]": 44758, "[XXXXX731]": 44999, "[XXXXX392]": 44660, "[XXXXX358]": 44626, "[XXXXX765]": 45033, "[XXXXX377]": 44645, "[XXXXX685]": 44953, "[XXXXX283]": 44551, "[XXXXX60]": 44328, "[XXXXX687]": 44955, "[XXXXX763]": 45031, "[XXXXX742]": 45010, "[XXXXX269]": 44537, "[XXXXX255]": 44523, "[XXXXX13]": 44281, "[XXXXX627]": 44895, "[XXXXX548]": 44816, "[XXXXX452]": 44720, "[XXXXX113]": 44381, "[XXXXX254]": 44522, "[XXXXX581]": 44849, "[XXXXX153]": 44421, "[XXXXX460]": 44728, "[XXXXX47]": 44315, "[XXXXX474]": 44742, "[XXXXX65]": 44333, "[XXXXX468]": 44736, "[XXXXX165]": 44433, "[XXXXX303]": 44571, "[XXXXX761]": 45029, "[XXXXX322]": 44590, "[XXXXX320]": 44588, "[XXXXX533]": 44801, "[XXXXX605]": 44873, "[XXXXX208]": 44476, "[XXXXX326]": 44594, "[XXXXX637]": 44905, "[XXXXX95]": 44363, "[XXXXX394]": 44662, "[XXXXX699]": 44967, "[XXXXX453]": 44721, "[XXXXX438]": 44706, "[XXXXX676]": 44944, "[XXXXX51]": 44319, "[XXXXX170]": 44438, "[XXXXX417]": 44685, "[XXXXX30]": 44298, "[XXXXX507]": 44775, "[XXXXX516]": 44784, "[XXXXX157]": 44425, "[XXXXX459]": 44727, "[XXXXX266]": 44534, "[XXXXX176]": 44444, "[XXXXX440]": 44708, "[XXXXX645]": 44913, "[XXXXX529]": 44797, "[XXXXX194]": 44462, "[XXXXX579]": 44847, "[XXXXX662]": 44930, "[XXXXX93]": 44361, "[XXXXX356]": 44624, "[XXXXX199]": 44467, "[XXXXX189]": 44457, "[XXXXX89]": 44357, "[XXXXX404]": 44672, "[XXXXX88]": 44356, "[XXXXX661]": 44929, "[XXXXX686]": 44954, "[XXXXX272]": 44540, "[XXXXX580]": 44848, "[XXXXX564]": 44832, "[XXXXX161]": 44429, "[XXXXX751]": 45019, "[XXXXX186]": 44454, "[XXXXX762]": 45030, "[XXXXX721]": 44989, "[XXXXX188]": 44456, "[XXXXX609]": 44877, "[XXXXX695]": 44963, "[XXXXX24]": 44292, "[XXXXX419]": 44687, "[XXXXX307]": 44575, "[XXXXX200]": 44468, "[XXXXX728]": 
44996, "[XXXXX347]": 44615, "[XXXXX390]": 44658, "[XXXXX558]": 44826, "[XXXXX45]": 44313, "[XXXXX42]": 44310, "[XXXXX324]": 44592, "[XXXXX296]": 44564, "[XXXXX573]": 44841, "[XXXXX486]": 44754, "[XXXXX445]": 44713, "[XXXXX6]": 44274, "[XXXXX561]": 44829, "[XXXXX241]": 44509, "[XXXXX412]": 44680, "[XXXXX1]": 44269, "[XXXXX536]": 44804, "[XXXXX599]": 44867, "[XXXXX76]": 44344, "[XXXXX224]": 44492, "[XXXXX359]": 44627, "[XXXXX491]": 44759, "[XXXXX702]": 44970, "[XXXXX75]": 44343, "[XXXXX485]": 44753, "[XXXXX227]": 44495, "[XXXXX499]": 44767, "[XXXXX574]": 44842, "[XXXXX432]": 44700, "[XXXXX732]": 45000, "[XXXXX583]": 44851, "[XXXXX319]": 44587, "[XXXXX168]": 44436, "[XXXXX785]": 45053, "[XXXXX737]": 45005, "[XXXXX339]": 44607, "[XXXXX229]": 44497, "[XXXXX596]": 44864, "[XXXXX615]": 44883, "[XXXXX435]": 44703, "[XXXXX173]": 44441, "[XXXXX388]": 44656, "[XXXXX623]": 44891, "[XXXXX187]": 44455, "[XXXXX456]": 44724, "[XXXXX461]": 44729, "[XXXXX431]": 44699, "[XXXXX384]": 44652, "[XXXXX115]": 44383, "[XXXXX755]": 45023, "[XXXXX494]": 44762, "[XXXXX430]": 44698, "[XXXXX458]": 44726, "[XXXXX665]": 44933, "[XXXXX611]": 44879, "[XXXXX439]": 44707, "[XXXXX484]": 44752, "[XXXXX653]": 44921, "[XXXXX216]": 44484, "[XXXXX268]": 44536, "[XXXXX94]": 44362, "[XXXXX175]": 44443, "[XXXXX482]": 44750, "[XXXXX217]": 44485, "[XXXXX155]": 44423, "[XXXXX177]": 44445, "[XXXXX301]": 44569, "[XXXXX744]": 45012, "[XXXXX424]": 44692, "[XXXXX650]": 44918, "[XXXXX275]": 44543, "[XXXXX680]": 44948, "[XXXXX147]": 44415, "[XXXXX48]": 44316, "[XXXXX713]": 44981, "[XXXXX563]": 44831, "[XXXXX316]": 44584, "[XXXXX341]": 44609, "[XXXXX243]": 44511, "[XXXXX524]": 44792, "[XXXXX747]": 45015, "[XXXXX405]": 44673, "[XXXXX132]": 44400, "[XXXXX360]": 44628, "[XXXXX230]": 44498, "[XXXXX350]": 44618, "[XXXXX231]": 44499, "[XXXXX598]": 44866, "[XXXXX103]": 44371, "[XXXXX83]": 44351, "[XXXXX716]": 44984, "[XXXXX542]": 44810, "[XXXXX425]": 44693, "[XXXXX327]": 44595, "[XXXXX336]": 44604, "[XXXXX164]": 44432, 
"[XXXXX211]": 44479, "[XXXXX294]": 44562, "[XXXXX566]": 44834, "[XXXXX181]": 44449, "[XXXXX12]": 44280, "[XXXXX111]": 44379, "[XXXXX506]": 44774, "[XXXXX36]": 44304, "[XXXXX7]": 44275, "[XXXXX400]": 44668, "[XXXXX416]": 44684, "[XXXXX483]": 44751, "[XXXXX226]": 44494, "[XXXXX396]": 44664, "[XXXXX371]": 44639, "[XXXXX221]": 44489, "[XXXXX565]": 44833, "[XXXXX426]": 44694, "[XXXXX522]": 44790, "[XXXXX752]": 45020, "[XXXXX705]": 44973, "[XXXXX758]": 45026, "[XXXXX366]": 44634, "[XXXXX343]": 44611, "[XXXXX646]": 44914, "[XXXXX325]": 44593, "[XXXXX184]": 44452, "[XXXXX413]": 44681, "[XXXXX551]": 44819, "[XXXXX163]": 44431, "[XXXXX610]": 44878, "[XXXXX261]": 44529, "[XXXXX34]": 44302, "[XXXXX204]": 44472, "[XXXXX475]": 44743, "[XXXXX511]": 44779, "[XXXXX622]": 44890, "[XXXXX242]": 44510, "[XXXXX505]": 44773, "[XXXXX127]": 44395, "[XXXXX734]": 45002, "[XXXXX235]": 44503, "[XXXXX182]": 44450, "[XXXXX422]": 44690, "[XXXXX741]": 45009, "[XXXXX723]": 44991, "[XXXXX54]": 44322, "[XXXXX67]": 44335, "[XXXXX110]": 44378, "[XXXXX421]": 44689, "[XXXXX535]": 44803, "[XXXXX463]": 44731, "[XXXXX124]": 44392, "[XXXXX594]": 44862, "[XXXXX71]": 44339, "[XXXXX130]": 44398, "[XXXXX410]": 44678, "[XXXXX291]": 44559, "[XXXXX281]": 44549, "[XXXXX517]": 44785, "[XXXXX539]": 44807, "[XXXXX389]": 44657, "[XXXXX534]": 44802, "[XXXXX602]": 44870, "[XXXXX276]": 44544, "[XXXXX116]": 44384, "[XXXXX125]": 44393, "[XXXXX601]": 44869, "[XXXXX523]": 44791, "[XXXXX56]": 44324, "[XXXXX174]": 44442, "[XXXXX568]": 44836, "[XXXXX149]": 44417, "[XXXXX179]": 44447, "[XXXXX84]": 44352, "[XXXXX160]": 44428, "[XXXXX49]": 44317, "[XXXXX543]": 44811, "[XXXXX197]": 44465, "[XXXXX333]": 44601, "[XXXXX597]": 44865, "[XXXXX584]": 44852, "[XXXXX32]": 44300, "[XXXXX18]": 44286, "[XXXXX321]": 44589, "[XXXXX640]": 44908, "[XXXXX353]": 44621, "[XXXXX571]": 44839, "[XXXXX556]": 44824, "[XXXXX620]": 44888, "[XXXXX436]": 44704, "[XXXXX222]": 44490, "[XXXXX172]": 44440, "[XXXXX450]": 44718, "[XXXXX414]": 44682, "[XXXXX753]": 
45021, "[XXXXX68]": 44336, "[XXXXX722]": 44990, "[XXXXX368]": 44636, "[XXXXX102]": 44370, "[XXXXX345]": 44613, "[XXXXX315]": 44583, "[XXXXX670]": 44938, "[XXXXX582]": 44850, "[XXXXX585]": 44853, "[XXXXX512]": 44780, "[XXXXX779]": 45047, "[XXXXX420]": 44688, "[XXXXX750]": 45018, "[XXXXX632]": 44900, "[XXXXX367]": 44635, "[XXXXX399]": 44667, "[XXXXX591]": 44859, "[XXXXX31]": 44299, "[XXXXX244]": 44512, "[XXXXX196]": 44464, "[XXXXX104]": 44372, "[XXXXX729]": 44997, "[XXXXX527]": 44795, "[XXXXX203]": 44471, "[XXXXX449]": 44717, "[XXXXX395]": 44663}
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"bos_token": "[CLS]", "eos_token": "[SEP]", "unk_token": "<unk>", "sep_token": "[SEP]", "pad_token": "<pad>", "cls_token": "[CLS]", "mask_token": {"content": "[MASK]", "single_word": false, "lstrip": true, "rstrip": false, "normalized": false}, "additional_special_tokens": ["[XXXXX0]", "[XXXXX1]", "[XXXXX2]", "[XXXXX3]", "[XXXXX4]", "[XXXXX5]", "[XXXXX6]", "[XXXXX7]", "[XXXXX8]", "[XXXXX9]", "[XXXXX10]", "[XXXXX11]", "[XXXXX12]", "[XXXXX13]", "[XXXXX14]", "[XXXXX15]", "[XXXXX16]", "[XXXXX17]", "[XXXXX18]", "[XXXXX19]", "[XXXXX20]", "[XXXXX21]", "[XXXXX22]", "[XXXXX23]", "[XXXXX24]", "[XXXXX25]", "[XXXXX26]", "[XXXXX27]", "[XXXXX28]", "[XXXXX29]", "[XXXXX30]", "[XXXXX31]", "[XXXXX32]", "[XXXXX33]", "[XXXXX34]", "[XXXXX35]", "[XXXXX36]", "[XXXXX37]", "[XXXXX38]", "[XXXXX39]", "[XXXXX40]", "[XXXXX41]", "[XXXXX42]", "[XXXXX43]", "[XXXXX44]", "[XXXXX45]", "[XXXXX46]", "[XXXXX47]", "[XXXXX48]", "[XXXXX49]", "[XXXXX50]", "[XXXXX51]", "[XXXXX52]", "[XXXXX53]", "[XXXXX54]", "[XXXXX55]", "[XXXXX56]", "[XXXXX57]", "[XXXXX58]", "[XXXXX59]", "[XXXXX60]", "[XXXXX61]", "[XXXXX62]", "[XXXXX63]", "[XXXXX64]", "[XXXXX65]", "[XXXXX66]", "[XXXXX67]", "[XXXXX68]", "[XXXXX69]", "[XXXXX70]", "[XXXXX71]", "[XXXXX72]", "[XXXXX73]", "[XXXXX74]", "[XXXXX75]", "[XXXXX76]", "[XXXXX77]", "[XXXXX78]", "[XXXXX79]", "[XXXXX80]", "[XXXXX81]", "[XXXXX82]", "[XXXXX83]", "[XXXXX84]", "[XXXXX85]", "[XXXXX86]", "[XXXXX87]", "[XXXXX88]", "[XXXXX89]", "[XXXXX90]", "[XXXXX91]", "[XXXXX92]", "[XXXXX93]", "[XXXXX94]", "[XXXXX95]", "[XXXXX96]", "[XXXXX97]", "[XXXXX98]", "[XXXXX99]", "[XXXXX100]", "[XXXXX101]", "[XXXXX102]", "[XXXXX103]", "[XXXXX104]", "[XXXXX105]", "[XXXXX106]", "[XXXXX107]", "[XXXXX108]", "[XXXXX109]", "[XXXXX110]", "[XXXXX111]", "[XXXXX112]", "[XXXXX113]", "[XXXXX114]", "[XXXXX115]", "[XXXXX116]", "[XXXXX117]", "[XXXXX118]", "[XXXXX119]", "[XXXXX120]", "[XXXXX121]", "[XXXXX122]", "[XXXXX123]", "[XXXXX124]", "[XXXXX125]", "[XXXXX126]", "[XXXXX127]", "[XXXXX128]", "[XXXXX129]", 
"[XXXXX130]", "[XXXXX131]", "[XXXXX132]", "[XXXXX133]", "[XXXXX134]", "[XXXXX135]", "[XXXXX136]", "[XXXXX137]", "[XXXXX138]", "[XXXXX139]", "[XXXXX140]", "[XXXXX141]", "[XXXXX142]", "[XXXXX143]", "[XXXXX144]", "[XXXXX145]", "[XXXXX146]", "[XXXXX147]", "[XXXXX148]", "[XXXXX149]", "[XXXXX150]", "[XXXXX151]", "[XXXXX152]", "[XXXXX153]", "[XXXXX154]", "[XXXXX155]", "[XXXXX156]", "[XXXXX157]", "[XXXXX158]", "[XXXXX159]", "[XXXXX160]", "[XXXXX161]", "[XXXXX162]", "[XXXXX163]", "[XXXXX164]", "[XXXXX165]", "[XXXXX166]", "[XXXXX167]", "[XXXXX168]", "[XXXXX169]", "[XXXXX170]", "[XXXXX171]", "[XXXXX172]", "[XXXXX173]", "[XXXXX174]", "[XXXXX175]", "[XXXXX176]", "[XXXXX177]", "[XXXXX178]", "[XXXXX179]", "[XXXXX180]", "[XXXXX181]", "[XXXXX182]", "[XXXXX183]", "[XXXXX184]", "[XXXXX185]", "[XXXXX186]", "[XXXXX187]", "[XXXXX188]", "[XXXXX189]", "[XXXXX190]", "[XXXXX191]", "[XXXXX192]", "[XXXXX193]", "[XXXXX194]", "[XXXXX195]", "[XXXXX196]", "[XXXXX197]", "[XXXXX198]", "[XXXXX199]", "[XXXXX200]", "[XXXXX201]", "[XXXXX202]", "[XXXXX203]", "[XXXXX204]", "[XXXXX205]", "[XXXXX206]", "[XXXXX207]", "[XXXXX208]", "[XXXXX209]", "[XXXXX210]", "[XXXXX211]", "[XXXXX212]", "[XXXXX213]", "[XXXXX214]", "[XXXXX215]", "[XXXXX216]", "[XXXXX217]", "[XXXXX218]", "[XXXXX219]", "[XXXXX220]", "[XXXXX221]", "[XXXXX222]", "[XXXXX223]", "[XXXXX224]", "[XXXXX225]", "[XXXXX226]", "[XXXXX227]", "[XXXXX228]", "[XXXXX229]", "[XXXXX230]", "[XXXXX231]", "[XXXXX232]", "[XXXXX233]", "[XXXXX234]", "[XXXXX235]", "[XXXXX236]", "[XXXXX237]", "[XXXXX238]", "[XXXXX239]", "[XXXXX240]", "[XXXXX241]", "[XXXXX242]", "[XXXXX243]", "[XXXXX244]", "[XXXXX245]", "[XXXXX246]", "[XXXXX247]", "[XXXXX248]", "[XXXXX249]", "[XXXXX250]", "[XXXXX251]", "[XXXXX252]", "[XXXXX253]", "[XXXXX254]", "[XXXXX255]", "[XXXXX256]", "[XXXXX257]", "[XXXXX258]", "[XXXXX259]", "[XXXXX260]", "[XXXXX261]", "[XXXXX262]", "[XXXXX263]", "[XXXXX264]", "[XXXXX265]", "[XXXXX266]", "[XXXXX267]", "[XXXXX268]", "[XXXXX269]", "[XXXXX270]", "[XXXXX271]", 
"[XXXXX272]", "[XXXXX273]", "[XXXXX274]", "[XXXXX275]", "[XXXXX276]", "[XXXXX277]", "[XXXXX278]", "[XXXXX279]", "[XXXXX280]", "[XXXXX281]", "[XXXXX282]", "[XXXXX283]", "[XXXXX284]", "[XXXXX285]", "[XXXXX286]", "[XXXXX287]", "[XXXXX288]", "[XXXXX289]", "[XXXXX290]", "[XXXXX291]", "[XXXXX292]", "[XXXXX293]", "[XXXXX294]", "[XXXXX295]", "[XXXXX296]", "[XXXXX297]", "[XXXXX298]", "[XXXXX299]", "[XXXXX300]", "[XXXXX301]", "[XXXXX302]", "[XXXXX303]", "[XXXXX304]", "[XXXXX305]", "[XXXXX306]", "[XXXXX307]", "[XXXXX308]", "[XXXXX309]", "[XXXXX310]", "[XXXXX311]", "[XXXXX312]", "[XXXXX313]", "[XXXXX314]", "[XXXXX315]", "[XXXXX316]", "[XXXXX317]", "[XXXXX318]", "[XXXXX319]", "[XXXXX320]", "[XXXXX321]", "[XXXXX322]", "[XXXXX323]", "[XXXXX324]", "[XXXXX325]", "[XXXXX326]", "[XXXXX327]", "[XXXXX328]", "[XXXXX329]", "[XXXXX330]", "[XXXXX331]", "[XXXXX332]", "[XXXXX333]", "[XXXXX334]", "[XXXXX335]", "[XXXXX336]", "[XXXXX337]", "[XXXXX338]", "[XXXXX339]", "[XXXXX340]", "[XXXXX341]", "[XXXXX342]", "[XXXXX343]", "[XXXXX344]", "[XXXXX345]", "[XXXXX346]", "[XXXXX347]", "[XXXXX348]", "[XXXXX349]", "[XXXXX350]", "[XXXXX351]", "[XXXXX352]", "[XXXXX353]", "[XXXXX354]", "[XXXXX355]", "[XXXXX356]", "[XXXXX357]", "[XXXXX358]", "[XXXXX359]", "[XXXXX360]", "[XXXXX361]", "[XXXXX362]", "[XXXXX363]", "[XXXXX364]", "[XXXXX365]", "[XXXXX366]", "[XXXXX367]", "[XXXXX368]", "[XXXXX369]", "[XXXXX370]", "[XXXXX371]", "[XXXXX372]", "[XXXXX373]", "[XXXXX374]", "[XXXXX375]", "[XXXXX376]", "[XXXXX377]", "[XXXXX378]", "[XXXXX379]", "[XXXXX380]", "[XXXXX381]", "[XXXXX382]", "[XXXXX383]", "[XXXXX384]", "[XXXXX385]", "[XXXXX386]", "[XXXXX387]", "[XXXXX388]", "[XXXXX389]", "[XXXXX390]", "[XXXXX391]", "[XXXXX392]", "[XXXXX393]", "[XXXXX394]", "[XXXXX395]", "[XXXXX396]", "[XXXXX397]", "[XXXXX398]", "[XXXXX399]", "[XXXXX400]", "[XXXXX401]", "[XXXXX402]", "[XXXXX403]", "[XXXXX404]", "[XXXXX405]", "[XXXXX406]", "[XXXXX407]", "[XXXXX408]", "[XXXXX409]", "[XXXXX410]", "[XXXXX411]", "[XXXXX412]", "[XXXXX413]", 
"[XXXXX414]", "[XXXXX415]", "[XXXXX416]", "[XXXXX417]", "[XXXXX418]", "[XXXXX419]", "[XXXXX420]", "[XXXXX421]", "[XXXXX422]", "[XXXXX423]", "[XXXXX424]", "[XXXXX425]", "[XXXXX426]", "[XXXXX427]", "[XXXXX428]", "[XXXXX429]", "[XXXXX430]", "[XXXXX431]", "[XXXXX432]", "[XXXXX433]", "[XXXXX434]", "[XXXXX435]", "[XXXXX436]", "[XXXXX437]", "[XXXXX438]", "[XXXXX439]", "[XXXXX440]", "[XXXXX441]", "[XXXXX442]", "[XXXXX443]", "[XXXXX444]", "[XXXXX445]", "[XXXXX446]", "[XXXXX447]", "[XXXXX448]", "[XXXXX449]", "[XXXXX450]", "[XXXXX451]", "[XXXXX452]", "[XXXXX453]", "[XXXXX454]", "[XXXXX455]", "[XXXXX456]", "[XXXXX457]", "[XXXXX458]", "[XXXXX459]", "[XXXXX460]", "[XXXXX461]", "[XXXXX462]", "[XXXXX463]", "[XXXXX464]", "[XXXXX465]", "[XXXXX466]", "[XXXXX467]", "[XXXXX468]", "[XXXXX469]", "[XXXXX470]", "[XXXXX471]", "[XXXXX472]", "[XXXXX473]", "[XXXXX474]", "[XXXXX475]", "[XXXXX476]", "[XXXXX477]", "[XXXXX478]", "[XXXXX479]", "[XXXXX480]", "[XXXXX481]", "[XXXXX482]", "[XXXXX483]", "[XXXXX484]", "[XXXXX485]", "[XXXXX486]", "[XXXXX487]", "[XXXXX488]", "[XXXXX489]", "[XXXXX490]", "[XXXXX491]", "[XXXXX492]", "[XXXXX493]", "[XXXXX494]", "[XXXXX495]", "[XXXXX496]", "[XXXXX497]", "[XXXXX498]", "[XXXXX499]", "[XXXXX500]", "[XXXXX501]", "[XXXXX502]", "[XXXXX503]", "[XXXXX504]", "[XXXXX505]", "[XXXXX506]", "[XXXXX507]", "[XXXXX508]", "[XXXXX509]", "[XXXXX510]", "[XXXXX511]", "[XXXXX512]", "[XXXXX513]", "[XXXXX514]", "[XXXXX515]", "[XXXXX516]", "[XXXXX517]", "[XXXXX518]", "[XXXXX519]", "[XXXXX520]", "[XXXXX521]", "[XXXXX522]", "[XXXXX523]", "[XXXXX524]", "[XXXXX525]", "[XXXXX526]", "[XXXXX527]", "[XXXXX528]", "[XXXXX529]", "[XXXXX530]", "[XXXXX531]", "[XXXXX532]", "[XXXXX533]", "[XXXXX534]", "[XXXXX535]", "[XXXXX536]", "[XXXXX537]", "[XXXXX538]", "[XXXXX539]", "[XXXXX540]", "[XXXXX541]", "[XXXXX542]", "[XXXXX543]", "[XXXXX544]", "[XXXXX545]", "[XXXXX546]", "[XXXXX547]", "[XXXXX548]", "[XXXXX549]", "[XXXXX550]", "[XXXXX551]", "[XXXXX552]", "[XXXXX553]", "[XXXXX554]", "[XXXXX555]", 
"[XXXXX556]", "[XXXXX557]", "[XXXXX558]", "[XXXXX559]", "[XXXXX560]", "[XXXXX561]", "[XXXXX562]", "[XXXXX563]", "[XXXXX564]", "[XXXXX565]", "[XXXXX566]", "[XXXXX567]", "[XXXXX568]", "[XXXXX569]", "[XXXXX570]", "[XXXXX571]", "[XXXXX572]", "[XXXXX573]", "[XXXXX574]", "[XXXXX575]", "[XXXXX576]", "[XXXXX577]", "[XXXXX578]", "[XXXXX579]", "[XXXXX580]", "[XXXXX581]", "[XXXXX582]", "[XXXXX583]", "[XXXXX584]", "[XXXXX585]", "[XXXXX586]", "[XXXXX587]", "[XXXXX588]", "[XXXXX589]", "[XXXXX590]", "[XXXXX591]", "[XXXXX592]", "[XXXXX593]", "[XXXXX594]", "[XXXXX595]", "[XXXXX596]", "[XXXXX597]", "[XXXXX598]", "[XXXXX599]", "[XXXXX600]", "[XXXXX601]", "[XXXXX602]", "[XXXXX603]", "[XXXXX604]", "[XXXXX605]", "[XXXXX606]", "[XXXXX607]", "[XXXXX608]", "[XXXXX609]", "[XXXXX610]", "[XXXXX611]", "[XXXXX612]", "[XXXXX613]", "[XXXXX614]", "[XXXXX615]", "[XXXXX616]", "[XXXXX617]", "[XXXXX618]", "[XXXXX619]", "[XXXXX620]", "[XXXXX621]", "[XXXXX622]", "[XXXXX623]", "[XXXXX624]", "[XXXXX625]", "[XXXXX626]", "[XXXXX627]", "[XXXXX628]", "[XXXXX629]", "[XXXXX630]", "[XXXXX631]", "[XXXXX632]", "[XXXXX633]", "[XXXXX634]", "[XXXXX635]", "[XXXXX636]", "[XXXXX637]", "[XXXXX638]", "[XXXXX639]", "[XXXXX640]", "[XXXXX641]", "[XXXXX642]", "[XXXXX643]", "[XXXXX644]", "[XXXXX645]", "[XXXXX646]", "[XXXXX647]", "[XXXXX648]", "[XXXXX649]", "[XXXXX650]", "[XXXXX651]", "[XXXXX652]", "[XXXXX653]", "[XXXXX654]", "[XXXXX655]", "[XXXXX656]", "[XXXXX657]", "[XXXXX658]", "[XXXXX659]", "[XXXXX660]", "[XXXXX661]", "[XXXXX662]", "[XXXXX663]", "[XXXXX664]", "[XXXXX665]", "[XXXXX666]", "[XXXXX667]", "[XXXXX668]", "[XXXXX669]", "[XXXXX670]", "[XXXXX671]", "[XXXXX672]", "[XXXXX673]", "[XXXXX674]", "[XXXXX675]", "[XXXXX676]", "[XXXXX677]", "[XXXXX678]", "[XXXXX679]", "[XXXXX680]", "[XXXXX681]", "[XXXXX682]", "[XXXXX683]", "[XXXXX684]", "[XXXXX685]", "[XXXXX686]", "[XXXXX687]", "[XXXXX688]", "[XXXXX689]", "[XXXXX690]", "[XXXXX691]", "[XXXXX692]", "[XXXXX693]", "[XXXXX694]", "[XXXXX695]", "[XXXXX696]", "[XXXXX697]", 
"[XXXXX698]", "[XXXXX699]", "[XXXXX700]", "[XXXXX701]", "[XXXXX702]", "[XXXXX703]", "[XXXXX704]", "[XXXXX705]", "[XXXXX706]", "[XXXXX707]", "[XXXXX708]", "[XXXXX709]", "[XXXXX710]", "[XXXXX711]", "[XXXXX712]", "[XXXXX713]", "[XXXXX714]", "[XXXXX715]", "[XXXXX716]", "[XXXXX717]", "[XXXXX718]", "[XXXXX719]", "[XXXXX720]", "[XXXXX721]", "[XXXXX722]", "[XXXXX723]", "[XXXXX724]", "[XXXXX725]", "[XXXXX726]", "[XXXXX727]", "[XXXXX728]", "[XXXXX729]", "[XXXXX730]", "[XXXXX731]", "[XXXXX732]", "[XXXXX733]", "[XXXXX734]", "[XXXXX735]", "[XXXXX736]", "[XXXXX737]", "[XXXXX738]", "[XXXXX739]", "[XXXXX740]", "[XXXXX741]", "[XXXXX742]", "[XXXXX743]", "[XXXXX744]", "[XXXXX745]", "[XXXXX746]", "[XXXXX747]", "[XXXXX748]", "[XXXXX749]", "[XXXXX750]", "[XXXXX751]", "[XXXXX752]", "[XXXXX753]", "[XXXXX754]", "[XXXXX755]", "[XXXXX756]", "[XXXXX757]", "[XXXXX758]", "[XXXXX759]", "[XXXXX760]", "[XXXXX761]", "[XXXXX762]", "[XXXXX763]", "[XXXXX764]", "[XXXXX765]", "[XXXXX766]", "[XXXXX767]", "[XXXXX768]", "[XXXXX769]", "[XXXXX770]", "[XXXXX771]", "[XXXXX772]", "[XXXXX773]", "[XXXXX774]", "[XXXXX775]", "[XXXXX776]", "[XXXXX777]", "[XXXXX778]", "[XXXXX779]", "[XXXXX780]", "[XXXXX781]", "[XXXXX782]", "[XXXXX783]", "[XXXXX784]", "[XXXXX785]", "[XXXXX786]", "[XXXXX787]"]}
spiece.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a7877fd219a9c8d44ed2e211c11124978d0e4620c8dcf69f0bf8fc3f6e47064
3
+ size 961334
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"do_lower_case": false, "remove_space": true, "keep_accents": true, "bos_token": "[CLS]", "eos_token": "[SEP]", "unk_token": "<unk>", "sep_token": "[SEP]", "pad_token": "<pad>", "cls_token": "[CLS]", "mask_token": {"content": "[MASK]", "single_word": false, "lstrip": true, "rstrip": false, "normalized": false, "__type": "AddedToken"}, "sp_model_kwargs": {}, "name_or_path": "models/5mb/gla_latn_5mb", "model_input_names": ["input_ids", "attention_mask"], "special_tokens_map_file": "models/5mb/gla_latn_5mb/special_tokens_map.json", "tokenizer_class": "AlbertTokenizer"}