nbaden's picture
Upload tokenizer
eace907
raw
history blame
667 Bytes
{
"tur": {
"[PAD]": 46,
"[UNK]": 45,
"c": 1,
"i": 2,
"o": 3,
"y": 4,
"|": 0,
"«": 5,
"»": 6,
"а": 7,
"б": 8,
"в": 9,
"г": 10,
"д": 11,
"е": 12,
"ж": 13,
"з": 14,
"и": 15,
"й": 16,
"к": 17,
"л": 18,
"м": 19,
"н": 20,
"о": 21,
"п": 22,
"р": 23,
"с": 24,
"т": 25,
"у": 26,
"ф": 27,
"х": 28,
"ц": 29,
"ч": 30,
"ш": 31,
"щ": 32,
"ы": 33,
"ь": 34,
"э": 35,
"ю": 36,
"я": 37,
"і": 38,
"ј": 39,
"ҕ": 40,
"ҥ": 41,
"ү": 42,
"һ": 43,
"ө": 44
}
}