Upload tokenizer
4800b6a
verified
|
{ |
|
"ta": { |
|
"[PAD]": 51, |
|
"[UNK]": 50, |
|
"|": 0, |
|
"அ": 1, |
|
"ஆ": 2, |
|
"இ": 3, |
|
"ஈ": 4, |
|
"உ": 5, |
|
"ஊ": 6, |
|
"எ": 7, |
|
"ஏ": 8, |
|
"ஐ": 9, |
|
"ஒ": 10, |
|
"ஓ": 11, |
|
"ஔ": 12, |
|
"க": 13, |
|
"ங": 14, |
|
"ச": 15, |
|
"ஜ": 16, |
|
"ஞ": 17, |
|
"ட": 18, |
|
"ண": 19, |
|
"த": 20, |
|
"ந": 21, |
|
"ன": 22, |
|
"ப": 23, |
|
"ம": 24, |
|
"ய": 25, |
|
"ர": 26, |
|
"ற": 27, |
|
"ல": 28, |
|
"ள": 29, |
|
"ழ": 30, |
|
"வ": 31, |
|
"ஷ": 32, |
|
"ஸ": 33, |
|
"ஹ": 34, |
|
"ா": 35, |
|
"ி": 36, |
|
"ீ": 37, |
|
"ு": 38, |
|
"ூ": 39, |
|
"ெ": 40, |
|
"ே": 41, |
|
"ை": 42, |
|
"ொ": 43, |
|
"ோ": 44, |
|
"ௌ": 45, |
|
"்": 46, |
|
"ௗ": 47, |
|
"ഥ": 48, |
|
"◯": 49 |
|
} |
|
} |
|
|