w2v-bert-Telugu-large / vocab.json
Anujgr8's picture
Upload tokenizer
4517bc1 verified
raw
history blame
No virus
1.01 kB
{
"&": 1,
"/": 2,
"[PAD]": 79,
"[UNK]": 78,
"\\": 3,
"_": 4,
"e": 5,
"g": 6,
"l": 7,
"n": 8,
"p": 9,
"r": 10,
"s": 11,
"t": 12,
"|": 0,
"ఁ": 13,
"ం": 14,
"ః": 15,
"అ": 16,
"ఆ": 17,
"ఇ": 18,
"ఈ": 19,
"ఉ": 20,
"ఊ": 21,
"ఋ": 22,
"ఎ": 23,
"ఏ": 24,
"ఐ": 25,
"ఒ": 26,
"ఓ": 27,
"ఔ": 28,
"క": 29,
"ఖ": 30,
"గ": 31,
"ఘ": 32,
"ఙ": 33,
"చ": 34,
"ఛ": 35,
"జ": 36,
"ఞ": 37,
"ట": 38,
"ఠ": 39,
"డ": 40,
"ఢ": 41,
"ణ": 42,
"త": 43,
"థ": 44,
"ద": 45,
"ధ": 46,
"న": 47,
"ప": 48,
"ఫ": 49,
"బ": 50,
"భ": 51,
"మ": 52,
"య": 53,
"ర": 54,
"ఱ": 55,
"ల": 56,
"ళ": 57,
"వ": 58,
"శ": 59,
"ష": 60,
"స": 61,
"హ": 62,
"ా": 63,
"ి": 64,
"ీ": 65,
"ు": 66,
"ూ": 67,
"ృ": 68,
"ె": 69,
"ే": 70,
"ై": 71,
"ొ": 72,
"ో": 73,
"ౌ": 74,
"్": 75,
"‌": 76,
"’": 77
}