Bauyrjan committed on
Commit
0203b22
·
1 Parent(s): b4c32c1

add tokenizer

Browse files
Files changed (1) hide show
  1. vocab.json +1 -1
vocab.json CHANGED
@@ -1 +1 @@
1
- {"": 0, "": 2, "": 3, "": 4, "": 5, "": 6, "": 7, "": 8, "": 9, "": 10, "": 11, "": 12, "": 13, "": 14, "": 15, "": 16, "": 17, "": 18, "": 19, "": 20, "": 21, "": 22, "": 23, "": 24, "": 25, "": 26, "": 27, "": 28, "": 29, "": 30, "": 31, "": 32, "": 33, "": 34, "": 35, "|": 1, "[UNK]": 36, "[PAD]": 37}
 
1
+ {"в": 0, "ч": 1, "ы": 3, "ө": 4, "г": 5, "щ": 6, "у": 7, "л": 8, "ш": 9, "т": 10, "н": 11, "м": 12, "о": 13, "": 14, "ӊ": 15, "х": 16, "ц": 17, "й": 18, "с": 19, "ё": 20, "ф": 21, "ю": 22, "э": 23, "ң": 24, "ь": 25, "я": 26, "и": 27, "": 28, "д": 29, "б": 30, "п": 31, "ж": 32, "к": 33, "": 34, "е": 35, "ъ": 36, "ү": 37, "а": 38, "р": 39, "з": 40, "|": 2, "[UNK]": 41, "[PAD]": 42}