volodya-leveryev committed on
Commit
ee39f68
·
1 Parent(s): 4f1f9e2

Upload tokenizer

Browse files
Files changed (1) hide show
  1. vocab.json +34 -34
vocab.json CHANGED
@@ -1,44 +1,44 @@
1
  {
2
  "sah": {
3
- "-": 12,
4
  "<pad>": 39,
5
  "<unk>": 38,
6
- "y": 22,
7
- "|": 34,
8
- "а": 33,
9
- "б": 32,
10
- "в": 1,
11
- "г": 0,
12
- "д": 17,
13
  "е": 29,
14
- "ж": 28,
15
- "з": 30,
16
- "и": 6,
17
- "й": 27,
18
- "к": 11,
19
- "л": 3,
20
- "м": 36,
21
- "н": 7,
22
- "о": 19,
23
- "п": 8,
24
  "р": 23,
25
- "с": 20,
26
- "т": 10,
27
  "у": 9,
28
- "ф": 2,
29
- "х": 26,
30
- "ц": 31,
31
- "ч": 37,
32
- "ш": 4,
33
- "щ": 16,
34
- "ы": 15,
35
- "ь": 25,
36
- "э": 18,
37
- "я": 24,
38
- "ҕ": 13,
39
- "ҥ": 21,
40
  "ү": 5,
41
- "һ": 14,
42
- "ө": 35
43
  }
44
  }
 
1
  {
2
  "sah": {
3
+ "-": 34,
4
  "<pad>": 39,
5
  "<unk>": 38,
6
+ "y": 18,
7
+ "|": 17,
8
+ "а": 2,
9
+ "б": 24,
10
+ "в": 0,
11
+ "г": 36,
12
+ "д": 15,
13
  "е": 29,
14
+ "ж": 19,
15
+ "з": 20,
16
+ "и": 25,
17
+ "й": 16,
18
+ "к": 33,
19
+ "л": 35,
20
+ "м": 8,
21
+ "н": 27,
22
+ "о": 11,
23
+ "п": 13,
24
  "р": 23,
25
+ "с": 12,
26
+ "т": 1,
27
  "у": 9,
28
+ "ф": 32,
29
+ "х": 14,
30
+ "ц": 6,
31
+ "ч": 26,
32
+ "ш": 31,
33
+ "щ": 10,
34
+ "ы": 37,
35
+ "ь": 30,
36
+ "э": 4,
37
+ "я": 21,
38
+ "ҕ": 22,
39
+ "ҥ": 28,
40
  "ү": 5,
41
+ "һ": 7,
42
+ "ө": 3
43
  }
44
  }