dtrifuno committed on
Commit
66e9d15
1 Parent(s): 3162c08

Upload tokenizer

Browse files
Files changed (1) hide show
  1. vocab.json +32 -32
vocab.json CHANGED
@@ -1,36 +1,36 @@
1
  {
2
  "[PAD]": 33,
3
  "[UNK]": 32,
4
- "|": 1,
5
- "а": 3,
6
- "б": 30,
7
- "в": 0,
8
- "г": 6,
9
- "д": 27,
10
- "е": 8,
11
- "ж": 13,
12
- "з": 24,
13
- "и": 15,
14
- "к": 16,
15
- "л": 7,
16
- "м": 19,
17
- "н": 20,
18
- "о": 18,
19
- "п": 17,
20
- "р": 31,
21
- "с": 25,
22
- "т": 9,
23
- "у": 22,
24
- "ф": 28,
25
- "х": 11,
26
- "ц": 29,
27
- "ч": 12,
28
- "ш": 2,
29
- "ѓ": 14,
30
- "ѕ": 5,
31
- "ј": 10,
32
- "љ": 26,
33
- "њ": 21,
34
- "ќ": 4,
35
- "џ": 23
36
  }
 
1
  {
2
  "[PAD]": 33,
3
  "[UNK]": 32,
4
+ "|": 0,
5
+ "а": 1,
6
+ "б": 2,
7
+ "в": 3,
8
+ "г": 4,
9
+ "д": 5,
10
+ "е": 6,
11
+ "ж": 7,
12
+ "з": 8,
13
+ "и": 9,
14
+ "к": 10,
15
+ "л": 11,
16
+ "м": 12,
17
+ "н": 13,
18
+ "о": 14,
19
+ "п": 15,
20
+ "р": 16,
21
+ "с": 17,
22
+ "т": 18,
23
+ "у": 19,
24
+ "ф": 20,
25
+ "х": 21,
26
+ "ц": 22,
27
+ "ч": 23,
28
+ "ш": 24,
29
+ "ѓ": 25,
30
+ "ѕ": 26,
31
+ "ј": 27,
32
+ "љ": 28,
33
+ "њ": 29,
34
+ "ќ": 30,
35
+ "џ": 31
36
  }