timotewos committed on
Commit
abad9d3
1 Parent(s): ae3f565

Upload tokenizer

Browse files
Files changed (2) hide show
  1. README.md +3 -3
  2. vocab.json +227 -227
README.md CHANGED
@@ -11,8 +11,8 @@ model-index:
11
  - name: wav2vec2-large-xls-r-300m-amharic-demo-colab
12
  results:
13
  - task:
14
- name: Automatic Speech Recognition
15
  type: automatic-speech-recognition
 
16
  dataset:
17
  name: common_voice_16_1
18
  type: common_voice_16_1
@@ -20,9 +20,9 @@ model-index:
20
  split: test
21
  args: am
22
  metrics:
23
- - name: Wer
24
- type: wer
25
  value: 1.0006671114076051
 
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
11
  - name: wav2vec2-large-xls-r-300m-amharic-demo-colab
12
  results:
13
  - task:
 
14
  type: automatic-speech-recognition
15
+ name: Automatic Speech Recognition
16
  dataset:
17
  name: common_voice_16_1
18
  type: common_voice_16_1
 
20
  split: test
21
  args: am
22
  metrics:
23
+ - type: wer
 
24
  value: 1.0006671114076051
25
+ name: Wer
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
vocab.json CHANGED
@@ -1,232 +1,232 @@
1
  {
2
  "[PAD]": 229,
3
  "[UNK]": 228,
4
- "|": 114,
5
- "ሀ": 225,
6
- "ሁ": 43,
7
- "ሂ": 24,
8
- "ሃ": 189,
9
- "ሄ": 32,
10
- "ህ": 129,
11
- "ሆ": 221,
12
- "ለ": 152,
13
- "ሉ": 108,
14
- "ሊ": 69,
15
- "ላ": 4,
16
- "ሌ": 102,
17
- "ል": 17,
18
- "ሎ": 50,
19
- "ሏ": 30,
20
- "ሐ": 60,
21
- "ሑ": 35,
22
- "ሓ": 206,
23
- "ሔ": 82,
24
- "ሕ": 128,
25
- "መ": 56,
26
- "ሙ": 210,
27
- "ሚ": 41,
28
- "ማ": 166,
29
- "ሜ": 180,
30
- "ም": 40,
31
- "ሞ": 226,
32
- "ሟ": 194,
33
- "ሠ": 47,
34
- "ሡ": 149,
35
- "ሣ": 86,
36
- "ሥ": 99,
37
- "ሦ": 81,
38
- "ረ": 88,
39
- "ሩ": 190,
40
- "ሪ": 185,
41
- "ራ": 135,
42
- "ሬ": 162,
43
- "ር": 58,
44
- "ሮ": 48,
45
- "ሯ": 39,
46
- "ሰ": 105,
47
- "ሱ": 148,
48
- "ሲ": 144,
49
- "ሳ": 156,
50
- "ሴ": 95,
51
- "ስ": 27,
52
- "ሶ": 115,
53
- "ሷ": 53,
54
- "ሸ": 94,
55
- "ሹ": 85,
56
- "ሺ": 215,
57
- "ሻ": 3,
58
- "ሼ": 179,
59
- "ሽ": 193,
60
- "ሾ": 71,
61
- "ቀ": 200,
62
- "ቁ": 224,
63
- "ቂ": 87,
64
- "ቃ": 160,
65
- "ቄ": 153,
66
- "ቅ": 163,
67
- "ቆ": 175,
68
- "ቋ": 204,
69
- "በ": 101,
70
- "ቡ": 34,
71
- "ቢ": 170,
72
- "ባ": 122,
73
- "ቤ": 109,
74
- "ብ": 79,
75
- "ቦ": 171,
76
- "ቧ": 46,
77
- "ቨ": 61,
78
- "ቪ": 137,
79
- "ቫ": 143,
80
- "ቭ": 10,
81
- "ቮ": 74,
82
- "ተ": 165,
83
- "ቱ": 51,
84
- "ቲ": 49,
85
- "ታ": 130,
86
- "ቴ": 184,
87
- "ት": 107,
88
- "ቶ": 191,
89
- "ቷ": 178,
90
- "ቸ": 63,
91
- "ቹ": 223,
92
- "ቺ": 209,
93
- "ቻ": 25,
94
- "ቼ": 116,
95
- "ች": 5,
96
- "ቾ": 77,
97
- "ቿ": 158,
98
- "ኀ": 1,
99
- "ኃ": 119,
100
- "ኅ": 222,
101
- "ኋ": 205,
102
- "ነ": 14,
103
- "ኑ": 8,
104
- "ኒ": 211,
105
- "ና": 83,
106
- "ኔ": 151,
107
- "ን": 172,
108
- "ኖ": 201,
109
- "ኗ": 216,
110
- "ኘ": 33,
111
- "ኙ": 123,
112
- "ኛ": 169,
113
- "ኝ": 183,
114
- "ኞ": 97,
115
- "ኟ": 177,
116
- "አ": 45,
117
- "ኡ": 145,
118
- "ኢ": 154,
119
- "ኤ": 13,
120
- "እ": 75,
121
- "ኦ": 12,
122
- "ከ": 140,
123
- "ኩ": 64,
124
- "ኪ": 113,
125
- "ካ": 36,
126
- "ኬ": 134,
127
- "ክ": 192,
128
  "ኮ": 168,
129
- "ኳ": 125,
130
- "ኸ": 93,
131
- "ኽ": 197,
132
- "ወ": 72,
133
- "ዊ": 142,
134
- "ዋ": 65,
135
- "ዌ": 187,
136
- "ው": 198,
137
- "ዎ": 213,
138
- "ዐ": 188,
139
- "ዑ": 212,
140
- "ዒ": 7,
141
- "ዓ": 139,
142
- "ዕ": 132,
143
- "ዖ": 124,
144
- "ዘ": 117,
145
- "ዙ": 100,
146
- "ዚ": 121,
147
- "ዛ": 181,
148
- "ዜ": 173,
149
- "ዝ": 15,
150
- "ዞ": 16,
151
- "ዟ": 161,
152
- "ዢ": 167,
153
- "ዣ": 217,
154
- "ዤ": 159,
155
- "ዥ": 186,
156
- "ዦ": 126,
157
- "የ": 0,
158
- "ዩ": 67,
159
- "ያ": 76,
160
- "ዬ": 104,
161
- "ይ": 37,
162
- "ዮ": 2,
163
- "ደ": 202,
164
- "ዱ": 220,
165
- "ዲ": 155,
166
- "ዳ": 28,
167
- "ዴ": 23,
168
- "ድ": 31,
169
- "ዶ": 120,
170
- "ዷ": 92,
171
- "ጀ": 29,
172
- "ጁ": 207,
173
- "ጂ": 57,
174
- "ጃ": 208,
175
- "ጄ": 203,
176
- "ጅ": 103,
177
- "ጆ": 9,
178
- "ገ": 42,
179
- "ጉ": 68,
180
- "ጊ": 84,
181
- "ጋ": 141,
182
- "ጌ": 146,
183
- "ግ": 118,
184
- "ጎ": 22,
185
- "ጓ": 90,
186
- "ጠ": 150,
187
- "ጡ": 62,
188
- "ጢ": 131,
189
- "ጣ": 19,
190
- "ጤ": 20,
191
- "ጥ": 106,
192
- "ጦ": 11,
193
- "ጧ": 52,
194
- "ጨ": 199,
195
- "ጩ": 55,
196
- "ጪ": 70,
197
- "ጫ": 73,
198
- "ጬ": 110,
199
- "ጭ": 127,
200
- "ጮ": 91,
201
- "ጲ": 196,
202
- "ጴ": 138,
203
- "ጵ": 219,
204
- "ጶ": 111,
205
- "ጸ": 59,
206
- "ጹ": 98,
207
- "ጺ": 195,
208
- "ጻ": 96,
209
- "ጽ": 21,
210
- "ጾ": 80,
211
- "ጿ": 26,
212
- "ፀ": 164,
213
- "ፁ": 133,
214
- "ፃ": 38,
215
- "ፅ": 18,
216
- "ፈ": 6,
217
- "ፉ": 218,
218
- "ፊ": 89,
219
- "ፋ": 112,
220
- "ፌ": 176,
221
- "ፍ": 54,
222
- "ፎ": 136,
223
- "ፏ": 227,
224
- "ፑ": 66,
225
- "ፒ": 78,
226
- "ፓ": 182,
227
- "ፔ": 147,
228
- "ፕ": 174,
229
- "ፖ": 214,
230
- "“": 157,
231
- "”": 44
232
  }
 
1
  {
2
  "[PAD]": 229,
3
  "[UNK]": 228,
4
+ "|": 187,
5
+ "ሀ": 141,
6
+ "ሁ": 12,
7
+ "ሂ": 113,
8
+ "ሃ": 219,
9
+ "ሄ": 181,
10
+ "ህ": 221,
11
+ "ሆ": 178,
12
+ "ለ": 78,
13
+ "ሉ": 4,
14
+ "ሊ": 16,
15
+ "ላ": 86,
16
+ "ሌ": 139,
17
+ "ል": 15,
18
+ "ሎ": 24,
19
+ "ሏ": 81,
20
+ "ሐ": 76,
21
+ "ሑ": 64,
22
+ "ሓ": 44,
23
+ "ሔ": 171,
24
+ "ሕ": 45,
25
+ "መ": 74,
26
+ "ሙ": 124,
27
+ "ሚ": 191,
28
+ "ማ": 199,
29
+ "ሜ": 94,
30
+ "ም": 183,
31
+ "ሞ": 84,
32
+ "ሟ": 157,
33
+ "ሠ": 35,
34
+ "ሡ": 72,
35
+ "ሣ": 222,
36
+ "ሥ": 140,
37
+ "ሦ": 132,
38
+ "ረ": 151,
39
+ "ሩ": 225,
40
+ "ሪ": 226,
41
+ "ራ": 133,
42
+ "ሬ": 122,
43
+ "ር": 147,
44
+ "ሮ": 189,
45
+ "ሯ": 188,
46
+ "ሰ": 214,
47
+ "ሱ": 150,
48
+ "ሲ": 68,
49
+ "ሳ": 42,
50
+ "ሴ": 63,
51
+ "ስ": 53,
52
+ "ሶ": 27,
53
+ "ሷ": 208,
54
+ "ሸ": 128,
55
+ "ሹ": 21,
56
+ "ሺ": 43,
57
+ "ሻ": 160,
58
+ "ሼ": 186,
59
+ "ሽ": 201,
60
+ "ሾ": 227,
61
+ "ቀ": 129,
62
+ "ቁ": 200,
63
+ "ቂ": 9,
64
+ "ቃ": 179,
65
+ "ቄ": 105,
66
+ "ቅ": 115,
67
+ "ቆ": 101,
68
+ "ቋ": 206,
69
+ "በ": 111,
70
+ "ቡ": 50,
71
+ "ቢ": 60,
72
+ "ባ": 10,
73
+ "ቤ": 223,
74
+ "ብ": 217,
75
+ "ቦ": 185,
76
+ "ቧ": 167,
77
+ "ቨ": 103,
78
+ "ቪ": 184,
79
+ "ቫ": 158,
80
+ "ቭ": 195,
81
+ "ቮ": 107,
82
+ "ተ": 47,
83
+ "ቱ": 177,
84
+ "ቲ": 163,
85
+ "ታ": 51,
86
+ "ቴ": 146,
87
+ "ት": 137,
88
+ "ቶ": 159,
89
+ "ቷ": 98,
90
+ "ቸ": 148,
91
+ "ቹ": 93,
92
+ "ቺ": 212,
93
+ "ቻ": 2,
94
+ "ቼ": 62,
95
+ "ች": 117,
96
+ "ቾ": 92,
97
+ "ቿ": 20,
98
+ "ኀ": 210,
99
+ "ኃ": 156,
100
+ "ኅ": 73,
101
+ "ኋ": 7,
102
+ "ነ": 56,
103
+ "ኑ": 134,
104
+ "ኒ": 190,
105
+ "ና": 57,
106
+ "ኔ": 65,
107
+ "ን": 164,
108
+ "ኖ": 216,
109
+ "ኗ": 55,
110
+ "ኘ": 215,
111
+ "ኙ": 22,
112
+ "ኛ": 207,
113
+ "ኝ": 83,
114
+ "ኞ": 144,
115
+ "ኟ": 61,
116
+ "አ": 1,
117
+ "ኡ": 3,
118
+ "ኢ": 202,
119
+ "ኤ": 192,
120
+ "እ": 48,
121
+ "ኦ": 58,
122
+ "ከ": 99,
123
+ "ኩ": 87,
124
+ "ኪ": 135,
125
+ "ካ": 66,
126
+ "ኬ": 32,
127
+ "ክ": 96,
128
  "ኮ": 168,
129
+ "ኳ": 29,
130
+ "ኸ": 224,
131
+ "ኽ": 174,
132
+ "ወ": 198,
133
+ "ዊ": 69,
134
+ "ዋ": 108,
135
+ "ዌ": 19,
136
+ "ው": 49,
137
+ "ዎ": 138,
138
+ "ዐ": 209,
139
+ "ዑ": 127,
140
+ "ዒ": 95,
141
+ "ዓ": 166,
142
+ "ዕ": 97,
143
+ "ዖ": 118,
144
+ "ዘ": 172,
145
+ "ዙ": 33,
146
+ "ዚ": 70,
147
+ "ዛ": 0,
148
+ "ዜ": 13,
149
+ "ዝ": 161,
150
+ "ዞ": 38,
151
+ "ዟ": 119,
152
+ "ዢ": 46,
153
+ "ዣ": 52,
154
+ "ዤ": 114,
155
+ "ዥ": 169,
156
+ "ዦ": 30,
157
+ "የ": 125,
158
+ "ዩ": 220,
159
+ "ያ": 25,
160
+ "ዬ": 89,
161
+ "ይ": 6,
162
+ "ዮ": 175,
163
+ "ደ": 106,
164
+ "ዱ": 162,
165
+ "ዲ": 91,
166
+ "ዳ": 123,
167
+ "ዴ": 152,
168
+ "ድ": 102,
169
+ "ዶ": 88,
170
+ "ዷ": 204,
171
+ "ጀ": 218,
172
+ "ጁ": 149,
173
+ "ጂ": 71,
174
+ "ጃ": 126,
175
+ "ጄ": 11,
176
+ "ጅ": 41,
177
+ "ጆ": 40,
178
+ "ገ": 176,
179
+ "ጉ": 180,
180
+ "ጊ": 143,
181
+ "ጋ": 14,
182
+ "ጌ": 131,
183
+ "ግ": 120,
184
+ "ጎ": 110,
185
+ "ጓ": 213,
186
+ "ጠ": 194,
187
+ "ጡ": 8,
188
+ "ጢ": 136,
189
+ "ጣ": 142,
190
+ "ጤ": 153,
191
+ "ጥ": 121,
192
+ "ጦ": 112,
193
+ "ጧ": 5,
194
+ "ጨ": 155,
195
+ "ጩ": 116,
196
+ "ጪ": 205,
197
+ "ጫ": 85,
198
+ "ጬ": 79,
199
+ "ጭ": 154,
200
+ "ጮ": 67,
201
+ "ጲ": 193,
202
+ "ጴ": 31,
203
+ "ጵ": 145,
204
+ "ጶ": 18,
205
+ "ጸ": 90,
206
+ "ጹ": 36,
207
+ "ጺ": 173,
208
+ "ጻ": 104,
209
+ "ጽ": 23,
210
+ "ጾ": 77,
211
+ "ጿ": 203,
212
+ "ፀ": 54,
213
+ "ፁ": 37,
214
+ "ፃ": 109,
215
+ "ፅ": 80,
216
+ "ፈ": 28,
217
+ "ፉ": 34,
218
+ "ፊ": 82,
219
+ "ፋ": 196,
220
+ "ፌ": 17,
221
+ "ፍ": 59,
222
+ "ፎ": 39,
223
+ "ፏ": 26,
224
+ "ፑ": 165,
225
+ "ፒ": 130,
226
+ "ፓ": 197,
227
+ "ፔ": 75,
228
+ "ፕ": 211,
229
+ "ፖ": 100,
230
+ "“": 170,
231
+ "”": 182
232
  }