Update README.md
Browse files
README.md
CHANGED
@@ -86,7 +86,7 @@ processor = Wav2Vec2Processor.from_pretrained("anas/wav2vec2-large-xlsr-arabic")
|
|
86 |
model = Wav2Vec2ForCTC.from_pretrained("anas/wav2vec2-large-xlsr-arabic/")
|
87 |
model.to("cuda")
|
88 |
|
89 |
-
chars_to_ignore_regex = '[
|
90 |
|
91 |
resampler = torchaudio.transforms.Resample(48_000, 16_000)
|
92 |
|
@@ -137,4 +137,6 @@ print("WER: {:2f}".format(100 * wer.compute(predictions=result["pred_strings"],
|
|
137 |
|
138 |
The Common Voice Corpus 4 `train` and `validation` datasets were used for training.
|
139 |
|
140 |
-
The script used for training can be found [here](...)
|
|
|
|
|
|
86 |
model = Wav2Vec2ForCTC.from_pretrained("anas/wav2vec2-large-xlsr-arabic/")
|
87 |
model.to("cuda")
|
88 |
|
89 |
+
chars_to_ignore_regex = '[\\,\\؟\\.\\!\\-\\;\\\\:\\'\\"\\☭\\«\\»\\؛\\—\\ـ\\_\\،\\“\\%\\‘\\”\\�]'
|
90 |
|
91 |
resampler = torchaudio.transforms.Resample(48_000, 16_000)
|
92 |
|
|
|
137 |
|
138 |
The Common Voice Corpus 4 `train` and `validation` datasets were used for training.
|
139 |
|
140 |
+
The script used for training can be found [here](...)
|
141 |
+
Twitter: [@hasnii_anas](https://twitter.com/hasnii_anas)
|
142 |
+
Email [here]([email protected])
|