hoangbinhmta99
/

wav2vec-NCKH-2022

Automatic Speech Recognition

feature-extraction

Inference Endpoints

Model card Files Files and versions Community

wav2vec-NCKH-2022 / README.md

hoangbinhmta99's picture

Update README.md

f3c6047 almost 3 years ago

|

1.66 kB

	---
	language: vi
	datasets:
	- vivos
	- common_voice
	metrics:
	- wer
	pipeline_tag: automatic-speech-recognition
	tags:
	- audio
	- speech
	- Transformer
	license: cc-by-nc-4.0
	model-index:
	- name: Wav2vec2 NCKH Vietnamese 2022
	  results:
	  - task:
	      name: Speech Recognition
	      type: automatic-speech-recognition
	    dataset:
	      name: Common Voice vi
	      type: common_voice
	      args: vi
	    metrics:
	    - name: Test WER
	      type: wer
	      value: No
	---

	Convert a fairseq wav2vec 2.0 checkpoint (`.pt`) to the Hugging Face Transformers format
	Link: https://huggingface.co/tommy19970714/wav2vec2-base-960h
	Bash:
	```bash
	# Install the conversion dependencies. The extra is quoted so shells that
	# treat [...] as a glob pattern (e.g. zsh) do not mangle it.
	pip install "transformers[sentencepiece]"
	pip install fairseq -U

	# Fetch the conversion script that ships with the transformers source tree.
	git clone https://github.com/huggingface/transformers.git
	cp transformers/src/transformers/models/wav2vec2/convert_wav2vec2_original_pytorch_checkpoint_to_pytorch.py .

	# Download the fairseq checkpoint and the letter dictionary. The dictionary
	# is saved inside ./dict so that it matches the --dict_path used below.
	wget https://dl.fbaipublicfiles.com/fairseq/wav2vec/wav2vec_small.pt -O ./wav2vec_small.pt
	mkdir -p dict
	wget https://dl.fbaipublicfiles.com/fairseq/wav2vec/dict.ltr.txt -O ./dict/dict.ltr.txt

	# Convert the checkpoint; the result is written to ./outputs.
	# The trailing backslashes keep this a single command, and --checkpoint_path
	# points at the file downloaded above.
	mkdir -p outputs
	python convert_wav2vec2_original_pytorch_checkpoint_to_pytorch.py \
	    --pytorch_dump_folder_path ./outputs \
	    --checkpoint_path ./wav2vec_small.pt \
	    --dict_path ./dict/dict.ltr.txt \
	    --not_finetuned
	```
	# Install Git LFS and upload the model
	```
	# Register the git-lfs package repository, install git-lfs, then enable it.
	# The installer script must be piped into bash (a real pipe, not an escaped
	# "\|"), and git-lfs must be installed before `git lfs install` can run.
	curl -s https://packagecloud.io/install/repositories/github/git-lfs/script.deb.sh | sudo bash
	sudo apt-get install git-lfs
	git lfs install

	# Clone the target model repository and enter it.
	git clone https://huggingface.co/hoangbinhmta99/wav2vec-demo
	ls
	cd wav2vec-demo/

	# Set the commit identity BEFORE committing, otherwise git refuses to commit.
	# Replace the placeholders with your own e-mail address and display name
	# (this is not a password).
	git config --global user.email "you@example.com"
	git config --global user.name "Your Name"

	# NOTE(review): presumably the converted model files (e.g. from ../outputs)
	# should be copied into this directory before staging - confirm.
	git status
	git add .
	git commit -m "First model version"
	git push
	```