RasmusToivanen committed on
Commit
ef1a65c
1 Parent(s): 78d0acf

add secrets

Browse files
Files changed (1) hide show
  1. app.py +8 -9
app.py CHANGED
@@ -3,7 +3,7 @@ import librosa
3
  import soundfile as sf
4
  import torch
5
  import warnings
6
-
7
  from transformers import Wav2Vec2ProcessorWithLM, Wav2Vec2CTCTokenizer
8
 
9
  warnings.filterwarnings("ignore")
@@ -11,22 +11,21 @@ warnings.filterwarnings("ignore")
11
  #load wav2vec2 tokenizer and model
12
 
13
  from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
14
- import time
15
  from fastapi import FastAPI, HTTPException, File
16
- model_name = "Finnish-NLP/wav2vec2-xlsr-300m-finnish-lm"
17
  from transformers import pipeline
18
- #feature_extractor = AutoFeatureExtractor.from_pretrained(model_name)
19
- #tokenizer = AutoTokenizer.from_pretrained(model_name)
20
- #model = Wav2Vec2ForCTC.from_pretrained(model_name)
21
- pipe = pipeline(model="Finnish-NLP/wav2vec2-xlsr-1b-finnish-lm-v2",chunk_length_s=20, stride_length_s=(4, 2))
22
 
23
 
 
 
 
24
 
25
 
26
  device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
27
  model_checkpoint = 'Finnish-NLP/t5x-small-nl24-finnish'
28
- tokenizer = AutoTokenizer.from_pretrained(model_checkpoint, use_auth_token=True)
29
- model = AutoModelForSeq2SeqLM.from_pretrained('model_t5', from_flax=False, torch_dtype=torch.float32).to(device)
30
 
31
 
32
  # define speech-to-text function
 
3
  import soundfile as sf
4
  import torch
5
  import warnings
6
+ import os
7
  from transformers import Wav2Vec2ProcessorWithLM, Wav2Vec2CTCTokenizer
8
 
9
  warnings.filterwarnings("ignore")
 
11
  #load wav2vec2 tokenizer and model
12
 
13
  from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
14
+
15
  from fastapi import FastAPI, HTTPException, File
16
+
17
  from transformers import pipeline
 
 
 
 
18
 
19
 
20
+ pipe = pipeline(model="Finnish-NLP/wav2vec2-xlsr-1b-finnish-lm-v2",chunk_length_s=20, stride_length_s=(4, 2))
21
+
22
+ token = os.getenv()
23
 
24
 
25
  device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
26
  model_checkpoint = 'Finnish-NLP/t5x-small-nl24-finnish'
27
+ tokenizer = AutoTokenizer.from_pretrained(model_checkpoint, use_auth_token=os.environ.get('hf_token'))
28
+ model = AutoModelForSeq2SeqLM.from_pretrained('Finnish-NLP/case_correction_model', from_flax=False, torch_dtype=torch.float32, use_auth_token=os.environ.get('hf_token')).to(device)
29
 
30
 
31
  # define speech-to-text function