VDNT11 committed
Commit c3e8af7 · verified · 1 Parent(s): 4283a1b

Update app.py

Files changed (1):
  app.py (+12 -4)
app.py CHANGED
@@ -10,18 +10,25 @@ import uuid
 device = "cuda:0" if torch.cuda.is_available() else "cpu"
 torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
 
-# Load Whisper model from Hugging Face
+
 @st.cache_resource
 def load_model():
-    model_id = "openai/whisper-large-v2"
-
+    # Use a specific Hindi-optimized Whisper model
+    model_id = "openai/whisper-large-v2"  # or consider a multilingual model
+
+    # For Hindi, you might want to specify additional parameters
     model = AutoModelForSpeechSeq2Seq.from_pretrained(
-        model_id, torch_dtype=torch_dtype, low_cpu_mem_usage=True, use_safetensors=True
+        model_id,
+        torch_dtype=torch_dtype,
+        low_cpu_mem_usage=True,
+        use_safetensors=True,
     )
     model.to(device)
 
+    # Use the processor from the same model
     processor = AutoProcessor.from_pretrained(model_id)
 
+    # Create pipeline with language specification
     pipe = pipeline(
         "automatic-speech-recognition",
         model=model,
@@ -29,6 +36,7 @@ def load_model():
         feature_extractor=processor.feature_extractor,
         torch_dtype=torch_dtype,
         device=device,
+        generate_kwargs={"language": "hi"}  # Specify Hindi language
     )
     return pipe, processor
 
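
For context, a minimal sketch of how the cached pipeline returned by load_model() might be called elsewhere in app.py. The calling code is not part of this commit, so the st.file_uploader widget, the accepted file types, and the output handling below are assumptions for illustration, not the repository's actual UI code.

# Hypothetical usage sketch (not part of this commit): transcribe an uploaded
# Hindi audio clip with the pipeline returned by load_model() above.
import streamlit as st

pipe, processor = load_model()

uploaded = st.file_uploader("Upload Hindi audio", type=["wav", "mp3", "m4a"])
if uploaded is not None:
    # The ASR pipeline accepts raw audio bytes; the transcription language is
    # already fixed to Hindi via generate_kwargs={"language": "hi"} in load_model().
    result = pipe(uploaded.read())
    st.write(result["text"])

Because the language is pinned inside the pipeline, the caller does not need to pass per-request generation options; swapping to another language would only require changing the "hi" code in load_model().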