speech-to-dutch-translation

Build error

App Files Files Community

susnato committed on Jul 21, 2023

Commit

c13b6ed

1 Parent(s): 03610db

Update app.py

Browse files

Files changed (1) hide show

app.py +10 -10

app.py CHANGED Viewed

@@ -1,7 +1,6 @@
-import gradio as gr
-import numpy as np
 import torch
-from datasets import load_dataset
 from transformers import AutoProcessor, AutoModel, pipeline, MarianMTModel, MarianTokenizer
@@ -21,7 +20,7 @@ martian_mt_tokenizer = MarianTokenizer.from_pretrained("AbhirupGhosh/opus-mt-fin
 def translate_english_to_hindi(english_text):
     tokenized_text = martian_mt_tokenizer.encode(english_text, return_tensors="pt")
-    generated_token_ids = martian_mt_model.generate(tokenized_text)
     hindi_text = martian_mt_tokenizer.decode(generated_token_ids.numpy()[0])
     hindi_text = hindi_text.replace("</s>", "")
     hindi_text = hindi_text.replace("<pad>", "")
@@ -30,21 +29,22 @@ def translate_english_to_hindi(english_text):
 def translate_to_english(audio):
-    outputs = asr_pipe(audio, max_new_tokens=256, generate_kwargs={"task": "transcribe"})
     return outputs["text"]
 def synthesise(text):
-    inputs = processor(text=text, return_tensors="pt")
-    speech_values = model.generate(**inputs)
     speech_values = speech_values.cpu().numpy()
     return speech_values
 def speech_to_hindi_translation(audio):
     english_text = translate_to_english(audio)
     hindi_text = translate_english_to_hindi(english_text)
-    synthesised_speech = synthesise(hindi_text)
     synthesised_speech = (synthesised_speech * 32767).astype(np.int16)
     return 22050, synthesised_speech
@@ -67,7 +67,7 @@ file_translate = gr.Interface(
     fn=speech_to_hindi_translation,
     inputs=gr.Audio(source="upload", type="filepath"),
     outputs=gr.Audio(label="Generated Speech", type="numpy"),
-    # examples=[["./example.wav"]],
     title=title,
     description=description,
 )

 import torch
+import numpy as np
+import gradio as gr
 from transformers import AutoProcessor, AutoModel, pipeline, MarianMTModel, MarianTokenizer
 def translate_english_to_hindi(english_text):
     tokenized_text = martian_mt_tokenizer.encode(english_text, return_tensors="pt")
+    generated_token_ids = martian_mt_model.generate(tokenized_text, use_cache=True)
     hindi_text = martian_mt_tokenizer.decode(generated_token_ids.numpy()[0])
     hindi_text = hindi_text.replace("</s>", "")
     hindi_text = hindi_text.replace("<pad>", "")
 def translate_to_english(audio):
+    outputs = asr_pipe(audio, generate_kwargs={"task": "transcribe", "use_cache":"True"})
     return outputs["text"]
 def synthesise(text):
+    inputs = processor(text=text, return_tensors="pt").to(device)
+    speech_values = model.generate(**inputs, use_cache=True)
     speech_values = speech_values.cpu().numpy()
     return speech_values
 def speech_to_hindi_translation(audio):
     english_text = translate_to_english(audio)
     hindi_text = translate_english_to_hindi(english_text)
+    synthesised_speech = synthesise(hindi_text)[0]
     synthesised_speech = (synthesised_speech * 32767).astype(np.int16)
     return 22050, synthesised_speech
     fn=speech_to_hindi_translation,
     inputs=gr.Audio(source="upload", type="filepath"),
     outputs=gr.Audio(label="Generated Speech", type="numpy"),
+    examples=["/home/susnato/Downloads/example.wav"],
     title=title,
     description=description,
 )