MultiMed

Runtime error

App Files Community

Tonic committed on Nov 19, 2023

Commit

e98c8c0

1 Parent(s): 81dcc03

Update app.py

Browse files

Files changed (1) hide show

app.py +17 -18

app.py CHANGED Viewed

@@ -140,22 +140,24 @@ def process_speech(input_language, audio_input):
         return f"{e}"
 def convert_text_to_speech(input_text: str, source_language: str, target_language: str) -> tuple[str, str]:
     client = Client("https://facebook-seamless-m4t.hf.space/--replicas/8cllp/")
     try:
         result = client.predict(
-            "T2ST",  # Task
-            "",  # Audio source
-            None,  # Input audio mic
-            None,  # Input audio file
-            input_text,  # Input text
-            source_language,  # Source language
-            target_language,  # Target language
-            api_name="/run",  # API endpoint
         )
         # Initialize variables
         translated_text = ""
         new_file_path = ""
@@ -170,23 +172,20 @@ def convert_text_to_speech(input_text: str, source_language: str, target_languag
                 if not translated_text:
                     translated_text = item
             elif os.path.isdir(item):
-                # Process the directory to find the first audio file
                 for file in os.listdir(item):
                     file_path = os.path.join(item, file)
-                    if os.path.isfile(file_path) and file_path.endswith('.wav'):
-                        new_file_name = f"audio_output_{uuid.uuid4()}.wav"
-                        new_file_path = os.path.join(os.path.dirname(file_path), new_file_name)
-                        os.rename(file_path, new_file_path)
-                        break  # Stop after finding the first audio file
                 if new_file_path:
-                    break  # Exit if an audio file has been processed
         return new_file_path, translated_text
     except Exception as e:
         return f"Error in text-to-speech conversion: {str(e)}", ""
 def process_image(image_input):

         return f"{e}"
+import os
+import uuid
 def convert_text_to_speech(input_text: str, source_language: str, target_language: str) -> tuple[str, str]:
     client = Client("https://facebook-seamless-m4t.hf.space/--replicas/8cllp/")
     try:
         result = client.predict(
+            task_name="T2ST",
+            audio_source="",
+            input_audio_mic=None,
+            input_audio_file=None,
+            input_text=input_text,
+            source_language=source_language,
+            target_language=target_language,
+            api_name="/run",
         )
         # Initialize variables
         translated_text = ""
         new_file_path = ""
                 if not translated_text:
                     translated_text = item
             elif os.path.isdir(item):
+                # Find the first MP3 file in the directory
                 for file in os.listdir(item):
                     file_path = os.path.join(item, file)
+                    if os.path.isfile(file_path) and file_path.endswith('.mp3'):
+                        # Return the path of the MP3 file directly without renaming
+                        new_file_path = file_path
+                        break
                 if new_file_path:
+                    break
         return new_file_path, translated_text
     except Exception as e:
         return f"Error in text-to-speech conversion: {str(e)}", ""
 def process_image(image_input):