Spaces:

vsrinivas
/

Multi_Language_Video_Conference

Sleeping

App Files Community

vsrinivas committed on Oct 14, 2024

Commit

1589ebc

verified ·

1 Parent(s): 7053531

Update app.py

Browse files

Files changed (1) hide show

app.py +17 -27

app.py CHANGED Viewed

@@ -33,23 +33,21 @@ language_codes = {"English":"en", "Hindi":"hi", "Portuguese":"pt", "Chinese":"zh
 "Ukrainian":"uk", "Greek":"el", "Czech":"cs", "Danish":"da", "Finnish":"fi",
 "Bulgarian":"bg", "Croatian":"hr", "Slovak":"sk"}
-# meeting_texts = []
 n_participants = 4 # This can be adjusted based on the number of people in the call
 language_choices = ["English", "Polish", "Hindi", "Arabic"]
 def clear_all():
-    # global meeting_texts
-    # meeting_texts = []  # Reset meeting texts
-    return [None] * (n_participants * 5 + 1)  # Reset outputs of transcripts, translated texts, and dubbed videos
 def wait_for_dubbing_completion(dubbing_id: str) -> bool:
     """
     Waits for the dubbing process to complete by periodically checking the status.
     Args:
         dubbing_id (str): The dubbing project id.
     Returns:
         bool: True if the dubbing is successful, False otherwise.
     """
@@ -77,11 +75,9 @@ def wait_for_dubbing_completion(dubbing_id: str) -> bool:
 def download_dubbed_file(dubbing_id: str, language_code: str) -> str:
     """
     Downloads the dubbed file for a given dubbing ID and language code.
     Args:
         dubbing_id: The ID of the dubbing project.
         language_code: The language code for the dubbing.
     Returns:
         The file path to the downloaded dubbed file.
     """
@@ -104,13 +100,11 @@ def create_dub_from_file(
 # ) -> Optional[str]:
     """
     Dubs an audio or video file from one language to another and saves the output.
     Args:
         input_file_path (str): The file path of the audio or video to dub.
         file_format (str): The file format of the input file.
         source_language (str): The language of the input file.
         target_language (str): The target language to dub into.
     Returns:
         Optional[str]: The file path of the dubbed file or None if operation failed.
     """
@@ -136,17 +130,20 @@ def create_dub_from_file(
         return None
-def summarize(meeting_texts):
     mt = ', '.join([f"{k}: {v}" for i in meeting_texts for k, v in i.items()])
     meeting_date_time = str(datetime.now().strftime("%Y-%m-%d %H:%M:%S"))
     meeting_texts = meeting_date_time + '\n' + mt
     minutes_of_meeting = ""
     for chunk in AI71(AI71_API_KEY.strip()).chat.completions.create(
         model="tiiuae/falcon-180b-chat",
         messages=[
             {"role": "system", "content": f"""You are an expereiced Secretary who can summarize meeting discussions into minutes of meeting.
-            Summarize the meetings discussions provided as Speakerwise conversation.
             Strictly consider only the context given in user content {meeting_texts} for summarization.
             Ensure to mention the title as 'Minutes of Meeting held on {meeting_date_time} and present the summary with better viewing format and title in bold letters"""},
             {"role": "user", "content": meeting_texts},
@@ -195,12 +192,12 @@ def synthesize_speech(video, source_language,target_language):
     return dub_video
 # This function handles the processing when any participant speaks
-def process_speaker(video, speaker_idx, n_participants, meeting_texts, *language_list):
     transcript = speech_to_text(video)
     # Create outputs for each participant
     outputs = []
-    # global meeting_texts
     def process_translation_dubbing(i):
         if i != speaker_idx:
             participant_language = language_codes[language_list[i]]
@@ -220,7 +217,6 @@ def process_speaker(video, speaker_idx, n_participants, meeting_texts, *language
         else:
             outputs.append(translated_text)
             outputs.append(dubbed_video)
     if speaker_idx == 0:
         meeting_texts.append({f"Speaker_{speaker_idx+1}":outputs[0]})
     else:
@@ -228,11 +224,9 @@ def process_speaker(video, speaker_idx, n_participants, meeting_texts, *language
     print(len(outputs))
     print(outputs)
-    outputs.extend(meeting_texts)
     print('meeting_texts: ',meeting_texts)
     return outputs
 def create_participant_row(i, language_choices):
     """Creates the UI for a single participant."""
     with gr.Row():
@@ -243,15 +237,12 @@ def create_participant_row(i, language_choices):
         dubbed_video = gr.Video(label="Speaker's Dubbed Video")
         return video_input, language_dropdown, transcript_output, translated_text, dubbed_video
 # Main dynamic Gradio interface
 def create_gradio_interface(n_participants, language_choices):
     with gr.Blocks() as demo:
         gr.Markdown("""# LinguaPolis: Bridging Languages, Uniting Teams Globally - Multilingual Conference Call Simulation
         ## Record your video or upload your video and press the corresponding Submit button at the bottom""")
-        # meeting_texts = []
         video_inputs = []
         language_dropdowns = []
         transcript_outputs = []
@@ -259,7 +250,7 @@ def create_gradio_interface(n_participants, language_choices):
         dubbed_videos = []
         clear_button = gr.Button("Clear All")
         # Create a row for each participant
         for i in range(n_participants):
             video_input, language_dropdown, transcript_output, translated_text, dubbed_video = create_participant_row(i, language_choices)
@@ -273,13 +264,12 @@ def create_gradio_interface(n_participants, language_choices):
         for i in range(n_participants):
             gr.Button(f"Submit Speaker {i+1}'s Speech").click(
                 process_speaker,
-                # [video_inputs[i], gr.State(i), gr.State(n_participants)] + [language_dropdowns[j] for j in range(n_participants)],
-                [video_inputs[i], gr.State(i), gr.State(n_participants)] + [gr.State(value=[])] + [language_dropdowns[j] for j in range(n_participants)],
-                [transcript_outputs[i]] + [k for j in zip(translated_texts[:i]+translated_texts[i+1:], dubbed_videos[:i]+dubbed_videos[i+1:]) for k in j] + [gr.State()]
            )
         minutes = gr.Textbox(label="Minutes of Meeting")
-        gr.Button(f"Generate Minutes of meeting").click(summarize, meeting_texts, minutes)
         # Clear button to reset inputs and outputs
         clear_button.click(clear_all, None, [*video_inputs, *transcript_outputs, *translated_texts, *dubbed_videos, minutes])
@@ -287,4 +277,4 @@ def create_gradio_interface(n_participants, language_choices):
     demo.queue().launch(debug=True, share=True)
-create_gradio_interface(n_participants, language_choices)

 "Ukrainian":"uk", "Greek":"el", "Czech":"cs", "Danish":"da", "Finnish":"fi",
 "Bulgarian":"bg", "Croatian":"hr", "Slovak":"sk"}
+meeting_texts = []
 n_participants = 4 # This can be adjusted based on the number of people in the call
 language_choices = ["English", "Polish", "Hindi", "Arabic"]
 def clear_all():
+    global meeting_texts
+    meeting_texts = []  # Reset meeting texts
+    return [None] * (n_participants * 4 + 1)  # Reset outputs of transcripts, translated texts, and dubbed videos
 def wait_for_dubbing_completion(dubbing_id: str) -> bool:
     """
     Waits for the dubbing process to complete by periodically checking the status.
     Args:
         dubbing_id (str): The dubbing project id.
     Returns:
         bool: True if the dubbing is successful, False otherwise.
     """
 def download_dubbed_file(dubbing_id: str, language_code: str) -> str:
     """
     Downloads the dubbed file for a given dubbing ID and language code.
     Args:
         dubbing_id: The ID of the dubbing project.
         language_code: The language code for the dubbing.
     Returns:
         The file path to the downloaded dubbed file.
     """
 # ) -> Optional[str]:
     """
     Dubs an audio or video file from one language to another and saves the output.
     Args:
         input_file_path (str): The file path of the audio or video to dub.
         file_format (str): The file format of the input file.
         source_language (str): The language of the input file.
         target_language (str): The target language to dub into.
     Returns:
         Optional[str]: The file path of the dubbed file or None if operation failed.
     """
         return None
+def summarize(meeting_texts=meeting_texts):
     mt = ', '.join([f"{k}: {v}" for i in meeting_texts for k, v in i.items()])
     meeting_date_time = str(datetime.now().strftime("%Y-%m-%d %H:%M:%S"))
     meeting_texts = meeting_date_time + '\n' + mt
+    # meeting_conversation_processed ='\n'.join(mt)
+    # print("M:", session_conversation_processed)
     minutes_of_meeting = ""
     for chunk in AI71(AI71_API_KEY.strip()).chat.completions.create(
         model="tiiuae/falcon-180b-chat",
         messages=[
             {"role": "system", "content": f"""You are an expereiced Secretary who can summarize meeting discussions into minutes of meeting.
+            Summarize the meetings discussions provided as Speakerwise conversation.
             Strictly consider only the context given in user content {meeting_texts} for summarization.
             Ensure to mention the title as 'Minutes of Meeting held on {meeting_date_time} and present the summary with better viewing format and title in bold letters"""},
             {"role": "user", "content": meeting_texts},
     return dub_video
 # This function handles the processing when any participant speaks
+def process_speaker(video, speaker_idx, n_participants, *language_list):
     transcript = speech_to_text(video)
     # Create outputs for each participant
     outputs = []
+    global meeting_texts
     def process_translation_dubbing(i):
         if i != speaker_idx:
             participant_language = language_codes[language_list[i]]
         else:
             outputs.append(translated_text)
             outputs.append(dubbed_video)
     if speaker_idx == 0:
         meeting_texts.append({f"Speaker_{speaker_idx+1}":outputs[0]})
     else:
     print(len(outputs))
     print(outputs)
     print('meeting_texts: ',meeting_texts)
     return outputs
 def create_participant_row(i, language_choices):
     """Creates the UI for a single participant."""
     with gr.Row():
         dubbed_video = gr.Video(label="Speaker's Dubbed Video")
         return video_input, language_dropdown, transcript_output, translated_text, dubbed_video
 # Main dynamic Gradio interface
 def create_gradio_interface(n_participants, language_choices):
     with gr.Blocks() as demo:
         gr.Markdown("""# LinguaPolis: Bridging Languages, Uniting Teams Globally - Multilingual Conference Call Simulation
         ## Record your video or upload your video and press the corresponding Submit button at the bottom""")
         video_inputs = []
         language_dropdowns = []
         transcript_outputs = []
         dubbed_videos = []
         clear_button = gr.Button("Clear All")
         # Create a row for each participant
         for i in range(n_participants):
             video_input, language_dropdown, transcript_output, translated_text, dubbed_video = create_participant_row(i, language_choices)
         for i in range(n_participants):
             gr.Button(f"Submit Speaker {i+1}'s Speech").click(
                 process_speaker,
+                [video_inputs[i], gr.State(i), gr.State(n_participants)] + [language_dropdowns[j] for j in range(n_participants)],
+                [transcript_outputs[i]] + [k for j in zip(translated_texts[:i]+translated_texts[i+1:], dubbed_videos[:i]+dubbed_videos[i+1:]) for k in j]
            )
         minutes = gr.Textbox(label="Minutes of Meeting")
+        gr.Button(f"Generate Minutes of meeting").click(summarize, None, minutes)
         # Clear button to reset inputs and outputs
         clear_button.click(clear_all, None, [*video_inputs, *transcript_outputs, *translated_texts, *dubbed_videos, minutes])
     demo.queue().launch(debug=True, share=True)
+create_gradio_interface(n_participants, language_choices)