Spaces:

marquesafonso
/

multilang-asr-transcriber

Running

marquesafonso committed on Aug 31, 2024

Commit

55728fe

1 Parent(s): 27d74f3

add clean text transcription output

Files changed (2) hide show

app.py CHANGED Viewed

@@ -8,11 +8,12 @@ def main():
         video_file = gr.File(file_types=["video"],type="filepath", label="Upload a video")
         max_words_per_line = gr.Number(value=6, label="Max words per line")
         task = gr.Dropdown(choices=["transcribe", "translate"], value="transcribe", label="Select Task")
-        text_output = gr.Textbox(label="Text transcription", show_copy_button=True)
         srt_file = gr.File(file_count="single", type="filepath", file_types=[".srt"], label="SRT file")
         gr.Interface(transcriber,
                     inputs=[video_file, max_words_per_line, task],
-                    outputs=[text_output, srt_file],
                     allow_flagging="never")
     demo.launch()

         video_file = gr.File(file_types=["video"],type="filepath", label="Upload a video")
         max_words_per_line = gr.Number(value=6, label="Max words per line")
         task = gr.Dropdown(choices=["transcribe", "translate"], value="transcribe", label="Select Task")
+        text_output = gr.Textbox(label="SRT Text transcription", show_copy_button=True)
         srt_file = gr.File(file_count="single", type="filepath", file_types=[".srt"], label="SRT file")
+        text_clean_output = gr.Textbox(label="Text transcription", show_copy_button=True)
         gr.Interface(transcriber,
                     inputs=[video_file, max_words_per_line, task],
+                    outputs=[text_output, srt_file, text_clean_output],
                     allow_flagging="never")
     demo.launch()

src/transcriber.py CHANGED Viewed

@@ -23,6 +23,7 @@ def convert_seconds_to_time(seconds):
 def write_srt(segments, max_words_per_line, srt_path):
     with open(srt_path, "w", encoding='utf-8') as file:
         result = ''
         line_counter = 1
         for _, segment in enumerate(segments):
             words_in_line = []
@@ -35,11 +36,12 @@ def write_srt(segments, max_words_per_line, srt_path):
                         end_time = convert_seconds_to_time(words_in_line[-1].end)
                         line_text = ' '.join([w.word.strip() for w in words_in_line])
                         result += f"{line_counter}\n{start_time} --> {end_time}\n{line_text}\n\n"
                         # Reset for the next line and increment line counter
                         line_counter += 1
                     words_in_line = []  # Reset words list for the next line
         file.write(result)
-        return result, srt_path
 def transcriber(video_input:gr.File,
                 max_words_per_line:int,

 def write_srt(segments, max_words_per_line, srt_path):
     with open(srt_path, "w", encoding='utf-8') as file:
         result = ''
+        result_clean = []
         line_counter = 1
         for _, segment in enumerate(segments):
             words_in_line = []
                         end_time = convert_seconds_to_time(words_in_line[-1].end)
                         line_text = ' '.join([w.word.strip() for w in words_in_line])
                         result += f"{line_counter}\n{start_time} --> {end_time}\n{line_text}\n\n"
+                        result_clean += [line_text]
                         # Reset for the next line and increment line counter
                         line_counter += 1
                     words_in_line = []  # Reset words list for the next line
         file.write(result)
+        return result, srt_path, " ".join(result_clean)
 def transcriber(video_input:gr.File,
                 max_words_per_line:int,