Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -48,20 +48,13 @@ def write_srt(transcription, output_file, tokenizer=None, translation_model=None
|
|
48 |
def save_as_word(transcription, file_name, tokenizer=None, translation_model=None):
|
49 |
doc = Document()
|
50 |
doc.add_heading('Video Subtitles', 0)
|
51 |
-
for
|
52 |
-
start = segment['start']
|
53 |
-
end = segment['end']
|
54 |
text = segment['text']
|
55 |
|
56 |
if translation_model:
|
57 |
text = translate_text(text, tokenizer, translation_model)
|
58 |
|
59 |
-
|
60 |
-
end_time = whisper.utils.format_timestamp(end)
|
61 |
-
|
62 |
-
doc.add_paragraph(f"{i + 1}")
|
63 |
-
doc.add_paragraph(f"{start_time} --> {end_time}")
|
64 |
-
doc.add_paragraph(f"{text.strip()}\n")
|
65 |
|
66 |
word_file = f"{file_name}.docx"
|
67 |
doc.save(word_file)
|
@@ -74,19 +67,12 @@ def save_as_pdf(transcription, file_name, tokenizer=None, translation_model=None
|
|
74 |
pdf.set_font("Arial", size=12)
|
75 |
pdf.cell(200, 10, txt="Video Subtitles", ln=True, align="C")
|
76 |
|
77 |
-
for
|
78 |
-
start = segment['start']
|
79 |
-
end = segment['end']
|
80 |
text = segment['text']
|
81 |
|
82 |
if translation_model:
|
83 |
text = translate_text(text, tokenizer, translation_model)
|
84 |
|
85 |
-
start_time = whisper.utils.format_timestamp(start)
|
86 |
-
end_time = whisper.utils.format_timestamp(end)
|
87 |
-
|
88 |
-
pdf.cell(200, 10, txt=f"{i + 1}", ln=True)
|
89 |
-
pdf.cell(200, 10, txt=f"{start_time} --> {end_time}", ln=True)
|
90 |
pdf.multi_cell(200, 10, txt=f"{text.strip()}\n")
|
91 |
|
92 |
pdf_file = f"{file_name}.pdf"
|
@@ -97,23 +83,18 @@ def save_as_powerpoint(transcription, file_name, tokenizer=None, translation_mod
|
|
97 |
prs = Presentation()
|
98 |
slide_layout = prs.slide_layouts[1] # Title and Content layout
|
99 |
|
100 |
-
for
|
101 |
-
start = segment['start']
|
102 |
-
end = segment['end']
|
103 |
text = segment['text']
|
104 |
|
105 |
if translation_model:
|
106 |
text = translate_text(text, tokenizer, translation_model)
|
107 |
|
108 |
-
start_time = whisper.utils.format_timestamp(start)
|
109 |
-
end_time = whisper.utils.format_timestamp(end)
|
110 |
-
|
111 |
slide = prs.slides.add_slide(slide_layout)
|
112 |
title = slide.shapes.title
|
113 |
body = slide.shapes.placeholders[1]
|
114 |
|
115 |
-
title.text =
|
116 |
-
body.text =
|
117 |
|
118 |
ppt_file = f"{file_name}.pptx"
|
119 |
prs.save(ppt_file)
|
|
|
48 |
def save_as_word(transcription, file_name, tokenizer=None, translation_model=None):
|
49 |
doc = Document()
|
50 |
doc.add_heading('Video Subtitles', 0)
|
51 |
+
for segment in transcription['segments']:
|
|
|
|
|
52 |
text = segment['text']
|
53 |
|
54 |
if translation_model:
|
55 |
text = translate_text(text, tokenizer, translation_model)
|
56 |
|
57 |
+
doc.add_paragraph(text.strip())
|
|
|
|
|
|
|
|
|
|
|
58 |
|
59 |
word_file = f"{file_name}.docx"
|
60 |
doc.save(word_file)
|
|
|
67 |
pdf.set_font("Arial", size=12)
|
68 |
pdf.cell(200, 10, txt="Video Subtitles", ln=True, align="C")
|
69 |
|
70 |
+
for segment in transcription['segments']:
|
|
|
|
|
71 |
text = segment['text']
|
72 |
|
73 |
if translation_model:
|
74 |
text = translate_text(text, tokenizer, translation_model)
|
75 |
|
|
|
|
|
|
|
|
|
|
|
76 |
pdf.multi_cell(200, 10, txt=f"{text.strip()}\n")
|
77 |
|
78 |
pdf_file = f"{file_name}.pdf"
|
|
|
83 |
prs = Presentation()
|
84 |
slide_layout = prs.slide_layouts[1] # Title and Content layout
|
85 |
|
86 |
+
for segment in transcription['segments']:
|
|
|
|
|
87 |
text = segment['text']
|
88 |
|
89 |
if translation_model:
|
90 |
text = translate_text(text, tokenizer, translation_model)
|
91 |
|
|
|
|
|
|
|
92 |
slide = prs.slides.add_slide(slide_layout)
|
93 |
title = slide.shapes.title
|
94 |
body = slide.shapes.placeholders[1]
|
95 |
|
96 |
+
title.text = "Subtitle"
|
97 |
+
body.text = text.strip()
|
98 |
|
99 |
ppt_file = f"{file_name}.pptx"
|
100 |
prs.save(ppt_file)
|