ChiBenevisamPas committed on
Commit
9a2739a
·
verified ·
1 Parent(s): bccbcad

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -25
app.py CHANGED
@@ -48,20 +48,13 @@ def write_srt(transcription, output_file, tokenizer=None, translation_model=None
48
  def save_as_word(transcription, file_name, tokenizer=None, translation_model=None):
49
  doc = Document()
50
  doc.add_heading('Video Subtitles', 0)
51
- for i, segment in enumerate(transcription['segments']):
52
- start = segment['start']
53
- end = segment['end']
54
  text = segment['text']
55
 
56
  if translation_model:
57
  text = translate_text(text, tokenizer, translation_model)
58
 
59
- start_time = whisper.utils.format_timestamp(start)
60
- end_time = whisper.utils.format_timestamp(end)
61
-
62
- doc.add_paragraph(f"{i + 1}")
63
- doc.add_paragraph(f"{start_time} --> {end_time}")
64
- doc.add_paragraph(f"{text.strip()}\n")
65
 
66
  word_file = f"{file_name}.docx"
67
  doc.save(word_file)
@@ -74,19 +67,12 @@ def save_as_pdf(transcription, file_name, tokenizer=None, translation_model=None
74
  pdf.set_font("Arial", size=12)
75
  pdf.cell(200, 10, txt="Video Subtitles", ln=True, align="C")
76
 
77
- for i, segment in enumerate(transcription['segments']):
78
- start = segment['start']
79
- end = segment['end']
80
  text = segment['text']
81
 
82
  if translation_model:
83
  text = translate_text(text, tokenizer, translation_model)
84
 
85
- start_time = whisper.utils.format_timestamp(start)
86
- end_time = whisper.utils.format_timestamp(end)
87
-
88
- pdf.cell(200, 10, txt=f"{i + 1}", ln=True)
89
- pdf.cell(200, 10, txt=f"{start_time} --> {end_time}", ln=True)
90
  pdf.multi_cell(200, 10, txt=f"{text.strip()}\n")
91
 
92
  pdf_file = f"{file_name}.pdf"
@@ -97,23 +83,18 @@ def save_as_powerpoint(transcription, file_name, tokenizer=None, translation_mod
97
  prs = Presentation()
98
  slide_layout = prs.slide_layouts[1] # Title and Content layout
99
 
100
- for i, segment in enumerate(transcription['segments']):
101
- start = segment['start']
102
- end = segment['end']
103
  text = segment['text']
104
 
105
  if translation_model:
106
  text = translate_text(text, tokenizer, translation_model)
107
 
108
- start_time = whisper.utils.format_timestamp(start)
109
- end_time = whisper.utils.format_timestamp(end)
110
-
111
  slide = prs.slides.add_slide(slide_layout)
112
  title = slide.shapes.title
113
  body = slide.shapes.placeholders[1]
114
 
115
- title.text = f"Subtitle {i + 1}"
116
- body.text = f"{start_time} --> {end_time}\n\n{text.strip()}"
117
 
118
  ppt_file = f"{file_name}.pptx"
119
  prs.save(ppt_file)
 
48
  def save_as_word(transcription, file_name, tokenizer=None, translation_model=None):
49
  doc = Document()
50
  doc.add_heading('Video Subtitles', 0)
51
+ for segment in transcription['segments']:
 
 
52
  text = segment['text']
53
 
54
  if translation_model:
55
  text = translate_text(text, tokenizer, translation_model)
56
 
57
+ doc.add_paragraph(text.strip())
 
 
 
 
 
58
 
59
  word_file = f"{file_name}.docx"
60
  doc.save(word_file)
 
67
  pdf.set_font("Arial", size=12)
68
  pdf.cell(200, 10, txt="Video Subtitles", ln=True, align="C")
69
 
70
+ for segment in transcription['segments']:
 
 
71
  text = segment['text']
72
 
73
  if translation_model:
74
  text = translate_text(text, tokenizer, translation_model)
75
 
 
 
 
 
 
76
  pdf.multi_cell(200, 10, txt=f"{text.strip()}\n")
77
 
78
  pdf_file = f"{file_name}.pdf"
 
83
  prs = Presentation()
84
  slide_layout = prs.slide_layouts[1] # Title and Content layout
85
 
86
+ for segment in transcription['segments']:
 
 
87
  text = segment['text']
88
 
89
  if translation_model:
90
  text = translate_text(text, tokenizer, translation_model)
91
 
 
 
 
92
  slide = prs.slides.add_slide(slide_layout)
93
  title = slide.shapes.title
94
  body = slide.shapes.placeholders[1]
95
 
96
+ title.text = "Subtitle"
97
+ body.text = text.strip()
98
 
99
  ppt_file = f"{file_name}.pptx"
100
  prs.save(ppt_file)