Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -1,167 +1,148 @@
|
|
1 |
-
|
|
|
2 |
import traceback
|
3 |
-
import
|
4 |
-
import glob
|
5 |
-
import asyncio
|
6 |
-
from image_fetcher import main
|
7 |
-
from video import create_text_image
|
8 |
-
from moviepy.editor import *
|
9 |
from PIL import Image
|
10 |
-
import
|
11 |
-
import numpy as np
|
12 |
from gtts import gTTS
|
13 |
from mutagen.mp3 import MP3
|
14 |
-
|
15 |
-
import
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
16 |
|
17 |
-
|
18 |
-
|
19 |
-
|
20 |
-
|
21 |
-
|
22 |
-
audio = MP3(filename)
|
23 |
duration = audio.info.length
|
24 |
-
IMAGE_PATH = "/tmp/images/slide"+str(id)+".png" # Ensure this path is correct
|
25 |
-
VIDEO_DURATION = duration # seconds
|
26 |
-
HIGHLIGHT_COLOR = (255, 255, 0) # Yellow highlight
|
27 |
-
HIGHLIGHT_OPACITY = 0.5 # Semi-transparent
|
28 |
-
|
29 |
-
# --- OCR STEP ---
|
30 |
-
img = Image.open(IMAGE_PATH)
|
31 |
-
data = pytesseract.image_to_data(img, output_type=pytesseract.Output.DICT)
|
32 |
-
|
33 |
-
# Extract words and their positions
|
34 |
-
words = []
|
35 |
-
for i in range(len(data['text'])):
|
36 |
-
word = data['text'][i].strip()
|
37 |
-
if word and int(data['conf'][i]) > 60:
|
38 |
-
x, y, w, h = data['left'][i], data['top'][i], data['width'][i], data['height'][i]
|
39 |
-
words.append({'text': word, 'box': (x, y, w, h)})
|
40 |
-
|
41 |
-
# --- BASE IMAGE CLIP ---
|
42 |
-
image_clip = ImageClip(IMAGE_PATH).set_duration(VIDEO_DURATION)
|
43 |
-
|
44 |
-
# --- HIGHLIGHT WORDS ONE BY ONE ---
|
45 |
-
n_words = len(words)
|
46 |
-
highlight_duration = VIDEO_DURATION / n_words
|
47 |
-
|
48 |
-
highlight_clips = []
|
49 |
-
|
50 |
-
for i, word in enumerate(words):
|
51 |
-
x, y, w, h = word['box']
|
52 |
-
start = i * highlight_duration
|
53 |
-
end = start + highlight_duration
|
54 |
-
|
55 |
-
# Create highlight rectangle
|
56 |
-
rect = ColorClip(size=(w, h), color=HIGHLIGHT_COLOR)
|
57 |
-
rect = rect.set_opacity(HIGHLIGHT_OPACITY).set_position((x, y)).set_start(start).set_end(end)
|
58 |
-
|
59 |
-
highlight_clips.append(rect)
|
60 |
-
|
61 |
-
# --- FINAL VIDEO --
|
62 |
-
|
63 |
-
final_clip = CompositeVideoClip([image_clip] + highlight_clips)
|
64 |
-
audio = AudioFileClip(filename)
|
65 |
-
final_clip = final_clip.set_audio(audio)
|
66 |
-
final_clip.write_videofile("/tmp/clip"+str(id)+".mp4", fps=24)
|
67 |
|
68 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
69 |
|
70 |
-
@app.route("/")
|
71 |
-
def home():
|
72 |
-
return "Flask Video Generator is Running"
|
73 |
|
74 |
@app.route("/generate", methods=["POST"])
|
75 |
def generate_video():
|
76 |
try:
|
77 |
data = request.get_json()
|
78 |
prompt = data.get("duration", '').strip()
|
79 |
-
prompts=prompt.replace("**","")
|
80 |
-
|
81 |
-
if prompts
|
82 |
-
return jsonify({"error": "prompts be
|
83 |
-
|
84 |
-
|
85 |
-
#asyncio.run(main(line))
|
86 |
-
raw_lines = prompts.splitlines(keepends=False)
|
87 |
lines = []
|
88 |
-
|
89 |
i = 0
|
|
|
90 |
while i < len(raw_lines):
|
91 |
line = raw_lines[i].strip()
|
92 |
-
|
93 |
-
#
|
94 |
-
|
95 |
-
block = line # Start block with heading
|
96 |
i += 1
|
97 |
-
|
98 |
-
# Accumulate body lines until next heading or 5+ lines
|
99 |
paragraph_lines = []
|
|
|
100 |
while i < len(raw_lines):
|
101 |
next_line = raw_lines[i].strip()
|
102 |
-
|
103 |
-
# Stop if next line is a heading
|
104 |
-
if next_line.strip().startswith("#") and (next_line.endswith('?') or next_line.endswith(':')):
|
105 |
break
|
106 |
-
|
107 |
paragraph_lines.append(next_line)
|
108 |
i += 1
|
109 |
-
|
110 |
-
# If we've gathered enough lines for a slide, break to next
|
111 |
if len(paragraph_lines) >= 5:
|
112 |
break
|
113 |
-
|
114 |
-
# Combine heading + paragraph
|
115 |
if paragraph_lines:
|
116 |
block += '\n' + '\n'.join(paragraph_lines)
|
117 |
-
|
118 |
lines.append(block)
|
119 |
-
|
120 |
else:
|
121 |
-
# Group normal lines (not part of any heading)
|
122 |
block_lines = []
|
123 |
count = 0
|
124 |
-
|
125 |
while i < len(raw_lines) and count < 5:
|
126 |
next_line = raw_lines[i].strip()
|
127 |
-
|
128 |
-
# If this is a heading, break to handle it separately
|
129 |
-
if next_line.strip().startswith("#") and (next_line.endswith('?') or next_line.endswith(':')):
|
130 |
break
|
131 |
-
|
132 |
block_lines.append(next_line)
|
133 |
i += 1
|
134 |
count += 1
|
135 |
-
|
136 |
if block_lines:
|
137 |
lines.append('\n'.join(block_lines))
|
138 |
-
|
139 |
-
#
|
140 |
-
|
141 |
-
image_olst=[]
|
142 |
for id in range(len(lines)):
|
143 |
-
|
|
|
144 |
for i in range(len(lines)):
|
145 |
-
video_func(i,lines)
|
146 |
-
|
147 |
-
for id in range(len(lines))
|
148 |
-
clip = VideoFileClip(f"clip{id}.mp4")
|
149 |
-
clips.append(clip)
|
150 |
-
|
151 |
final_video = concatenate_videoclips(clips)
|
152 |
-
|
|
|
|
|
|
|
153 |
for img in image_olst:
|
154 |
os.remove(img)
|
155 |
|
156 |
-
return send_file(
|
157 |
|
158 |
except Exception as e:
|
159 |
traceback.print_exc()
|
160 |
return jsonify({"error": str(e)}), 500
|
161 |
|
|
|
|
|
|
|
|
|
|
|
|
|
162 |
if __name__ == "__main__":
|
163 |
app.run(host="0.0.0.0", port=7860)
|
164 |
|
165 |
-
# Example call (remove or change in your actual app)
|
166 |
-
|
167 |
|
|
|
1 |
+
import os
|
2 |
+
import tempfile
|
3 |
import traceback
|
4 |
+
from flask import Flask, request, jsonify, send_file
|
|
|
|
|
|
|
|
|
|
|
5 |
from PIL import Image
|
6 |
+
from moviepy.editor import *
|
|
|
7 |
from gtts import gTTS
|
8 |
from mutagen.mp3 import MP3
|
9 |
+
import pytesseract
|
10 |
+
import numpy as np
|
11 |
+
|
12 |
+
# Flask application object; the @app.route decorators in this file register their views on it.
app = Flask(__name__)
|
13 |
+
|
14 |
+
def video_func(id, lines, lang="ta"):
    """Render slide ``id`` as a narrated clip with word-by-word highlighting.

    The text ``lines[id]`` is converted to speech with gTTS, the slide image
    ``/tmp/images/slide{id}.png`` is OCR'd with pytesseract, and a yellow
    semi-transparent rectangle is shown over each confidently recognised word
    in turn, each for an equal share of the narration length. The result is
    written to ``/tmp/clip{id}.mp4`` at 24 fps.

    Args:
        id: Index of the slide; selects both ``lines[id]`` and the file names.
            (Shadows the builtin, but the name is kept for existing callers.)
        lines: Sequence of slide texts.
        lang: gTTS language code for the narration. Defaults to ``"ta"``,
            the value that used to be hard-coded.

    Raises:
        Exception: Any failure is logged and then re-raised. Swallowing it
            would leave the caller to open a missing clip, or a stale one
            left by an earlier run with the same ``id``.
    """
    audio_path = None
    opened_clips = []  # everything that holds a reader/file handle and must be closed
    try:
        # delete=False + leaving the ``with`` block: we only need a reserved
        # path that gTTS and moviepy can reopen by name.
        with tempfile.NamedTemporaryFile(delete=False, suffix='.mp3') as handle:
            audio_path = handle.name

        # Text-to-speech; the narration length drives the clip length.
        gTTS(text=lines[id], lang=lang, slow=False).save(audio_path)
        video_duration = MP3(audio_path).info.length

        image_path = f"/tmp/images/slide{id}.png"
        highlight_color = (255, 255, 0)
        highlight_opacity = 0.5

        # OCR: locate the words on the slide image.
        with Image.open(image_path) as img:
            ocr = pytesseract.image_to_data(img, output_type=pytesseract.Output.DICT)
        boxes = _confident_word_boxes(ocr)

        image_clip = ImageClip(image_path).set_duration(video_duration)
        opened_clips.append(image_clip)

        # max(..., 1) avoids a division by zero when OCR finds no words.
        highlight_duration = video_duration / max(len(boxes), 1)
        highlight_clips = []
        for index, (x, y, w, h) in enumerate(boxes):
            start = index * highlight_duration
            rect = ColorClip(size=(w, h), color=highlight_color)
            rect = (
                rect.set_opacity(highlight_opacity)
                .set_position((x, y))
                .set_start(start)
                .set_end(start + highlight_duration)
            )
            highlight_clips.append(rect)

        narration = AudioFileClip(audio_path)
        opened_clips.append(narration)

        final_clip = CompositeVideoClip([image_clip] + highlight_clips)
        final_clip = final_clip.set_audio(narration)
        opened_clips.append(final_clip)
        final_clip.write_videofile(f"/tmp/clip{id}.mp4", fps=24)

    except Exception as e:
        print(f"Error in video_func for ID {id}: {e}")
        traceback.print_exc()
        raise
    finally:
        # Release readers before deleting the audio file they may still hold open.
        for clip in reversed(opened_clips):
            try:
                clip.close()
            except Exception:
                traceback.print_exc()
        if audio_path is not None and os.path.exists(audio_path):
            os.remove(audio_path)


def _confident_word_boxes(ocr, min_conf=60):
    """Return ``(x, y, w, h)`` boxes of non-blank OCR words scoring above *min_conf*.

    *ocr* is the dict returned by ``pytesseract.image_to_data(..., Output.DICT)``.
    Confidence is parsed with ``float`` because it may arrive as a float-formatted
    string (e.g. ``"95.3"``), which ``int`` would reject.
    """
    columns = zip(
        ocr['text'], ocr['conf'],
        ocr['left'], ocr['top'], ocr['width'], ocr['height'],
    )
    return [
        (x, y, w, h)
        for text, conf, x, y, w, h in columns
        if text.strip() and float(conf) > min_conf
    ]
|
67 |
|
|
|
|
|
|
|
68 |
|
69 |
@app.route("/generate", methods=["POST"])
def generate_video():
    """Build a narrated slide video from the posted text and return it as MP4.

    Expects a JSON object whose ``"duration"`` key carries the prompt text
    (the key name is part of the existing client contract and is kept as is).
    ``**`` markers are stripped, the text is split into slides, one image and
    one clip are produced per slide, and the clips are concatenated into
    ``/tmp/final_output.mp4``.

    Returns:
        The MP4 file on success; a JSON ``{"error": ...}`` body with status
        400 for unusable input or 500 for any failure during rendering.
    """
    image_olst = []   # slide image paths, filled in by create_text_image
    clip_paths = []   # per-slide clip files written by video_func
    clips = []
    final_video = None
    try:
        # silent=True: a missing or malformed JSON body yields None, not an exception.
        data = request.get_json(silent=True)
        if not isinstance(data, dict):
            return jsonify({"error": "request body must be a JSON object"}), 400

        prompt = data.get("duration", '')
        if not isinstance(prompt, str):
            return jsonify({"error": "prompts must be a string"}), 400

        prompts = prompt.replace("**", "").strip()
        if not prompts:
            return jsonify({"error": "prompts must not be empty"}), 400

        lines = _split_into_slides(prompts)
        if not lines:
            return jsonify({"error": "prompts must not be empty"}), 400

        # NOTE(review): this file calls create_text_image without importing it at
        # module level; an earlier revision imported it from the project's
        # `video` module, so it is imported here. Confirm the module is deployed.
        from video import create_text_image

        # Slide image creation
        for slide_id, text in enumerate(lines):
            create_text_image(text, slide_id, image_olst)

        # Recorded before rendering so partially produced clips are cleaned up too.
        clip_paths = [f"/tmp/clip{slide_id}.mp4" for slide_id in range(len(lines))]
        for slide_id in range(len(lines)):
            video_func(slide_id, lines)

        for path in clip_paths:
            clips.append(VideoFileClip(path))

        final_video = concatenate_videoclips(clips)
        output_path = "/tmp/final_output.mp4"
        final_video.write_videofile(output_path, fps=24)

        return send_file(output_path, mimetype='video/mp4')

    except Exception as e:
        traceback.print_exc()
        return jsonify({"error": str(e)}), 500

    finally:
        # Close readers first so the files they hold can be deleted.
        for clip in [final_video, *clips]:
            if clip is None:
                continue
            try:
                clip.close()
            except Exception:
                traceback.print_exc()
        # Best-effort removal of intermediates; never mask the response.
        for path in [*clip_paths, *image_olst]:
            try:
                os.remove(path)
            except FileNotFoundError:
                pass
            except OSError:
                traceback.print_exc()


def _is_heading(text):
    """Return True for a slide heading: starts with '#' and ends with '?' or ':'."""
    return text.startswith("#") and text.endswith(('?', ':'))


def _split_into_slides(text, max_lines=5):
    """Group the lines of *text* into slide-sized blocks.

    A heading line opens a block and is followed by up to *max_lines* body
    lines; lines outside any heading are grouped in runs of up to *max_lines*.
    A block always ends before the next heading. Blocks that contain only
    whitespace are dropped because they have no text to narrate.
    """
    raw_lines = [raw.strip() for raw in text.splitlines()]
    slides = []
    i = 0
    while i < len(raw_lines):
        block = []
        if _is_heading(raw_lines[i]):
            block.append(raw_lines[i])
            i += 1

        taken = 0
        while i < len(raw_lines) and taken < max_lines and not _is_heading(raw_lines[i]):
            block.append(raw_lines[i])
            i += 1
            taken += 1

        joined = '\n'.join(block)
        if joined.strip():
            slides.append(joined)
    return slides
|
138 |
|
139 |
+
|
140 |
+
@app.route("/")
def home():
    """Liveness endpoint: answer with a fixed plain-text status message."""
    status_message = "Flask Video Generator is Running"
    return status_message
|
143 |
+
|
144 |
+
|
145 |
if __name__ == "__main__":
    # Started as a script: serve on every interface, port 7860.
    app.run(port=7860, host="0.0.0.0")
|
147 |
|
|
|
|
|
148 |
|