File size: 1,280 Bytes
efb4cb8 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 |
import cv2
from moviepy.editor import VideoFileClip
from gemini_vision import process_frame_with_gemini, summarize_with_gemini, extract_code_with_gemini
def frame_generator(video_path):
video = cv2.VideoCapture(video_path)
while True:
ret, frame = video.read()
if not ret:
break
yield frame
video.release()
def process_video(video_path, summary_words):
# Process frames with Gemini Vision Pro
extracted_text = ""
for frame in frame_generator(video_path):
extracted_text += process_frame_with_gemini(frame) + " "
# Extract audio and transcribe
video = VideoFileClip(video_path)
audio = video.audio
audio_path = "temp_audio.wav"
audio.write_audiofile(audio_path)
# Use Gemini Vision Pro for transcription (assuming it can handle audio)
transcription = process_frame_with_gemini(audio_path, mode="audio")
# Summarize content using Gemini
summary = summarize_with_gemini(transcription, max_words=summary_words)
# Extract code using Gemini
extracted_code = extract_code_with_gemini(transcription)
return {
'summary': summary,
'extracted_text': extracted_text,
'transcription': transcription,
'extracted_code': extracted_code
} |