Spaces:
Sleeping
Sleeping
File size: 3,862 Bytes
3fdcc70 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 |
import io
import os
import os.path as osp
import uuid
import requests
from pathlib import Path
import av
import numpy as np
import moviepy.editor as mpe
from cllm.services.utils import get_bytes_value
__ALL__ = [
"video_classification",
"video_captioning",
"image_to_video",
"text_to_video",
"video_to_webpage",
"dub_video",
]
HOST = os.environ.get("CLLM_SERVICES_HOST", "localhost")
PORT = os.environ.get("CLLM_SERVICES_PORT", 10056)
def setup(host="localhost", port=10056):
global HOST, PORT
HOST = host
PORT = port
def video_classification(video: str | Path | bytes, **kwargs):
host = kwargs.get("host", HOST)
port = kwargs.get("port", PORT)
url = f"http://{host}:{port}/video_classification"
files = {"video": (video, get_bytes_value(video))}
response = requests.post(url, files=files)
return response.json()
def video_captioning(video: str | Path, **kwargs):
host = kwargs.get("host", HOST)
port = kwargs.get("port", PORT)
url = f"http://{host}:{port}/video_captioning"
files = {"video": (video, get_bytes_value(video))}
response = requests.post(url, files=files)
return response.json()
def image_audio_to_video(image: str | Path, audio: str | Path, **kwargs):
host = kwargs.get("host", HOST)
port = kwargs.get("port", PORT)
url = f"http://{host}:{port}/image_audio_to_video"
files = {
"image": (image, get_bytes_value(image)),
"audio": (audio, get_bytes_value(audio)),
}
response = requests.post(url, files=files)
return response.content
def image_to_video(image: str | Path, **kwargs):
host = kwargs.get("host", HOST)
port = kwargs.get("port", PORT)
url = f"http://{host}:{port}/image_to_video"
files = {"image": (image, get_bytes_value(image))}
response = requests.post(url, files=files)
return response.content
def text_to_video(prompt: str, **kwargs):
host = kwargs.get("host", HOST)
port = kwargs.get("port", PORT)
url = f"http://{host}:{port}/text_to_video"
data = {"prompt": prompt}
response = requests.post(url, data=data)
return response.content
def video_to_webpage(
video: str | Path,
title: str,
tags: list[str],
description: str,
**kwargs,
):
host = kwargs.get("host", HOST)
port = kwargs.get("port", PORT)
url = f"http://{host}:{port}/video_to_webpage"
files = {"video": (video, get_bytes_value(video))}
data = {
"title": title,
"tags": tags,
"description": description,
}
response = requests.post(url, files=files, data=data)
return response.json()
def dub_video(video: str | Path | bytes, audio: str | Path | bytes, **kwargs):
root_dir = kwargs["root_dir"]
vid_file_location = osp.join(root_dir, video)
aud_file_location = osp.join(root_dir, audio)
video = mpe.VideoFileClip(vid_file_location)
# read audio file
audio = mpe.AudioFileClip(aud_file_location)
# set audio for video
new_video = video.set_audio(audio)
# export the video file
save_path = osp.join(root_dir, f"new_{str(uuid.uuid4())[:6]}.mp4")
new_video.write_videofile(save_path)
return open(save_path, "rb").read()
def decoding_key_frames(video: str | Path | bytes, **kwargs):
video = io.BytesIO(get_bytes_value(video))
container = av.open(video)
# extract evenly spaced frames from video
seg_len = container.streams.video[0].frames
indices = set(np.linspace(0, seg_len, num=4, endpoint=False).astype(np.int64))
frames = []
container.seek(0)
for i, frame in enumerate(container.decode(video=0)):
if i in indices:
stream = io.BytesIO()
# frame = frame.to_image().save(f"frame_{i}.png")
frame = frame.to_image().save(stream)
frames.append(frame)
return frames
|