Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
import { v4 as uuidv4 } from "uuid" | |
import { Video, VideoShot } from "../types.mts" | |
import { generateVideo } from "../providers/video-generation/generateVideoWithZeroscope.mts" | |
import { upscaleVideo } from "../providers/video-upscaling/upscaleVideo.mts" | |
import { interpolateVideo } from "../providers/video-interpolation/interpolateVideo.mts" | |
import { postInterpolation } from "../production/postInterpolation.mts" | |
import { generateAudio } from "../providers/audio-generation/generateAudio.mts" | |
import { addAudioToVideo } from "../utils/video/addAudioToVideo.mts" | |
import { downloadFileToTmp } from "../utils/download/downloadFileToTmp.mts" | |
import { copyVideoFromTmpToPending } from "./copyVideoFromTmpToPending.mts" | |
import { saveAndCheckIfNeedToStop } from "./saveAndCheckIfNeedToStop.mts" | |
import { updateShotPreview } from "./updateShotPreview.mts" | |
import { enrichVideoSpecsUsingLLM } from "../providers/language-model/enrichVideoSpecsUsingLLM.mts" | |
export const processVideo = async (video: Video) => { | |
// just a an additional precaution, for consistency and robustness | |
if (["pause", "completed", "abort", "delete"].includes(video.status)) { return } | |
console.log(`processing video video ${video.id}`) | |
// always count 2 more steps: 1 for the LLM, 1 for the final assembly | |
let nbTotalSteps = 2 | |
for (const shot of video.shots) { | |
nbTotalSteps += shot.nbTotalSteps | |
} | |
let nbCompletedSteps = 0 | |
if (!video.hasGeneratedSpecs) { | |
try { | |
await enrichVideoSpecsUsingLLM(video) | |
} catch (err) { | |
console.error(`LLM error: ${err}`) | |
video.error = `LLM error: ${err}` | |
video.status = "delete" | |
if (await saveAndCheckIfNeedToStop(video)) { return } | |
} | |
nbCompletedSteps++ | |
video.hasGeneratedSpecs = true | |
video.progressPercent = Math.round((nbCompletedSteps / nbTotalSteps) * 100) | |
if (await saveAndCheckIfNeedToStop(video)) { return } | |
} | |
for (const shot of video.shots) { | |
nbCompletedSteps += shot.nbCompletedSteps | |
// skip shots completed previously | |
if (shot.completed) { | |
continue | |
} | |
console.log(`need to complete shot ${shot.id}`) | |
// currenty we cannot generate too many frames at once, | |
// otherwise the upscaler will have trouble | |
// so for now, we fix it to 24 frames | |
// const nbFramesForBaseModel = Math.min(3, Math.max(1, Math.round(duration))) * 8 | |
const nbFramesForBaseModel = 24 | |
if (!shot.hasGeneratedPreview) { | |
console.log("generating a preview of the final result..") | |
let generatedPreviewVideoUrl = "" | |
try { | |
generatedPreviewVideoUrl = await generateVideo(shot.shotPrompt, { | |
seed: shot.seed, | |
nbFrames: nbFramesForBaseModel, | |
nbSteps: 10, // for the preview, we only give a rough approximation | |
}) | |
console.log("downloading preview video..") | |
// download to /tmp | |
await downloadFileToTmp(generatedPreviewVideoUrl, shot.fileName) | |
await copyVideoFromTmpToPending(shot.fileName) | |
shot.hasGeneratedPreview = true | |
shot.nbCompletedSteps++ | |
nbCompletedSteps++ | |
shot.progressPercent = Math.round((shot.nbCompletedSteps / shot.nbTotalSteps) * 100) | |
video.progressPercent = Math.round((nbCompletedSteps / nbTotalSteps) * 100) | |
await updateShotPreview(video, shot) | |
if (await saveAndCheckIfNeedToStop(video)) { return } | |
} catch (err) { | |
console.error(`failed to generate preview for shot ${shot.id} (${err})`) | |
// something is wrong, let's put the whole thing back into the queue | |
video.error = `failed to generate preview for shot ${shot.id} (will try again later)` | |
if (await saveAndCheckIfNeedToStop(video)) { return } | |
// always try to yield whenever possible | |
return | |
} | |
} | |
const notAllShotsHavePreview = video.shots.some(s => !s.hasGeneratedPreview) | |
if (notAllShotsHavePreview)Β { | |
console.log(`step 2 isn't unlocked yet, because not all videos have generated preview`) | |
continue | |
} | |
if (!shot.hasGeneratedVideo) { | |
console.log("generating primordial pixel soup (raw video)..") | |
let generatedVideoUrl = "" | |
const nbFramesForBaseModel = 24 | |
try { | |
generatedVideoUrl = await generateVideo(shot.shotPrompt, { | |
seed: shot.seed, | |
nbFrames: nbFramesForBaseModel, | |
nbSteps: shot.steps, | |
}) | |
console.log("downloading video..") | |
await downloadFileToTmp(generatedVideoUrl, shot.fileName) | |
await copyVideoFromTmpToPending(shot.fileName) | |
shot.hasGeneratedVideo = true | |
shot.nbCompletedSteps++ | |
nbCompletedSteps++ | |
shot.progressPercent = Math.round((shot.nbCompletedSteps / shot.nbTotalSteps) * 100) | |
video.progressPercent = Math.round((nbCompletedSteps / nbTotalSteps) * 100) | |
await updateShotPreview(video, shot) | |
if (await saveAndCheckIfNeedToStop(video)) { return } | |
} catch (err) { | |
console.error(`failed to generate shot ${shot.id} (${err})`) | |
// something is wrong, let's put the whole thing back into the queue | |
video.error = `failed to generate shot ${shot.id} (will try again later)` | |
if (await saveAndCheckIfNeedToStop(video)) { return } | |
break | |
} | |
} | |
if (!shot.hasUpscaledVideo) { | |
console.log("upscaling video..") | |
try { | |
await upscaleVideo(shot.fileName, shot.shotPrompt) | |
shot.hasUpscaledVideo = true | |
shot.nbCompletedSteps++ | |
nbCompletedSteps++ | |
shot.progressPercent = Math.round((shot.nbCompletedSteps / shot.nbTotalSteps) * 100) | |
video.progressPercent = Math.round((nbCompletedSteps / nbTotalSteps) * 100) | |
await updateShotPreview(video, shot) | |
if (await saveAndCheckIfNeedToStop(video)) { return } | |
} catch (err) { | |
console.error(`failed to upscale shot ${shot.id} (${err})`) | |
// something is wrong, let's put the whole thing back into the queue | |
video.error = `failed to upscale shot ${shot.id} (will try again later)` | |
if (await saveAndCheckIfNeedToStop(video)) { return } | |
break | |
} | |
} | |
if (!shot.hasInterpolatedVideo) { | |
console.log("interpolating video..") | |
// ATTENTION 1: | |
// the interpolation step always create a SLOW MOTION video | |
// it means it can last a lot longer (eg. 2x, 3x, 4x.. longer) | |
// than the duration generated by the original video model | |
// ATTENTION 2: | |
// the interpolation step generates videos in 910x512! | |
// ATTENTION 3: | |
// the interpolation step parameters are currently not passed to the space, | |
// so changing those two variables below will have no effect! | |
const interpolationSteps = 2 | |
const interpolatedFramesPerSecond = 30 | |
console.log('creating slow-mo video (910x512 @ 30 FPS)') | |
try { | |
await interpolateVideo( | |
shot.fileName, | |
interpolationSteps, | |
interpolatedFramesPerSecond | |
) | |
shot.hasInterpolatedVideo = true | |
shot.nbCompletedSteps++ | |
nbCompletedSteps++ | |
shot.progressPercent = Math.round((shot.nbCompletedSteps / shot.nbTotalSteps) * 100) | |
video.progressPercent = Math.round((nbCompletedSteps / nbTotalSteps) * 100) | |
// note: showing the intermediary result isn't very interesting here | |
// with our current interpolation settings, the 3 seconds video generated by the model | |
// become a 7 seconds video, at 30 FPS | |
// so we want to scale it back to the desired duration length | |
// also, as a last trick we want to upscale it (without AI) and add some FXs | |
console.log('performing final scaling (1280x720 @ 30 FPS)') | |
try { | |
await postInterpolation(shot.fileName, shot.durationMs, shot.fps, shot.noiseAmount) | |
shot.hasPostProcessedVideo = true | |
shot.nbCompletedSteps++ | |
nbCompletedSteps++ | |
shot.progressPercent = Math.round((shot.nbCompletedSteps / shot.nbTotalSteps) * 100) | |
video.progressPercent = Math.round((nbCompletedSteps / nbTotalSteps) * 100) | |
await updateShotPreview(video, shot) | |
if (await saveAndCheckIfNeedToStop(video)) { return } | |
} catch (err) { | |
throw err | |
} | |
} catch (err) { | |
console.error(`failed to interpolate and post-process shot ${shot.id} (${err})`) | |
// something is wrong, let's put the whole thing back into the queue | |
video.error = `failed to interpolate and shot ${shot.id} (will try again later)` | |
if (await saveAndCheckIfNeedToStop(video)) { return } | |
break | |
} | |
} | |
let foregroundAudioFileName = `${video.ownerId}_${video.id}_${shot.id}_${uuidv4()}.m4a` | |
if (!shot.hasGeneratedForegroundAudio) { | |
if (shot.foregroundAudioPrompt) { | |
console.log("generating foreground audio..") | |
try { | |
await generateAudio(shot.foregroundAudioPrompt, foregroundAudioFileName) | |
shot.hasGeneratedForegroundAudio = true | |
shot.nbCompletedSteps++ | |
nbCompletedSteps++ | |
shot.progressPercent = Math.round((shot.nbCompletedSteps / shot.nbTotalSteps) * 100) | |
video.progressPercent = Math.round((nbCompletedSteps / nbTotalSteps) * 100) | |
await addAudioToVideo(shot.fileName, foregroundAudioFileName) | |
await updateShotPreview(video, shot) | |
if (await saveAndCheckIfNeedToStop(video)) { return } | |
} catch (err) { | |
console.error(`failed to generate foreground audio for ${shot.id} (${err})`) | |
// something is wrong, let's put the whole thing back into the queue | |
video.error = `failed to generate foreground audio ${shot.id} (will try again later)` | |
if (await saveAndCheckIfNeedToStop(video)) { return } | |
break | |
} | |
} else { | |
shot.hasGeneratedForegroundAudio = true | |
shot.nbCompletedSteps++ | |
nbCompletedSteps++ | |
shot.progressPercent = Math.round((shot.nbCompletedSteps / shot.nbTotalSteps) * 100) | |
video.progressPercent = Math.round((nbCompletedSteps / nbTotalSteps) * 100) | |
if (await saveAndCheckIfNeedToStop(video)) { return } | |
} | |
} | |
shot.completed = true | |
shot.completedAt = new Date().toISOString() | |
shot.progressPercent = 100 | |
video.nbCompletedShots++ | |
if (await saveAndCheckIfNeedToStop(video)) { return } | |
} | |
console.log(`end of the loop:`) | |
console.log(`nb completed shots: ${video.nbCompletedShots}`) | |
console.log(`len of the shot array: ${video.shots.length}`) | |
// now time to check the end game | |
if (video.nbCompletedShots === video.shots.length) { | |
console.log(`we have finished each individual shot!`) | |
if (!video.hasAssembledVideo) { | |
video.hasAssembledVideo = true | |
} | |
/* | |
console.log(`assembling the final..`) | |
console.log(`note: this might be redundant..`) | |
if (!video.hasAssembledVideo) { | |
video.hasAssembledVideo = true | |
if (video.shots.length === 1) { | |
console.log(`we only have one shot, so this gonna be easy`) | |
video.hasAssembledVideo = true | |
// the single shot (so, the first) becomes the final movie | |
await copyVideoFromPendingToCompleted(video.shots[0].fileName, video.fileName) | |
if (await saveAndCheckIfNeedToStop(video)) { return } | |
} else { | |
console.log(`assembling ${video.shots.length} shots together, might take a while`) | |
try { | |
await assembleShots(video.shots, video.fileName) | |
console.log(`finished assembling the ${video.shots.length} shots together!`) | |
await copyVideoFromPendingToCompleted(video.fileName) | |
video.hasAssembledVideo = true | |
if (await saveAndCheckIfNeedToStop(video)) { return } | |
} catch (err) { | |
console.error(`failed to assemble the shots together (${err})`) | |
// something is wrong, let's put the whole thing back into the queue | |
video.error = `failed to assemble the shots together (will try again later)` | |
if (await saveAndCheckIfNeedToStop(video)) { return } | |
} | |
} | |
} | |
*/ | |
nbCompletedSteps++ | |
video.completed = true | |
if (await saveAndCheckIfNeedToStop(video)) { return } | |
} | |
} |