VideoChain-API / src /production /generateVoice.mts
jbilcke-hf's picture
jbilcke-hf HF staff
VS -> VC
12506f0
raw
history blame
1.39 kB
import puppeteer from "puppeteer"
import { downloadFileToTmp } from "../utils/downloadFileToTmp.mts"
const instances: string[] = [
process.env.VC_VOICE_GENERATION_SPACE_API_URL
]
// TODO we should use an inference endpoint instead
export async function generateVoice(prompt: string, voiceFileName: string) {
const instance = instances.shift()
instances.push(instance)
console.log("instance:", instance)
const browser = await puppeteer.launch({
headless: false,
protocolTimeout: 800000,
})
const page = await browser.newPage()
await page.goto(instance, {
waitUntil: "networkidle2",
})
await new Promise(r => setTimeout(r, 3000))
const firstTextarea = await page.$('textarea[data-testid="textbox"]')
await firstTextarea.type(prompt)
// console.log("looking for the button to submit")
const submitButton = await page.$("button.lg")
// console.log("clicking on the button")
await submitButton.click()
await page.waitForSelector("audio", {
timeout: 800000, // need to be large enough in case someone else attemps to use our space
})
const voiceRemoteUrl = await page.$$eval("audio", el => el.map(x => x.getAttribute("src"))[0])
console.log({
voiceRemoteUrl,
})
console.log(`- downloading ${voiceFileName} from ${voiceRemoteUrl}`)
await downloadFileToTmp(voiceRemoteUrl, voiceFileName)
return voiceFileName
}