File size: 1,847 Bytes
53aa97a |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 |
import puppeteer from "puppeteer"
import { downloadFileToTmp } from "../utils/downloadFileToTmp.mts"
export const state = {
load: 0
}
const instances: string[] = [
process.env.VC_VOICE_GENERATION_SPACE_API_URL
]
// TODO we should use an inference endpoint instead
export async function generateVoice(prompt: string, voiceFileName: string) {
if (state.load === instances.length) {
throw new Error(`all voice generation servers are busy, try again later..`)
}
state.load += 1
try {
const instance = instances.shift()
instances.push(instance)
console.log("instance:", instance)
const browser = await puppeteer.launch({
headless: true,
protocolTimeout: 800000,
})
try {
const page = await browser.newPage()
await page.goto(instance, {
waitUntil: "networkidle2",
})
await new Promise(r => setTimeout(r, 3000))
const firstTextarea = await page.$('textarea[data-testid="textbox"]')
await firstTextarea.type(prompt)
// console.log("looking for the button to submit")
const submitButton = await page.$("button.lg")
// console.log("clicking on the button")
await submitButton.click()
await page.waitForSelector("audio", {
timeout: 800000, // need to be large enough in case someone else attemps to use our space
})
const voiceRemoteUrl = await page.$$eval("audio", el => el.map(x => x.getAttribute("src"))[0])
console.log({
voiceRemoteUrl,
})
console.log(`- downloading ${voiceFileName} from ${voiceRemoteUrl}`)
await downloadFileToTmp(voiceRemoteUrl, voiceFileName)
return voiceFileName
} catch (err) {
throw err
} finally {
await browser.close()
}
} catch (err) {
throw err
} finally {
state.load -= 1
}
}
|