Spaces:
Running
Running
File size: 5,932 Bytes
0931910 dc92d10 0931910 dc92d10 0931910 20172dc bd49a31 20172dc 89dc4a6 bd49a31 20172dc 89dc4a6 bd49a31 89dc4a6 20172dc 89dc4a6 bd49a31 fe7b9b7 20172dc 89dc4a6 20172dc bd49a31 20172dc 183d840 d89ea65 183d840 595d5ff 183d840 662a135 38f204d 662a135 595d5ff 662a135 183d840 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 |
js_update_ipa_output = """
function updateCssText(text, letters, idxSelectedWord) {
let wordsArr = text.split(" ")
let lettersWordsArr = letters.split(" ")
let speechOutputContainer = document.querySelector('#speech-output');
speechOutputContainer.textContent = ""
for (let idx in wordsArr) {
let word = wordsArr[idx]
let letterIsCorrect = lettersWordsArr[idx]
for (let idx1 in word) {
let letterCorrect = letterIsCorrect[idx1] == "1"
let containerLetter = document.createElement("span")
let color = letterCorrect ? 'green' : "red"
containerLetter.style.cssText = idx == idxSelectedWord ? `color: ${color}; text-decoration-line: underline;` : `color: ${color};`
containerLetter.innerText = word[idx1];
speechOutputContainer.appendChild(containerLetter)
}
let containerSpace = document.createElement("span")
containerSpace.textContent = " "
speechOutputContainer.appendChild(containerSpace)
}
}
"""
js_play_audio = """
function playAudio(text, language, sleepTime = 0) {
let voice_idx = 0;
let voice_synth = null;
let synth = window.speechSynthesis;
let voice_lang;
let sleepTimeAdditional = 500; // for some reason using this with a default input argument give an object instead of the correct number
function sleep (time) {
return new Promise((resolve) => setTimeout(resolve, time));
}
function setSpeech() {
return new Promise(
function (resolve, reject) {
let id;
id = setInterval(() => {
if (synth.getVoices().length !== 0) {
resolve(synth.getVoices());
clearInterval(id);
}
}, 10);
}
)
}
switch (language) {
case 'de':
voice_lang = 'de-DE';
break;
case 'en':
voice_lang = 'en-US';
break;
default:
const msg = `Error: language ${language} not valid!`
console.error(msg);
alert(msg)
throw new Error(msg)
}
let s = setSpeech();
s.then((voices) => {
let voicesSynth = voices.filter(voice => voice.lang === voice_lang);
if (voicesSynth.length === 0) {
console.error(`No voice found for language ${voice_lang}, retry for less restrictive check (startsWith)...`)
voicesSynth = voices.filter(voice => voice.lang.startsWith(language));
}
if (voicesSynth.length === 0) {
const msg = `Error: no voice found for language ${voice_lang} / ${language}, you should use the Text-To-Speech backend feature...`
console.error(msg);
alert(msg)
throw new Error(msg)
}
var utterThis = new SpeechSynthesisUtterance(text);
utterThis.voice = voicesSynth[0];
utterThis.rate = 0.7;
if (sleepTime > 0) {
sleepTime *= 1000;
sleepTime += sleepTimeAdditional;
}
console.log("start js_play_audio:: sleepTime:", sleepTime, "#")
sleep(sleepTime).then(() => {
synth.speak(utterThis);
})
// todo: capture audio from speech synthesis to reuse on the frontend
// https://stackoverflow.com/questions/45003548/how-to-capture-generated-audio-from-window-speechsynthesis-speak-call
});
}
"""
head_driver_tour = """
<link href="https://cdn.jsdelivr.net/npm/[email protected]/dist/driver.min.css" rel="stylesheet">
<script type="module">
import { driver } from 'https://cdn.jsdelivr.net/npm/[email protected]/+esm'
const driverSteps = [
{ element: "id-ai-pronunciation-trainer-gradio-app-container", popover: { title: "AI Pronunciation Trainer Gradio App", description: "A quick tour of the features of the Gradio app 'AI Pronunciation Trainer'." } },
{ element: "#id-choose-random-phrase-by-language-and-difficulty", popover: { title: "Choose a Random Phrase", description: "Choose a random sentence to be used as input for speech recognition, defining your own language and difficulty..." } },
{ element: "#accordion-examples-id-element", popover: { title: "Text Examples", description: "...Or start with these text examples, increasing in difficulty." } },
{ element: "#text-student-transcription-id-element", popover: { title: "Phrase to Read for Speech Recognition", description: "You can also write your own sentence." } },
{ element: "#btn-run-tts-id-element", popover: { title: "In-Browser Text-to-Speech", description: "Execute the text-to-speech functionality in the browser by reading the student's transcription." } },
{ element: "#btn-run-tts-backend-id-element", popover: { title: "Backend Text-to-Speech", description: "Execute the text-to-speech functionality in the backend by reading the student's transcription." } },
{ element: "#btn-clear-tts-backend-id-element", popover: { title: "Clear Text-to-Speech", description: "Clear the synthetic audio output of the text-to-speech synthesis." } },
{ element: ".speech-output-group", popover: { title: "Detailed Speech Accuracy Output", description: "Detailed output of speech accuracy, word by word." } },
{ element: "#id-replay-splitted-audio-by-words", popover: { title: "Replay Split Audio by Words", description: "Replay your recorded audio split into single words followed by the 'ideal' pronunciation spelled by the text-to-speech audio output for the same word." } },
{ element: "#accordion-models-env-variables-id-element", popover: { title: "Environment variables in use now", description: "Show the environment variables in use right now (e.g. speech-to-text models, samplerate values, etc)." } },
];
const driverObj = driver({
showProgress: true,
steps: driverSteps
});
driverObj.drive();
</script>
"""
|