Spaces:

djkesu
/

tortoise5c

Sleeping

djkesu committed on Sep 28, 2023

Commit

77c96db

•

1 Parent(s): f90475c

Started saving latents during voice creation

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,5 +1,3 @@
-# AGPL: a notification must be added stating that changes have been made to that file.
 import os
 import shutil
 from pathlib import Path
@@ -24,7 +22,6 @@ from app_utils.funcs import (
     load_voice_conditionings,
 )
 LATENT_MODES = [
     "Tortoise original (bad)",
     "average per 4.27s (broken on small files)",
@@ -71,11 +68,13 @@ def main():
                     bytes_data = uploaded_file.read()
                     with open(f"{voices_dir}voice_sample{index}.wav", "wb") as wav_file:
                         wav_file.write(bytes_data)
-                #create conditioning latents and save them
-                voice_samples, conditioning_latents = get_condi(
-                    [new_voice_name], []
-                )
                 st.session_state["text_input_key"] = str(randint(1000, 100000000))
                 st.session_state["file_uploader_key"] = str(randint(1000, 100000000))
                 st.experimental_rerun()
@@ -109,6 +108,7 @@ def main():
         help="Which voice preset to use.",
         index=1,
     )
     with st.expander("Advanced"):
         col1, col2 = st.columns(2)
         with col1:
@@ -126,7 +126,6 @@ def main():
             )
             sampler = st.radio(
                 "Sampler",
-                #SAMPLERS,
                 ["dpm++2m", "p", "ddim"],
                 help="Diffusion sampler. Note that dpm++2m is experimental and typically requires more steps.",
                 index=1,

 import os
 import shutil
 from pathlib import Path
     load_voice_conditionings,
 )
 LATENT_MODES = [
     "Tortoise original (bad)",
     "average per 4.27s (broken on small files)",
                     bytes_data = uploaded_file.read()
                     with open(f"{voices_dir}voice_sample{index}.wav", "wb") as wav_file:
                         wav_file.write(bytes_data)
+                # Generate conditioning latents and samples here
+                voice_samples, conditioning_latents = generate_conditioning(voices_dir)
+                # Save the conditioning latents and samples
+                save_conditioning(voices_dir, voice_samples, conditioning_latents)
                 st.session_state["text_input_key"] = str(randint(1000, 100000000))
                 st.session_state["file_uploader_key"] = str(randint(1000, 100000000))
                 st.experimental_rerun()
         help="Which voice preset to use.",
         index=1,
     )
     with st.expander("Advanced"):
         col1, col2 = st.columns(2)
         with col1:
             )
             sampler = st.radio(
                 "Sampler",
                 ["dpm++2m", "p", "ddim"],
                 help="Diffusion sampler. Note that dpm++2m is experimental and typically requires more steps.",
                 index=1,