ebook2audiobookXTTS

Sleeping

App Files Files Community

drewThomasson committed on Oct 8, 2024

Commit

4a45bb8

verified ·

1 Parent(s): a105e1c

Update app.py

Browse files

Files changed (1) hide show

app.py +136 -81

app.py CHANGED Viewed

@@ -2,12 +2,38 @@ print("starting...")
 import argparse
-# Argument parser to handle optional parameters
-parser = argparse.ArgumentParser(description="Launch the Gradio app with optional share parameter.")
-parser.add_argument("--share", type=bool, default=False, help="Set to True to enable Gradio share link.")
 args = parser.parse_args()
 import os
 import shutil
 import subprocess
@@ -15,7 +41,6 @@ import re
 from pydub import AudioSegment
 import tempfile
 from pydub import AudioSegment
-import os
 import nltk
 from nltk.tokenize import sent_tokenize
 import sys
@@ -162,15 +187,24 @@ def create_m4b_from_chapters(input_dir, ebook_file, output_dir):
         except Exception as e:
             print(f"Error extracting eBook metadata or cover: {e}")
         return None
-    # Combine WAV files into a single file
-    def combine_wav_files(chapter_files, output_path):
         # Initialize an empty audio segment
         combined_audio = AudioSegment.empty()
-        # Sequentially append each file to the combined_audio
-        for chapter_file in chapter_files:
-            audio_segment = AudioSegment.from_wav(chapter_file)
-            combined_audio += audio_segment
         # Export the combined audio to the output file path
         combined_audio.export(output_path, format='wav')
         print(f"Combined audio saved to {output_path}")
@@ -234,7 +268,7 @@ def create_m4b_from_chapters(input_dir, ebook_file, output_dir):
-#this code right here isnt the book grabbing thing but its before to refrence in ordero to create the sepecial chapter labeled book thing with calibre idk some systems cant seem to get it so just in case but the next bit of code after this is the book grabbing code with booknlp
 import os
 import subprocess
 import ebooklib
@@ -682,78 +716,99 @@ def download_audiobooks():
     return list_audiobook_files(audiobook_output_path)
-language_options = [
-    "en", "es", "fr", "de", "it", "pt", "pl", "tr", "ru", "nl", "cs", "ar", "zh-cn", "ja", "hu", "ko"
-]
-theme = gr.themes.Soft(
-    primary_hue="blue",
-    secondary_hue="blue",
-    neutral_hue="blue",
-    text_size=gr.themes.sizes.text_md,
-)
 # Gradio UI setup
-with gr.Blocks(theme=theme) as demo:
-    gr.Markdown(
-    """
-    # eBook to Audiobook Converter
-    Transform your eBooks into immersive audiobooks with optional custom TTS models.
-    This interface is based on [Ebook2AudioBookXTTS](https://github.com/DrewThomasson/ebook2audiobookXTTS).
-    """
-    )
-    with gr.Row():
-        with gr.Column(scale=3):
-            ebook_file = gr.File(label="eBook File")
-            target_voice_file = gr.File(label="Target Voice File (Optional)")
-            language = gr.Dropdown(label="Language", choices=language_options, value="en")
-        with gr.Column(scale=3):
-            use_custom_model = gr.Checkbox(label="Use Custom Model")
-            custom_model_file = gr.File(label="Custom Model File (Optional)", visible=False)
-            custom_config_file = gr.File(label="Custom Config File (Optional)", visible=False)
-            custom_vocab_file = gr.File(label="Custom Vocab File (Optional)", visible=False)
-            custom_model_url = gr.Textbox(label="Custom Model Zip URL (Optional)", visible=False)
-    convert_btn = gr.Button("Convert to Audiobook", variant="primary")
-    output = gr.Textbox(label="Conversion Status")
-    audio_player = gr.Audio(label="Audiobook Player", type="filepath")
-    download_btn = gr.Button("Download Audiobook Files")
-    download_files = gr.File(label="Download Files", interactive=False)
-    convert_btn.click(
-        convert_ebook_to_audio,
-        inputs=[ebook_file, target_voice_file, language, use_custom_model, custom_model_file, custom_config_file, custom_vocab_file, custom_model_url],
-        outputs=[output, audio_player]
-    )
-    use_custom_model.change(
-        lambda x: [gr.update(visible=x)] * 4,
-        inputs=[use_custom_model],
-        outputs=[custom_model_file, custom_config_file, custom_vocab_file, custom_model_url]
-    )
-    download_btn.click(
-        download_audiobooks,
-        outputs=[download_files]
     )
-#demo.launch(share=True)
-#demo.launch() # Removing share = True for Gradio Interface
-# Get the correct local IP or localhost
-hostname = socket.gethostname()
-local_ip = socket.gethostbyname(hostname)
-# Ensure Gradio runs and prints the correct local IP
-print(f"Running on local URL: http://{local_ip}:7860")
-print(f"Running on local URL: http://localhost:7860")
-# Your Gradio launch command
-demo.launch(server_name="0.0.0.0", server_port=7860, share=args.share)

 import argparse
+language_options = [
+    "en", "es", "fr", "de", "it", "pt", "pl", "tr", "ru", "nl", "cs", "ar", "zh-cn", "ja", "hu", "ko"
+]
+# Convert the list of languages to a string to display in the help text
+language_options_str = ", ".join(language_options)
+# Argument parser to handle optional parameters with descriptions
+parser = argparse.ArgumentParser(
+    description="Convert eBooks to Audiobooks using a Text-to-Speech model. You can either launch the Gradio interface or run the script in headless mode for direct conversion.",
+    epilog="Example: python script.py --headless --ebook path_to_ebook --voice path_to_voice --language en --use_custom_model True --custom_model model.pth --custom_config config.json --custom_vocab vocab.json"
+)
+parser.add_argument("--share", type=bool, default=False, help="Set to True to enable a public shareable Gradio link. Defaults to False.")
+parser.add_argument("--headless", type=bool, default=False, help="Set to True to run in headless mode without the Gradio interface. Defaults to False.")
+parser.add_argument("--ebook", type=str, help="Path to the ebook file for conversion. Required in headless mode.")
+parser.add_argument("--voice", type=str, help="Path to the target voice file for TTS. Optional, uses a default voice if not provided.")
+parser.add_argument("--language", type=str, default="en",
+                    help=f"Language for the audiobook conversion. Options: {language_options_str}. Defaults to English (en).")
+parser.add_argument("--use_custom_model", type=bool, default=False,
+                    help="Set to True to use a custom TTS model. Defaults to False. Must be True to use custom models, otherwise you'll get an error.")
+parser.add_argument("--custom_model", type=str, help="Path to the custom model file (.pth). Required if using a custom model.")
+parser.add_argument("--custom_config", type=str, help="Path to the custom config file (config.json). Required if using a custom model.")
+parser.add_argument("--custom_vocab", type=str, help="Path to the custom vocab file (vocab.json). Required if using a custom model.")
+parser.add_argument("--custom_model_url", type=str,
+                    help=("URL to download the custom model as a zip file. Optional, but will be used if provided. "
+                          "Examples include David Attenborough's model: "
+                          "'https://huggingface.co/drewThomasson/xtts_David_Attenborough_fine_tune/resolve/main/Finished_model_files.zip?download=true'. "
+                          "More XTTS fine-tunes can be found on my Hugging Face at 'https://huggingface.co/drewThomasson'."))
 args = parser.parse_args()
 import os
 import shutil
 import subprocess
 from pydub import AudioSegment
 import tempfile
 from pydub import AudioSegment
 import nltk
 from nltk.tokenize import sent_tokenize
 import sys
         except Exception as e:
             print(f"Error extracting eBook metadata or cover: {e}")
         return None
+        # Combine WAV files into a single file
+    def combine_wav_files(chapter_files, output_path, batch_size=256):
         # Initialize an empty audio segment
         combined_audio = AudioSegment.empty()
+        # Process the chapter files in batches
+        for i in range(0, len(chapter_files), batch_size):
+            batch_files = chapter_files[i:i + batch_size]
+            batch_audio = AudioSegment.empty()  # Initialize an empty AudioSegment for the batch
+            # Sequentially append each file in the current batch to the batch_audio
+            for chapter_file in batch_files:
+                audio_segment = AudioSegment.from_wav(chapter_file)
+                batch_audio += audio_segment
+            # Combine the batch audio with the overall combined_audio
+            combined_audio += batch_audio
         # Export the combined audio to the output file path
         combined_audio.export(output_path, format='wav')
         print(f"Combined audio saved to {output_path}")
+# NOTE: This section is not the book-grabbing code itself; it comes before it and is referenced in order to create the special chapter-labeled book with Calibre. Some systems can't seem to get it, so it is kept here just in case. The next bit of code after this is the book-grabbing code that uses BookNLP.
 import os
 import subprocess
 import ebooklib
     return list_audiobook_files(audiobook_output_path)
 # Gradio UI setup
+def run_gradio_interface():
+    language_options = [
+        "en", "es", "fr", "de", "it", "pt", "pl", "tr", "ru", "nl", "cs", "ar", "zh-cn", "ja", "hu", "ko"
+    ]
+    theme = gr.themes.Soft(
+        primary_hue="blue",
+        secondary_hue="blue",
+        neutral_hue="blue",
+        text_size=gr.themes.sizes.text_md,
     )
+    with gr.Blocks(theme=theme) as demo:
+        gr.Markdown(
+        """
+        # eBook to Audiobook Converter
+        Transform your eBooks into immersive audiobooks with optional custom TTS models.
+        This interface is based on [Ebook2AudioBookXTTS](https://github.com/DrewThomasson/ebook2audiobookXTTS).
+        """
+        )
+        with gr.Row():
+            with gr.Column(scale=3):
+                ebook_file = gr.File(label="eBook File")
+                target_voice_file = gr.File(label="Target Voice File (Optional)")
+                language = gr.Dropdown(label="Language", choices=language_options, value="en")
+            with gr.Column(scale=3):
+                use_custom_model = gr.Checkbox(label="Use Custom Model")
+                custom_model_file = gr.File(label="Custom Model File (Optional)", visible=False)
+                custom_config_file = gr.File(label="Custom Config File (Optional)", visible=False)
+                custom_vocab_file = gr.File(label="Custom Vocab File (Optional)", visible=False)
+                custom_model_url = gr.Textbox(label="Custom Model Zip URL (Optional)", visible=False)
+        convert_btn = gr.Button("Convert to Audiobook", variant="primary")
+        output = gr.Textbox(label="Conversion Status")
+        audio_player = gr.Audio(label="Audiobook Player", type="filepath")
+        download_btn = gr.Button("Download Audiobook Files")
+        download_files = gr.File(label="Download Files", interactive=False)
+        convert_btn.click(
+            convert_ebook_to_audio,
+            inputs=[ebook_file, target_voice_file, language, use_custom_model, custom_model_file, custom_config_file, custom_vocab_file, custom_model_url],
+            outputs=[output, audio_player]
+        )
+        use_custom_model.change(
+            lambda x: [gr.update(visible=x)] * 4,
+            inputs=[use_custom_model],
+            outputs=[custom_model_file, custom_config_file, custom_vocab_file, custom_model_url]
+        )
+        download_btn.click(
+            download_audiobooks,
+            outputs=[download_files]
+        )
+    # Get the correct local IP or localhost
+    hostname = socket.gethostname()
+    local_ip = socket.gethostbyname(hostname)
+    # Ensure Gradio runs and prints the correct local IP
+    print(f"Running on local URL: http://{local_ip}:7860")
+    print(f"Running on local URL: http://localhost:7860")
+    # Launch Gradio app
+    demo.launch(server_name="0.0.0.0", server_port=7860, share=args.share)
+# Check if running in headless mode
+if args.headless:
+    if not args.ebook:
+        print("Error: In headless mode, you must specify an ebook file using --ebook.")
+        exit(1)
+    ebook_file_path = args.ebook
+    target_voice = args.voice if args.voice else None
+    custom_model = None
+    if args.use_custom_model:
+        custom_model = {
+            'model': args.custom_model,
+            'config': args.custom_config,
+            'vocab': args.custom_vocab
+        }
+    # Example headless execution
+    convert_ebook_to_audio(ebook_file_path, target_voice, args.language, args.use_custom_model, args.custom_model, args.custom_config, args.custom_vocab)
+else:
+    # Launch Gradio UI
+    run_gradio_interface()