Spaces:

GH111
/

wonderlore

Sleeping

App Files Community

GH111 committed on Dec 10, 2023

Commit

7da30cc

1 Parent(s): 82e33f9

Update app.py

Browse files

Files changed (1) hide show

app.py +50 -34

app.py CHANGED Viewed

@@ -1,64 +1,80 @@
 import gradio as gr
 from transformers import pipeline
 from gtts import gTTS
 from io import BytesIO
-from PIL import Image, ImageDraw, ImageFont
-from IPython.display import Audio
-# Create a text generation pipeline with GPT-2
-story_generator = pipeline("text-generation", model="EleutherAI/gpt-neo-1.3B")
 # Set the context for the storyteller
 messages = [{"role": "system", "content": "You are a magical storyteller, creating wonderful tales for kids. Make them imaginative and full of joy!"}]
 # Define the Storyteller function
-def StorytellerGPT(tell_story):
     messages.append({"role": "user", "content": tell_story})
-    # Generate story using Hugging Face's GPT-2
-    story_reply = story_generator(tell_story, max_length=100, num_return_sequences=1)[0]['generated_text']
     messages.append({"role": "assistant", "content": story_reply})
     # Convert text to speech
     tts = gTTS(text=story_reply, lang='en', slow=False)
     audio_io = BytesIO()
     tts.save(audio_io)
     audio_io.seek(0)
-    # Convert text to image
-    image = generate_dynamic_image(story_reply)
-    return story_reply, Audio(data=audio_io.read(), autoplay=True), image
-# Function to generate a dynamic image based on the story text
-def generate_dynamic_image(story_text):
-    # Create a blank image
-    image = Image.new("RGB", (500, 300), (255, 255, 255))
-    draw = ImageDraw.Draw(image)
-    # Use a truetype font file, replace "arial.ttf" with the path to your font file
-    font = ImageFont.truetype("arial.ttf", 20)
-    # Write the story text on the image
-    lines = [story_text[i:i+40] for i in range(0, len(story_text), 40)]
-    y_position = 10
-    for line in lines:
-        draw.text((10, y_position), line, font=font, fill=(0, 0, 0))
-        y_position += 30
-    return image
-# Create the Gradio Interface
 demo = gr.Interface(
-    fn=StorytellerGPT,
-    inputs="text",
     outputs=["text", "audio", "image"],
     title="📖 Storytelling Magic",
-    description="A magical storyteller app for kids! Type a sentence, and let the app create an enchanting story for you."
 )
 # Launch the Gradio Interface
 demo.launch()

+# Import libraries
+!pip install gradio transformers
+!pip install -q gradio
+!pip install -q openai
+!pip install -q gTTS
 import gradio as gr
 from transformers import pipeline
 from gtts import gTTS
 from io import BytesIO
+from PIL import Image
+from diffusers import DiffusionPipeline
+# Use a pipeline as a high-level helper for text generation
+vision_alpha_pipe = pipeline("text-generation", model="NousResearch/Nous-Hermes-2-Vision-Alpha")
+# Initialize DiffusionPipeline for image generation (NOTE: the checkpoint below is an image-to-video model, not text-to-image)
+image_generation_pipe = DiffusionPipeline.from_pretrained("stabilityai/stable-video-diffusion-img2vid-xt")
 # Set the context for the storyteller
 messages = [{"role": "system", "content": "You are a magical storyteller, creating wonderful tales for kids. Make them imaginative and full of joy!"}]
+# Initialize page number
+current_page = 0
 # Define the Storyteller function
+def StorytellerNous(character, child_name, lesson_choice, tell_story, _):
+    global current_page
+    # Set the characters and lesson based on user choices
+    character_info = f"Once upon a time, {child_name} met {character}. "
+    lesson_info = f"Today's lesson is about {lesson_choice}. "
     messages.append({"role": "user", "content": tell_story})
+    # Generate story using Nous-Hermes-2-Vision-Alpha
+    input_text = character_info + lesson_info + tell_story
+    story_reply = vision_alpha_pipe(input_text, max_length=150, num_return_sequences=1, no_repeat_ngram_size=2, top_k=50, top_p=0.95)[0]['generated_text']
     messages.append({"role": "assistant", "content": story_reply})
     # Convert text to speech
     tts = gTTS(text=story_reply, lang='en', slow=False)
     audio_io = BytesIO()
     tts.save(audio_io)
     audio_io.seek(0)
+    # Convert text to image using DiffusionPipeline
+    image_reply = image_generation_pipe(story_reply)
+    # Display the story on separate pages
+    story_pages = story_reply.split("\n\n")  # Split the story into pages
+    current_page = min(current_page, len(story_pages) - 1)  # Ensure the current_page is within bounds
+    return story_pages[current_page], Audio(data=audio_io.read(), autoplay=True), image_reply
+# Create the Gradio Interface with styling
 demo = gr.Interface(
+    fn=StorytellerNous,
+    inputs=[
+        gr.Textbox("text", label="Child's Name"),
+        gr.Dropdown(["unicorn", "dragon", "wizard"], label="Choose a Character"),
+        gr.Dropdown(["kindness", "creativity", "bravery"], label="Choose a Lesson"),
+        gr.Textbox("text", label="Start the Story with"),
+        gr.Button("Next Page"),
+    ],
     outputs=["text", "audio", "image"],
     title="📖 Storytelling Magic",
+    description="A magical storyteller app for kids! Choose characters, add your name, and select the lesson you want to learn.",
+    live=True,  # Re-run the function automatically whenever an input changes
+    css=f"""body {{
+        background-image: url('https://www.bing.com/images/create/a-castle-ai-metaverse-style/1-657576205c7146f2b7f2f8d1c552810f?id=dZs6kpD2HfmH4eojx%2bHjdA%3d%3d&view=detailv2&idpp=genimg&FORM=GCRIDP&mode=overlay');
+        background-size: cover;
+        background-position: center;
+        font-family: 'Comic Sans MS', cursive, sans-serif; /* Optional: Change the font */
+    }}""",
 )
 # Launch the Gradio Interface
 demo.launch()