Spaces:

mayf
/

1

Sleeping

App Files Files Community

1 / app.py

mayf

Update app.py

8e5f097 verified 2 months ago

raw

history blame

3.46 kB

	# app.py
	import streamlit as st
	from PIL import Image
	from io import BytesIO
	from huggingface_hub import InferenceApi
	from gtts import gTTS
	import tempfile

	# —––––––– Page Config
	# Configure the page (title + centered layout) before anything is rendered,
	# then show the on-page heading.
	st.set_page_config(layout="centered", page_title="Magic Story Generator")
	st.title("📖✨ Turn Images into Children's Stories")

	# —––––––– Clients (cached)
	@st.cache_resource
	def load_clients():
	    """Build the two Hugging Face inference clients used by the app.

	    The API token is read from ``st.secrets["HF_TOKEN"]``. The function is
	    wrapped in ``st.cache_resource`` so the clients are created once and
	    reused instead of being rebuilt on every script rerun.

	    Returns:
	        A ``(caption_client, story_client)`` tuple: the first targets the
	        BLIP image-captioning model, the second the DeepSeek-R1 distilled
	        Qwen 1.5B model.
	    """
	    token = st.secrets["HF_TOKEN"]
	    captioner = InferenceApi("Salesforce/blip-image-captioning-base", token=token)
	    storyteller = InferenceApi("deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B", token=token)
	    return captioner, storyteller


	# Module-level handles used by the main flow below.
	caption_client, story_client = load_clients()

	# —––––––– Main Flow
	# Generation settings for the story model. They must be sent through the
	# request's `params` argument: InferenceApi.__call__ only accepts `inputs`,
	# `params`, `data` and `raw_response`, so passing them as bare keyword
	# arguments raises TypeError and the story step can never succeed.
	STORY_GENERATION_PARAMS = {
	    "max_new_tokens": 200,
	    "temperature": 0.8,
	    "top_p": 0.95,
	    "repetition_penalty": 1.15,
	    "do_sample": True,
	    "no_repeat_ngram_size": 2,
	}

	# Marker that ends the prompt; everything after its last occurrence in the
	# model output is treated as the story.
	STORY_MARKER = "Story:"


	def extract_generated_text(response):
	    """Return the stripped ``generated_text`` of the first result in *response*.

	    Args:
	        response: Decoded JSON returned by an inference client call.

	    Returns:
	        The generated text with surrounding whitespace removed (may be empty).

	    Raises:
	        ValueError: If *response* is an error payload (a dict with an
	            ``"error"`` key) or does not look like
	            ``[{"generated_text": ...}, ...]``.
	    """
	    # Failures come back as a JSON object instead of an exception, so surface
	    # the service's own message rather than an opaque KeyError/IndexError.
	    if isinstance(response, dict) and "error" in response:
	        raise ValueError(str(response["error"]))
	    if not isinstance(response, list) or not response:
	        raise ValueError(f"unexpected response: {response!r}")
	    first = response[0]
	    if not isinstance(first, dict) or "generated_text" not in first:
	        raise ValueError(f"unexpected response item: {first!r}")
	    return str(first["generated_text"]).strip()


	def build_story_prompt(caption):
	    """Return the story-writing prompt for an image described by *caption*."""
	    return (
	        f"Image description: {caption}\n\n"
	        "Write a 50-100 word children's story that:\n"
	        "1. Features the main subject as a friendly character\n"
	        "2. Includes a simple adventure or discovery\n"
	        "3. Ends with a happy or funny conclusion\n"
	        "4. Uses simple language for ages 3-8\n\n"
	        "Story:\n"
	    )


	def trim_to_last_sentence(text):
	    """Drop any unfinished trailing sentence from *text*.

	    The text is cut just after its last ``.``, ``!`` or ``?`` (keeping any
	    closing quote or bracket that directly follows). Text containing none of
	    these terminators is returned unchanged.
	    """
	    cut = max(text.rfind(mark) for mark in ".!?")
	    if cut == -1:
	        return text
	    end = cut + 1
	    # Keep a closing quote/bracket that belongs to the final sentence.
	    while end < len(text) and text[end] in "\"'”’)":
	        end += 1
	    return text[:end]


	def extract_story(full_text):
	    """Return the story portion of the model output, ending on a full sentence.

	    Everything up to and including the last ``Story:`` marker (the echoed
	    prompt) is discarded before trimming.
	    """
	    story = full_text.split(STORY_MARKER)[-1].strip()
	    return trim_to_last_sentence(story)


	def synthesize_speech(story):
	    """Return MP3 bytes of *story* read aloud in English.

	    The audio is written to an in-memory buffer, so no temporary file is
	    left behind on disk after each run.
	    """
	    buffer = BytesIO()
	    gTTS(text=story, lang="en", slow=False).write_to_fp(buffer)
	    return buffer.getvalue()


	def render_story_for(uploaded):
	    """Caption the uploaded image, write a story about it, and render both.

	    Each failing step reports an error in the UI and halts the script via
	    ``st.stop()``; only the audio step is best-effort and merely warns.
	    """
	    # Process Image
	    img = Image.open(uploaded).convert("RGB")
	    # NOTE(review): `use_column_width` is reported as deprecated by recent
	    # Streamlit releases; switch once the deployed version is confirmed.
	    st.image(img, use_column_width=True)

	    # Generate Caption
	    with st.spinner("🔍 Discovering image secrets..."):
	        try:
	            img_bytes = BytesIO()
	            img.save(img_bytes, format="JPEG")
	            caption = extract_generated_text(caption_client(data=img_bytes.getvalue()))
	        except Exception as e:  # UI boundary: report and halt instead of a traceback
	            st.error(f"🚨 Oops! Problem making caption: {e}")
	            st.stop()

	    if not caption:
	        st.error("😢 Couldn't understand this image. Try another one!")
	        st.stop()

	    st.success(f"Caption Magic: {caption}")

	    # Generate Story
	    with st.spinner("📝 Writing magical story..."):
	        try:
	            story_response = story_client(
	                build_story_prompt(caption),
	                params=dict(STORY_GENERATION_PARAMS),
	            )
	            story = extract_story(extract_generated_text(story_response))
	        except Exception as e:  # UI boundary: report and halt instead of a traceback
	            st.error(f"🚨 Story magic failed: {e}")
	            st.stop()

	    if not story:
	        # Nothing to show or read aloud; gTTS would also reject empty text.
	        st.error("😢 The story came back empty. Please try again!")
	        st.stop()

	    # Display Story
	    st.subheader("📚 Your Magical Story")
	    st.write(story)

	    # Audio Conversion (best-effort: the written story is already on screen)
	    with st.spinner("🔊 Adding story voice..."):
	        try:
	            st.audio(synthesize_speech(story), format="audio/mp3")
	        except Exception as e:
	            st.warning("⚠️ Couldn't make audio version: " + str(e))


	def main():
	    """Render the uploader, run the story pipeline if an image is given, then the footer."""
	    uploaded = st.file_uploader("Upload a child-friendly image:", type=["jpg", "png", "jpeg"])
	    if uploaded:
	        render_story_for(uploaded)
	    else:
	        st.info("🌈 Please upload an image to start the magic!")

	    st.markdown("---\nMade with ❤️ by your friendly story wizard")


	# Streamlit executes the script as `__main__`, so the app still runs on every
	# rerun while the helpers above stay importable without side effects.
	if __name__ == "__main__":
	    main()