import streamlit as st from PIL import Image from transformers import pipeline from gtts import gTTS import os os.system("pip install transformers==4.36.2") def main(): st.set_page_config(page_title="AI Storyteller", page_icon="📖") # Beautify | UI 美化 page_bg_img = """ """ st.markdown(page_bg_img, unsafe_allow_html=True) # 🎯 Load Hugging Face Models | 加載 Hugging Face 模型 image_to_text_model = pipeline("image-to-text", model="Salesforce/blip-image-captioning-base") story_generator = pipeline("text-generation", model="facebook/opt-350m", device=-1) # Image to Text (Generate Caption) | 圖片 → 文字（生成描述） def img2text(image_path): text = image_to_text_model(image_path)[0]["generated_text"] return text # Text to Story (Generate a Complete Story) | 文字 → 故事（生成完整故事） def text2story(text): prompt = f"Write a fun and magical children's story based on this idea: {text}.\n\nOnce upon a time..." story = story_generator(prompt, max_length=300, do_sample=True, temperature=0.8, top_p=0.9, repetition_penalty=1.2)[0]['generated_text'] return story # Story to Speech (TTS) | 故事 → 語音（TTS） def text2audio_gtts(story_text, filename="story.mp3"): # Avoid filename conflicts | 避免文件冲突 if os.path.exists(filename): os.remove(filename) # Limit text length (to prevent gTTS crashes)| 限制 TTS 文本長度（避免 gTTS 崩潰） max_chars = 500 # gTTS 可能不支持過長文本 story_text = story_text[:max_chars] # Generate Speech | 生成语音 tts = gTTS(text=story_text, lang="en") tts.save(filename) return filename # Streamlit Web UI st.header("📖 AI Storyteller: Turn Your Image into a Story with Audio") uploaded_file = st.file_uploader("Upload image below", type=["jpg", "png"]) if uploaded_file: # Save image locally | 保存圖片到本地 image_path = "uploaded_image.jpg" with open(image_path, "wb") as f: f.write(uploaded_file.getbuffer()) # Load and Display Image | 讀取並顯示圖片 image = Image.open(image_path) st.image(image, caption="Uploaded Image", use_container_width=True) # Generate Image Caption | 生成圖片描述 st.text("🔍 Generating image caption...") caption = img2text(image_path) st.write("**Image Description:**", caption) # Generate Story | 生成故事 st.text("📝 Generating story...") story = text2story(caption) st.write("**Generated Story:**") st.write(story) # Generate Audio | 生成語音 st.text("🔊 Generating audio...") audio_file = text2audio_gtts(story) # Play Audio | 播放音頻 st.audio(audio_file, format="audio/mp3") # Download Audio | 下載按钮 with open(audio_file, "rb") as file: st.download_button("📥 Download Audio", file, file_name="story.mp3") # Add a Python standard entry check so that the program starts with main() | 加入 Python 標準入口檢查，讓程式從 main() 開始執行 if __name__ == "__main__": main()