mayf committed on
Commit
504dc12
·
verified ·
1 Parent(s): 8367fb2

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +8 -4
app.py CHANGED
@@ -1,3 +1,5 @@
 
 
1
  import streamlit as st
2
  from PIL import Image
3
  from transformers import pipeline
@@ -11,9 +13,9 @@ st.title("🖼️ ➡️ 📖 Interactive Storyteller")
11
  # —––––––– Cache model loading
12
  @st.cache_resource
13
  def load_pipelines():
14
- # 1) Image captioning
15
  captioner = pipeline(
16
- "image-captioning",
17
  model="Salesforce/blip-image-captioning-base"
18
  )
19
  # 2) Story generation with Flan-T5
@@ -33,7 +35,9 @@ if uploaded:
33
 
34
  # —––––––– 1. Caption
35
  with st.spinner("🔍 Looking at the image..."):
36
- cap = captioner(image)[0]["generated_text"]
 
 
37
  st.markdown(f"**Caption:** {cap}")
38
 
39
  # —––––––– 2. Story generation
@@ -60,4 +64,4 @@ if uploaded:
60
  tmp = tempfile.NamedTemporaryFile(suffix=".mp3", delete=False)
61
  tts.write_to_fp(tmp)
62
  tmp.flush()
63
- st.audio(tmp.name, format="audio/mp3")
 
1
+ # app.py
2
+
3
  import streamlit as st
4
  from PIL import Image
5
  from transformers import pipeline
 
13
  # —––––––– Cache model loading
14
  @st.cache_resource
15
  def load_pipelines():
16
+ # 1) Image-to-text (captioning)
17
  captioner = pipeline(
18
+ "image-to-text",
19
  model="Salesforce/blip-image-captioning-base"
20
  )
21
  # 2) Story generation with Flan-T5
 
35
 
36
  # —––––––– 1. Caption
37
  with st.spinner("🔍 Looking at the image..."):
38
+ cap_outputs = captioner(image)
39
+ # BLIP returns a list of dicts with key "generated_text"
40
+ cap = cap_outputs[0].get("generated_text", "").strip()
41
  st.markdown(f"**Caption:** {cap}")
42
 
43
  # —––––––– 2. Story generation
 
64
  tmp = tempfile.NamedTemporaryFile(suffix=".mp3", delete=False)
65
  tts.write_to_fp(tmp)
66
  tmp.flush()
67
+ st.audio(tmp.name, format="audio/mp3")