keplersj committed
Commit 4dba69f · Parent: 7d3d31c

use transformer pipeline

Files changed (1)
app.py +12 -8
app.py CHANGED
@@ -1,10 +1,8 @@
 import streamlit as st
 from PIL import Image
-from transformers import BlipProcessor, BlipForConditionalGeneration
+from transformers import pipeline as transformer
 from diffusers import StableDiffusionPipeline
 
-processor = BlipProcessor.from_pretrained("Salesforce/blip-image-captioning-large")
-model = BlipForConditionalGeneration.from_pretrained("Salesforce/blip-image-captioning-large")
 pipe = StableDiffusionPipeline.from_pretrained("CompVis/stable-diffusion-v1-4")
 
 captions = []
@@ -12,6 +10,13 @@ captions = []
 with st.sidebar:
     files = st.file_uploader("Upload images to blend", accept_multiple_files=True)
     st.divider()
+    caption_model = st.selectbox("Caption Model", [
+        "ydshieh/vit-gpt2-coco-en",
+        "Salesforce/blip-image-captioning-large",
+        "nlpconnect/vit-gpt2-image-captioning",
+        "microsoft/git-base"
+    ])
+    st.divider()
     image_gen_guidance = st.slider("Stable Diffusion: Guidance Scale", value=7.5)
     image_gen_steps = st.slider("Stable Diffusion: Inference Steps", value=50)
 
@@ -22,12 +27,11 @@ with col1:
         image = Image.open(file_name)
 
         with st.spinner('Captioning Provided Image'):
-            inputs = processor(image, return_tensors="pt")
-            out = model.generate(**inputs)
-            description = processor.decode(out[0], skip_special_tokens=True)
-            captions.append(description)
+            captioner = transformer(model=caption_model)
+            caption = captioner(image)[0]["generated_text"]
 
-        st.image(image, caption=description)
+            captions.append(caption)
+            st.image(image, caption=caption)
 
 with col2:
     if len(captions) > 0:
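For reference, transformers' pipeline() infers the image-to-text task from the selected model's card and returns a list of dicts keyed by generated_text, which is why the new code indexes [0]["generated_text"]. A minimal standalone sketch of the new captioning path, assuming one of the models from the selectbox above and a hypothetical local image file:

    from PIL import Image
    from transformers import pipeline

    # Build an image-to-text pipeline; the task is inferred from the model card.
    captioner = pipeline(model="ydshieh/vit-gpt2-coco-en")

    image = Image.open("example.jpg")  # hypothetical input file
    result = captioner(image)          # -> [{"generated_text": "..."}]
    print(result[0]["generated_text"])

Note that the diff constructs the captioner inside the spinner, so every Streamlit rerun reloads the selected model; wrapping the constructor in a cached helper (for example with st.cache_resource) is one way to avoid the repeated load.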