Spaces:

awacke1
/

TorchTransformers-CV-SFT

Running

App Files Community

awacke1 committed on Mar 28

Commit

6e0bba0

verified ·

1 Parent(s): de093f2

Update app.py

Browse files

Files changed (1) hide show

app.py +8 -8

app.py CHANGED Viewed

@@ -419,7 +419,7 @@ def process_video_and_audio(video_input):
         # Display frames and transcript
         st.markdown("### Video Frames")
         for frame_b64 in base64Frames:
-            st.image(f"data:image/jpg;base64,{frame_b64}", use_column_width=True)
         st.markdown("### Audio Transcription")
         st.write(transcription.text)
         return transcription.text
@@ -472,9 +472,9 @@ def integrated_workflow():
             mode = st.selectbox("Snapshot Mode", ["single", "twopage", "allpages"])
             snapshots = asyncio.run(process_pdf_snapshot(file_path, mode))
             for snapshot in snapshots:
-                st.image(Image.open(snapshot), caption=f"Snapshot: {snapshot}", use_column_width=True)
         else:
-            st.image(Image.open(file_path), caption="Uploaded Image", use_column_width=True)
         # Run OCR on the file (using first page or the image itself)
         if st.button("Run OCR on File"):
             if uploaded_file.type == "application/pdf":
@@ -520,7 +520,7 @@ def update_gallery():
         for idx, file in enumerate(all_files[:st.session_state.get('gallery_size', 5)]):
             with cols[idx % 2]:
                 if file.endswith('.png'):
-                    st.image(Image.open(file), caption=os.path.basename(file), use_column_width=True)
                 else:
                     st.markdown(os.path.basename(file))
                 if st.button("Delete "+os.path.basename(file), key="del_"+file):
@@ -563,7 +563,7 @@ with tabs[1]:
             filename = generate_filename("cam0_snapshot", "png")
             with open(filename, "wb") as f:
                 f.write(cam0_img.getvalue())
-            st.image(Image.open(filename), caption="Camera 0 Snapshot", use_column_width=True)
             st.session_state.history.append(f"Captured {filename}")
     with col2:
         cam1_img = st.camera_input("Take a picture - Cam 1", key="cam1")
@@ -571,7 +571,7 @@ with tabs[1]:
             filename = generate_filename("cam1_snapshot", "png")
             with open(filename, "wb") as f:
                 f.write(cam1_img.getvalue())
-            st.image(Image.open(filename), caption="Camera 1 Snapshot", use_column_width=True)
             st.session_state.history.append(f"Captured {filename}")
     st.markdown("---")
     st.subheader("Generate New Image with Diffusion")
@@ -579,7 +579,7 @@ with tabs[1]:
     if st.button("Generate Image"):
         output_file = generate_filename("gen_output", "png")
         result_img = asyncio.run(process_image_gen(prompt_img, output_file))
-        st.image(result_img, caption="Generated Image", use_column_width=True)
 # --- PDF & Documents Tab ---
 with tabs[2]:
@@ -633,7 +633,7 @@ with tabs[3]:
         image_file = st.file_uploader("Upload an image", type=["png", "jpg", "jpeg"], key="chat_image")
         if image_file:
             image = Image.open(image_file)
-            st.image(image, caption="Uploaded Image", use_column_width=True)
             response = process_image_with_prompt(image, text_prompt)
             st.markdown(response)
     elif mode == "Audio":

         # Display frames and transcript
         st.markdown("### Video Frames")
         for frame_b64 in base64Frames:
+            st.image(f"data:image/jpg;base64,{frame_b64}", use_container_width=True)
         st.markdown("### Audio Transcription")
         st.write(transcription.text)
         return transcription.text
             mode = st.selectbox("Snapshot Mode", ["single", "twopage", "allpages"])
             snapshots = asyncio.run(process_pdf_snapshot(file_path, mode))
             for snapshot in snapshots:
+                st.image(Image.open(snapshot), caption=f"Snapshot: {snapshot}", use_container_width=True)
         else:
+            st.image(Image.open(file_path), caption="Uploaded Image", use_container_width=True)
         # Run OCR on the file (using first page or the image itself)
         if st.button("Run OCR on File"):
             if uploaded_file.type == "application/pdf":
         for idx, file in enumerate(all_files[:st.session_state.get('gallery_size', 5)]):
             with cols[idx % 2]:
                 if file.endswith('.png'):
+                    st.image(Image.open(file), caption=os.path.basename(file), use_container_width=True)
                 else:
                     st.markdown(os.path.basename(file))
                 if st.button("Delete "+os.path.basename(file), key="del_"+file):
             filename = generate_filename("cam0_snapshot", "png")
             with open(filename, "wb") as f:
                 f.write(cam0_img.getvalue())
+            st.image(Image.open(filename), caption="Camera 0 Snapshot", use_container_width=True)
             st.session_state.history.append(f"Captured {filename}")
     with col2:
         cam1_img = st.camera_input("Take a picture - Cam 1", key="cam1")
             filename = generate_filename("cam1_snapshot", "png")
             with open(filename, "wb") as f:
                 f.write(cam1_img.getvalue())
+            st.image(Image.open(filename), caption="Camera 1 Snapshot", use_container_width=True)
             st.session_state.history.append(f"Captured {filename}")
     st.markdown("---")
     st.subheader("Generate New Image with Diffusion")
     if st.button("Generate Image"):
         output_file = generate_filename("gen_output", "png")
         result_img = asyncio.run(process_image_gen(prompt_img, output_file))
+        st.image(result_img, caption="Generated Image", use_container_width=True)
 # --- PDF & Documents Tab ---
 with tabs[2]:
         image_file = st.file_uploader("Upload an image", type=["png", "jpg", "jpeg"], key="chat_image")
         if image_file:
             image = Image.open(image_file)
+            st.image(image, caption="Uploaded Image", use_container_width=True)
             response = process_image_with_prompt(image, text_prompt)
             st.markdown(response)
     elif mode == "Audio":