VinitT committed on
Commit 2867c32 · verified · 1 Parent(s): 5b0226f

Update app.py

Files changed (1)
  1. app.py +25 -15
app.py CHANGED

@@ -34,7 +34,7 @@ if uploaded_files:
             # Open the image
             image = Image.open(uploaded_file)
             # Resize image to reduce memory usage
-            image = image.resize((512, 512))
+            image = image.resize((256, 256))  # Reduce size to save memory
             st.image(image, caption='Uploaded Image.', use_column_width=True)
             st.write("Generating description...")

@@ -55,7 +55,7 @@ if uploaded_files:
             # Convert the frame to an image
             image = Image.fromarray(cv2.cvtColor(frame, cv2.COLOR_BGR2RGB))
             # Resize image to reduce memory usage
-            image = image.resize((512, 512))
+            image = image.resize((256, 256))  # Reduce size to save memory
             st.image(image, caption='First Frame of Uploaded Video.', use_column_width=True)
             st.write("Generating description...")

@@ -66,6 +66,11 @@ if uploaded_files:
             st.error("Unsupported file type.")
             continue

+        # Ensure the image is loaded correctly
+        if image is None:
+            st.error("Failed to load the image.")
+            continue
+
         messages = [
             {
                 "role": "user",

@@ -94,19 +99,24 @@ if uploaded_files:
         inputs = inputs.to(device)  # Ensure inputs are on the same device as the model

         # Inference: Generation of the output
-        generated_ids = model.generate(**inputs, max_new_tokens=512)
-        generated_ids_trimmed = [
-            out_ids[len(in_ids) :] for in_ids, out_ids in zip(inputs.input_ids, generated_ids)
-        ]
-        output_text = processor.batch_decode(
-            generated_ids_trimmed, skip_special_tokens=True, clean_up_tokenization_spaces=False
-        )
-
-        st.write("Description:")
-        st.write(output_text[0])
-
-        # Append the output text to the list
-        all_output_texts.append(output_text[0])
+        try:
+            generated_ids = model.generate(**inputs, max_new_tokens=512)
+            generated_ids_trimmed = [
+                out_ids[len(in_ids) :] for in_ids, out_ids in zip(inputs.input_ids, generated_ids)
+            ]
+            output_text = processor.batch_decode(
+                generated_ids_trimmed, skip_special_tokens=True, clean_up_tokenization_spaces=False
+            )
+
+            st.write("Description:")
+            st.write(output_text[0])
+
+            # Append the output text to the list
+            all_output_texts.append(output_text[0])
+
+        except Exception as e:
+            st.error(f"Error during generation: {e}")
+            continue

         # Clear memory after processing each file
         del image, inputs, generated_ids, generated_ids_trimmed, output_text
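The resize change in the first two hunks trades image detail for memory. As a side note, PIL's resize((256, 256)) forces a square and ignores the aspect ratio; a minimal sketch of the same shrink-to-save-memory step using Image.thumbnail instead is shown below (the helper name load_and_shrink is illustrative and not part of app.py):

from PIL import Image

def load_and_shrink(uploaded_file, max_side=256):
    """Open an image and shrink it before inference to keep memory low.

    Unlike image.resize((256, 256)), Image.thumbnail caps both dimensions
    while preserving the aspect ratio, so the picture is not distorted.
    """
    image = Image.open(uploaded_file)
    image = image.convert("RGB")            # normalize mode (drops alpha/palette)
    image.thumbnail((max_side, max_side))   # in-place, aspect-ratio preserving
    return image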
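The last hunk wraps generation in a try/except so a failure (for example, running out of GPU memory) is reported in the Streamlit UI instead of crashing the app. Pulled out as a standalone helper, the same logic looks roughly like this; the function name describe and the None return on failure are illustrative, and model, processor, and inputs are assumed to be the Hugging Face model, processor, and prepared batch from the rest of app.py, which this diff does not show:

import streamlit as st

def describe(model, processor, inputs, max_new_tokens=512):
    """Generate a description, trimming the prompt tokens from the output."""
    try:
        generated_ids = model.generate(**inputs, max_new_tokens=max_new_tokens)
        # Drop the prompt portion of each generated sequence before decoding.
        trimmed = [
            out_ids[len(in_ids):]
            for in_ids, out_ids in zip(inputs.input_ids, generated_ids)
        ]
        texts = processor.batch_decode(
            trimmed, skip_special_tokens=True, clean_up_tokenization_spaces=False
        )
        return texts[0]
    except Exception as e:  # e.g. a CUDA out-of-memory error on large inputs
        st.error(f"Error during generation: {e}")
        return None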