chats-bug committed · Commit 0d54c12 · 1 Parent(s): 046f505

Fixed git large coco model
app.py CHANGED

@@ -1,3 +1,4 @@
+import traceback
 import gradio as gr
 from transformers import AutoProcessor, AutoTokenizer, AutoImageProcessor, AutoModelForCausalLM, BlipForConditionalGeneration, VisionEncoderDecoderModel, BitsAndBytesConfig
 import torch
@@ -38,7 +39,6 @@ def generate_caption(
     model,
     image,
     tokenizer=None,
-    use_float_16=False,
 ):
     """
     Generate captions for the given image.
@@ -61,15 +61,10 @@ def generate_caption(
     str
         The generated caption.
     """
-
-    pixel_values = preprocessor(images=image, return_tensors="pt").pixel_values
-
-    if use_float_16:
-        inputs = inputs.to(torch.float16)
+    pixel_values = preprocessor(images=image, return_tensors="pt").pixel_values.to(device)
 
     generated_ids = model.generate(
         pixel_values=pixel_values,
-        attention_mask=inputs.attention_mask,
         max_length=50,
     )
 
@@ -117,7 +112,6 @@ def generate_captions(
     image,
     max_length,
     temperature,
-    use_sample_image,
 ):
     """
     Generate captions for the given image.
@@ -137,10 +131,6 @@ def generate_captions(
     caption_git_large_coco = ""
     caption_oc_coca = ""
 
-    if use_sample_image:
-        url = "http://images.cocodataset.org/val2017/000000039769.jpg"
-        image = Image.open(requests.get(url, stream=True).raw)
-
     # Generate captions for the image using the Blip base model
     try:
         caption_blip_base = generate_caption(preprocessor_blip_base, model_blip_base, image).strip()
@@ -176,7 +166,6 @@ iface = gr.Interface(
         gr.inputs.Image(type="pil", label="Image"),
         gr.inputs.Slider(minimum=16, maximum=64, step=2, default=32, label="Max Length"),
         gr.inputs.Slider(minimum=0.5, maximum=1.5, step=0.1, default=1.0, label="Temperature"),
-        gr.inputs.Checkbox(default=False, label="Use example image")
     ],
     # Define the outputs
     outputs=[