Spaces:

Nathanwit
/

Image-Captioning-DL

Runtime error

Nathanwit committed on Dec 11, 2023

Commit

7d12a4b

1 Parent(s): 417b640

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -23,17 +23,15 @@ feature_extractor= ViTImageProcessor.from_pretrained(model_path)
 # Load model
 model = VisionEncoderDecoderModel.from_pretrained(model_path)
-pixel_values = feature_extractor(images=image, return_tensors="pt").pixel_values
-# use GPT2's eos_token as the pad as well as eos token
 def predict(image,max_length=24, num_beams=4):
     image = image.convert('RGB')
-    sequences = model.generate(pixel_values, num_beams=4, max_length=25)
     sequences = model.generate(pixel_values, num_beams=4, max_length=25)
     captions = tokenizer.batch_decode(sequences, skip_special_tokens=True)
-  return captions
 # Gradio Interface

 # Load model
 model = VisionEncoderDecoderModel.from_pretrained(model_path)
 def predict(image,max_length=24, num_beams=4):
     image = image.convert('RGB')
+    pixel_values = feature_extractor(images=image, return_tensors="pt").pixel_values
     sequences = model.generate(pixel_values, num_beams=4, max_length=25)
     captions = tokenizer.batch_decode(sequences, skip_special_tokens=True)
+    return captions
 # Gradio Interface