Build error
Update app.py
app.py CHANGED
@@ -18,10 +18,10 @@ blip_processor_large = AutoProcessor.from_pretrained("Salesforce/blip-image-capt
 blip_model_large = BlipForConditionalGeneration.from_pretrained("Salesforce/blip-image-captioning-large").to(device)
 
 blip2_processor = AutoProcessor.from_pretrained("Salesforce/blip2-opt-6.7b")
-blip2_model = Blip2ForConditionalGeneration.from_pretrained("Salesforce/blip2-opt-6.7b", device_map="auto", torch_dtype=torch.float16)
+blip2_model = Blip2ForConditionalGeneration.from_pretrained("Salesforce/blip2-opt-6.7b", device_map="auto", load_in_4bit=True, torch_dtype=torch.float16)
 
 instructblip_processor = AutoProcessor.from_pretrained("Salesforce/instructblip-vicuna-7b")
-instructblip_model = InstructBlipForConditionalGeneration.from_pretrained("Salesforce/instructblip-vicuna-7b"
+instructblip_model = InstructBlipForConditionalGeneration.from_pretrained("Salesforce/instructblip-vicuna-7b", device_map="auto", load_in_4bit=True, torch_dtype=torch.float16)
 
 def generate_caption(processor, model, image, tokenizer=None, use_float_16=False):
     inputs = processor(images=image, return_tensors="pt").to(device)
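
Note: the two added lines above load BLIP-2 and InstructBLIP with 4-bit weights instead of fp16, which is presumably what fixes the build error: two models of roughly 7-8B parameters each need around 30 GB of fp16 weights combined, beyond a typical Space GPU. (As rendered, the removed InstructBLIP line is also missing its closing parenthesis, which by itself would break the build, though that may be display truncation.) A minimal sketch of the same load using the explicit quantization config; passing load_in_4bit=True to from_pretrained is shorthand for this, and it assumes the bitsandbytes package is available in the Space:

import torch
from transformers import Blip2ForConditionalGeneration, BitsAndBytesConfig

# Explicit equivalent of load_in_4bit=True; compute still runs in fp16.
quant_config = BitsAndBytesConfig(load_in_4bit=True, bnb_4bit_compute_dtype=torch.float16)
blip2_model = Blip2ForConditionalGeneration.from_pretrained(
    "Salesforce/blip2-opt-6.7b",
    device_map="auto",                 # let accelerate decide layer placement
    quantization_config=quant_config,
)
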
@@ -42,7 +42,7 @@ def generate_caption(processor, model, image, tokenizer=None, use_float_16=False)
 def generate_caption_blip2(processor, model, image, replace_token=False):
     prompt = "Generate a caption for the image:"
 
-    inputs = processor(images=image, text=prompt, return_tensors="pt").to(device=device, dtype=torch.float16)
+    inputs = processor(images=image, text=prompt, return_tensors="pt").to(device=model.device, dtype=torch.float16)
 
     generated_ids = model.generate(pixel_values=inputs.pixel_values,
                                    num_beams=5, max_length=50, min_length=1, top_p=0.9,
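
Note: the input tensors now follow model.device rather than the module-level device variable. With device_map="auto", accelerate decides where the weights live at load time, so a device string computed earlier in the file is not guaranteed to match; model.device reports the actual placement of the model's parameters. A short illustration, reusing the blip2_model loaded above (the device assignment mirrors what app.py presumably does near the top of the file):

import torch

device = "cuda" if torch.cuda.is_available() else "cpu"  # assumed module-level global

# Query the model instead of trusting the global:
print(blip2_model.device)  # e.g. device(type='cuda', index=0)

# Pattern used in the fix: colocate inputs with the model's parameters.
dummy_pixels = torch.zeros(1, 3, 224, 224).to(blip2_model.device, dtype=torch.float16)
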
@@ -61,7 +61,7 @@ def generate_captions(image):
 
     caption_blip2 = generate_caption_blip2(blip2_processor, blip2_model, image).strip()
 
-    caption_instructblip = generate_caption_blip2(instructblip_processor, instructblip_model, image)
+    caption_instructblip = generate_caption_blip2(instructblip_processor, instructblip_model, image, replace_token=True)
 
     return caption_git_large_coco, caption_blip_large, caption_blip2, caption_instructblip
 
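
Note: the InstructBLIP caption now goes through the same generate_caption_blip2 helper, with replace_token=True. The branch that flag enables is defined earlier in app.py and is not shown in this diff; judging from the signature, it presumably strips a model-specific token that InstructBLIP's Vicuna decoder leaves in the decoded text. A hypothetical sketch of that kind of post-processing (the token shown is an assumption, not taken from the source):

generated_text = processor.batch_decode(generated_ids)[0].strip()
if replace_token:
    # Hypothetical cleanup; the actual token handled in app.py is outside this diff.
    generated_text = generated_text.replace("</s>", "").strip()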