mudra1710
/

clip-embeddings

Zero-Shot Image Classification

Model card Files Files and versions

clip-embeddings / handler.py

mudra1710's picture

Update handler.py

588c310 about 2 years ago

history blame contribute delete

1.05 kB

	from typing import Dict, List, Any
	import numpy as np
	from transformers import CLIPProcessor, CLIPModel
	from PIL import Image
	from io import BytesIO
	import base64

	class EndpointHandler():
	def __init__(self, path=""):
	# Preload all the elements you we need at inference.
	self.model = CLIPModel.from_pretrained("openai/clip-vit-base-patch32")
	self.processor = CLIPProcessor.from_pretrained("openai/clip-vit-base-patch32")


	def __call__(self, data: Dict[str, Any]) -> List[Dict[str, Any]]:
	url = data.get("inputs")
	text = data.get("text")
	image = Image.open(requests.get(url, stream=True).raw)
	inputs = self.processor(text=text, images=image, return_tensors="pt", padding=True)
	outputs = self.model(**inputs)
	logits_per_image = outputs.logits_per_image # this is the image-text similarity score
	probs = logits_per_image.softmax(dim=1)
	embeddings = outputs.image_embeds.detach().numpy().flatten().tolist()
	return { "embeddings": embeddings }