Spaces:

Jangai
/

Sketch

Sleeping

App Files Files Community

Sketch / app.py

Jangai

Update app.py

c1c81f5 verified about 1 year ago

raw

history blame

2.15 kB

	import gradio as gr
	import torch
	from transformers import DetrImageProcessor, DetrForObjectDetection
	from PIL import Image
	import numpy as np
	import logging

	# Configure logging (DEBUG so the per-step messages emitted by predict are visible)
	logging.basicConfig(level=logging.DEBUG)

	# Load the pre-trained model and image processor.
	# NOTE: the checkpoint has to be a DETR checkpoint to match the DETR classes
	# used below; a Grounding DINO checkpoint is a different architecture and
	# cannot be loaded correctly by DetrImageProcessor / DetrForObjectDetection.
	model_name = "facebook/detr-resnet-50"
	# The "no_timm" revision ships a backbone that does not need the optional
	# `timm` package, so no extra dependency is required.
	model_revision = "no_timm"
	logging.info("Loading image processor and model...")
	feature_extractor = DetrImageProcessor.from_pretrained(model_name, revision=model_revision)
	model = DetrForObjectDetection.from_pretrained(model_name, revision=model_revision)

	# Define the prediction function and its private helpers
	def _to_rgb_image(image):
	    """Turn the sketchpad payload into an RGB PIL image.

	    Args:
	        image: Either an array-like image or a dict whose 'composite'
	            entry holds the final image.

	    Returns:
	        A PIL image in RGB mode.

	    Raises:
	        ValueError: If no image data is present (e.g. an empty canvas).
	    """
	    # When the input is a dict, the 'composite' entry holds the final image.
	    if isinstance(image, dict):
	        image = image.get('composite')
	    if image is None:
	        raise ValueError("No drawing received; draw something before submitting.")

	    logging.debug("Converting to NumPy array...")
	    pixels = np.asarray(image).astype('uint8')
	    logging.debug("Converting NumPy array to PIL image...")
	    # Let Pillow infer the mode from the array shape instead of forcing
	    # 'RGBA', so grayscale and RGB inputs are converted correctly too.
	    rgb_image = Image.fromarray(pixels).convert('RGB')
	    logging.debug("Image converted successfully.")
	    return rgb_image


	def _top_labels(logits, id2label, k=3):
	    """Map model logits to a {label: probability} dict of the k best classes.

	    Args:
	        logits: Tensor of shape (batch, classes) or, for DETR-style
	            detection heads, (batch, queries, classes + 1). Only the first
	            batch item is used.
	        id2label: Mapping from class index to label name.
	        k: Maximum number of classes to report.

	    Returns:
	        Dict mapping label name to probability, best first.
	    """
	    probs = torch.nn.functional.softmax(logits, dim=-1)[0]
	    if probs.dim() == 2:
	        # Detection heads emit one distribution per query, with the last
	        # class meaning "no object". Drop that class and keep, for every
	        # real class, its best score across all queries.
	        probs = probs[:, :-1].max(dim=0).values
	    k = min(k, probs.shape[-1])
	    top_probs, top_idxs = probs.topk(k)
	    return {
	        id2label.get(idx, str(idx)): float(prob)
	        for prob, idx in zip(top_probs.tolist(), top_idxs.tolist())
	    }


	def predict(image):
	    """Classify a sketchpad drawing and return the top labels.

	    Args:
	        image: The sketchpad payload (array-like image or a dict with a
	            'composite' entry).

	    Returns:
	        A dict mapping up to three label names to probabilities, or
	        {"error": message} if anything goes wrong.
	    """
	    # Catch-all on purpose: this is the UI boundary, and the caller expects
	    # a JSON-serialisable error payload rather than an exception.
	    try:
	        logging.info("Received image of type: %s", type(image))
	        logging.debug("Image content: %s", image)
	        rgb_image = _to_rgb_image(image)

	        logging.info("Processing image...")
	        inputs = feature_extractor(images=rgb_image, return_tensors="pt")
	        # Inference only: skip autograd bookkeeping.
	        with torch.no_grad():
	            outputs = model(**inputs)
	        result = _top_labels(outputs.logits, model.config.id2label)
	        logging.info("Prediction successful.")
	        return result
	    except Exception as e:
	        # logging.exception keeps the traceback, which logging.error dropped.
	        logging.exception("Error during prediction: %s", e)
	        return {"error": str(e)}

	# Assemble the Gradio UI: a sketchpad input wired to predict, JSON output
	_interface_options = dict(
	    fn=predict,
	    inputs=gr.Sketchpad(),
	    outputs=gr.JSON(),
	    title="Drawing Classifier",
	    description="Draw something and the model will try to identify it!",
	)
	iface = gr.Interface(**_interface_options)

	# Start serving the app
	iface.launch()