Spaces:

Exched
/

Image_detec

Runtime error

App Files Files Community

Image_detec / app.py

Exched

Update app.py

5c78d10 verified 4 months ago

raw

history blame contribute delete

2.51 kB

	import gradio as gr
	import torch
	from transformers import AutoModelForCausalLM, AutoTokenizer, CLIPProcessor, CLIPModel
	from PIL import Image
	import requests
	from io import BytesIO

	# Load CLIP model for image classification
	clip_model = CLIPModel.from_pretrained("openai/clip-vit-base-patch32")
	clip_processor = CLIPProcessor.from_pretrained("openai/clip-vit-base-patch32")

	# Load Mistral-7B-Instruct-v0.3 model for chat
	mistral_model = AutoModelForCausalLM.from_pretrained("mistralai/Mistral-7B-Instruct-v0.3")
	mistral_tokenizer = AutoTokenizer.from_pretrained("mistralai/Mistral-7B-Instruct-v0.3")

	# Function for image classification with CLIP (anime recognition)
	def classify_image(input_image):
	if isinstance(input_image, str):
	response = requests.get(input_image)
	img = Image.open(BytesIO(response.content))
	else:
	img = Image.fromarray(input_image)

	# Prepare the image and text (anime-related labels)
	inputs = clip_processor(text=["anime", "cartoon", "realistic", "painting"], images=img, return_tensors="pt", padding=True)
	outputs = clip_model(**inputs)
	logits_per_image = outputs.logits_per_image # this is the image-text similarity score
	probs = logits_per_image.softmax(dim=1) # we can apply softmax to get the label probabilities

	# Return the predicted class label
	labels = ["anime", "cartoon", "realistic", "painting"]
	predicted_label = labels[probs.argmax()]
	return predicted_label

	# Function for chat with Mistral 7B Instruct
	def chat_with_mistral(input_text):
	inputs = mistral_tokenizer(input_text, return_tensors="pt")
	outputs = mistral_model.generate(inputs["input_ids"], max_length=150)
	response = mistral_tokenizer.decode(outputs[0], skip_special_tokens=True)
	return response

	# Create Gradio interface for both Image Classification and Chat
	with gr.Blocks() as demo:
	with gr.Tab("Chat with Mistral"):
	chat_input = gr.Textbox(label="Ask Mistral 7B", placeholder="Type your question here...")
	chat_output = gr.Textbox(label="Mistral's Reply", interactive=False)
	chat_input.submit(chat_with_mistral, inputs=chat_input, outputs=chat_output)

	with gr.Tab("Classify Anime Image"):
	img_input = gr.Image(type="numpy", label="Upload Image for Anime Classification")
	img_output = gr.Textbox(label="Predicted Label", interactive=False)
	img_input.change(classify_image, inputs=img_input, outputs=img_output)

	# Launch the interface
	demo.launch()