Spaces:

mrbeliever
/

Im-prmpt

Running

App Files Files Community

Im-prmpt / app.py

mrbeliever

Update app.py

a93e14b verified 7 months ago

raw

history blame

3.79 kB

	import streamlit as st
	import requests
	import base64
	import os

	# Function to convert image to base64
	def convert_image_to_base64(image):
	image_bytes = image.read()
	encoded_image = base64.b64encode(image_bytes).decode("utf-8")
	return encoded_image

	# Function to generate a caption using Nebius API
	def generate_caption(encoded_image):
	API_URL = "https://api.studio.nebius.ai/v1/chat/completions"
	API_KEY = os.environ.get("NEBIUS_API_KEY")

	headers = {
	"Authorization": f"Bearer {API_KEY}",
	"Content-Type": "application/json"
	}

	payload = {
	"model": "llava-hf/llava-1.5-7b-hf",
	"messages": [
	{
	"role": "system",
	"content": """You are an image to prompt converter. Your work is to observe each and every detail of the image and craft a detailed prompt under 75 words in this format: [image content/subject, description of action, state, and mood], [art form, style], [artist/photographer reference if needed], [additional settings such as camera and lens settings, lighting, colors, effects, texture, background, rendering]."""
	},
	{
	"role": "user",
	"content": "write a detailed caption for this image"
	}
	],
	"image": {
	"type": "image_url",
	"image_url": {
	"url": f"data:image/png;base64,{encoded_image}"
	}
	},
	"temperature": 0.7
	}

	response = requests.post(API_URL, headers=headers, json=payload)

	if response.status_code == 200:
	result = response.json()
	caption = result.get("choices", [{}])[0].get("message", {}).get("content", "No caption generated.")
	return caption
	else:
	st.error(f"API Error {response.status_code}: {response.text}")
	return None

	# Streamlit app
	def main():
	st.set_page_config(page_title="Image to Caption Converter", layout="centered", initial_sidebar_state="collapsed")

	# Gradient background style
	st.markdown("""
	<style>
	body {
	background: linear-gradient(135deg, #1e3c72, #2a5298);
	color: white;
	font-family: 'Arial', sans-serif;
	}
	.uploaded-image {
	max-width: 100%;
	border: 2px solid #ffffff;
	border-radius: 10px;
	}
	.copy-button {
	background-color: #ff8800;
	color: white;
	border: none;
	border-radius: 5px;
	padding: 10px 15px;
	cursor: pointer;
	}
	.copy-button:hover {
	background-color: #cc6b00;
	}
	</style>
	""", unsafe_allow_html=True)

	st.title("🖼️ Image to Caption Converter")

	uploaded_file = st.file_uploader("Upload an image", type=["jpg", "jpeg", "png"])
	if uploaded_file:
	# Display the uploaded image
	st.image(uploaded_file, caption="Uploaded Image", use_container_width=True)

	# Convert image to base64 and get caption
	if st.button("Generate Caption"):
	with st.spinner("Generating caption..."):
	encoded_image = convert_image_to_base64(uploaded_file)
	caption = generate_caption(encoded_image)

	if caption:
	st.subheader("Generated Caption:")
	st.text_area("", caption, height=100, key="caption_area")

	# Copy button
	if st.button("Copy to Clipboard"):
	st.code(caption, language="text")
	st.success("Caption copied to clipboard!")

	if __name__ == "__main__":
	main()