Spaces:

HoKa
/

Form-OCR-Persian

Runtime error

App Files Files Community

Form-OCR-Persian / app.py

HoKa

initial commit

66e6d34 8 months ago

raw

history blame contribute delete

5.03 kB

	import os
	import google.generativeai as genai
	import gradio as gr
	from PIL import Image
	import json

	# Your API key - for Hugging Face, set this as a secret in the Space settings
	GEMINI_API_KEY = os.getenv("GEMINI_API_KEY") # This will get the API key from environment variables

	# Configure Gemini API
	def configure_genai():
	genai.configure(api_key=GEMINI_API_KEY)
	model = genai.GenerativeModel('gemini-1.5-flash-8b')
	return model

	def process_form(image):
	try:
	model = configure_genai()

	if not isinstance(image, Image.Image):
	image = Image.open(image)

	prompt = """
	لطفاً این تصویر فرم را تحلیل کنید و اطلاعات زیر را در قالب JSON استخراج کنید:
	1. تمام فیلدهای متنی و مقادیر آنها
	2. چک باکس‌ها یا دکمه‌های رادیویی و وضعیت آنها
	3. امضاها یا مهرها در صورت وجود

	لطفاً پاسخ را به صورت یک شیء JSON با نام فیلدها و مقادیر مناسب فرمت کنید.
	"""

	response = model.generate_content([prompt, image])
	response_text = response.text
	json_start = response_text.find('{')
	json_end = response_text.rfind('}') + 1

	if json_start != -1 and json_end != -1:
	json_str = response_text[json_start:json_end]
	parsed_json = json.loads(json_str)
	return json.dumps(parsed_json, indent=2, ensure_ascii=False)
	else:
	return response.text

	except Exception as e:
	return f"خطا در پردازش فرم: {str(e)}"

	def create_interface():
	css = """
	body {
	background-color: #000000;
	}

	.gradio-container {
	color: white !important;
	direction: rtl !important;
	text-align: right !important;
	}

	.title-text {
	color: white !important;
	text-align: right !important;
	}

	.subtitle-text {
	color: white !important;
	text-align: right !important;
	}

	.description-text {
	color: white !important;
	text-align: right !important;
	}

	.label-wrap span {
	color: white !important;
	text-align: right !important;
	}

	.md h1, .md h2, .md h3, .md p, .md ol, .md li {
	color: white !important;
	text-align: right !important;
	direction: rtl !important;
	}

	button {
	direction: rtl !important;
	background-color: #ff4b1f !important;
	color: white !important;
	}

	.output-markdown {
	direction: rtl !important;
	text-align: right !important;
	}

	textarea {
	direction: rtl !important;
	text-align: right !important;
	background-color: #2d2d2d !important;
	color: white !important;
	}
	"""

	with gr.Blocks(title="سیستم استخراج متن از فرم - نسخه نمایشی هایمارت", css=css, theme="darker") as interface:
	gr.Markdown('<h1 class="title-text">سیستم هوشمند استخراج متن از فرم</h1>')
	gr.Markdown('<h3 class="subtitle-text">نسخه نمایشی برای هایمارت</h3>')
	gr.Markdown('<p class="description-text">لطفاً تصویر فرم خود را بارگذاری کنید تا اطلاعات آن به صورت خودکار استخراج شود</p>')

	with gr.Row():
	with gr.Column():
	image_input = gr.Image(
	label="تصویر فرم را اینجا بارگذاری کنید",
	type="pil"
	)
	submit_btn = gr.Button("پردازش فرم")

	with gr.Column():
	output_text = gr.Textbox(
	label="اطلاعات استخراج شده",
	lines=10,
	rtl=True
	)

	submit_btn.click(
	fn=process_form,
	inputs=[image_input],
	outputs=output_text
	)

	gr.Markdown("""
	<div class="guide-section">
	<h3>راهنما:</h3>
	<ol>
	<li>یک تصویر از فرم خود را بارگذاری کنید</li>
	<li>روی دکمه 'پردازش فرم' کلیک کنید</li>
	<li>نتیجه به صورت خودکار نمایش داده خواهد شد</li>
	</ol>

	<p><strong>نکته:</strong> برای نتیجه بهتر، لطفاً از تصاویر واضح و با نور کافی استفاده کنید.</p>

	<p><em>این نسخه نمایشی صرفاً جهت ارزیابی قابلیت‌های سیستم می‌باشد.</em></p>
	</div>
	""")

	return interface

	interface = create_interface()
	interface.launch()