Spaces:

Jangai
/

Sketch

Sleeping

Jangai committed on Jun 8, 2024

Commit

301a707

verified ·

1 Parent(s): b0ac62c

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,29 +1,34 @@
 import gradio as gr
-from PIL import Image
 from transformers import TrOCRProcessor, VisionEncoderDecoderModel
-# Load the processor and model
-processor = TrOCRProcessor.from_pretrained("microsoft/trocr-large-handwritten")
-model = VisionEncoderDecoderModel.from_pretrained("microsoft/trocr-large-handwritten")
-# Define the function to recognize handwriting
 def recognize_handwriting(image):
-    pixel_values = processor(images=image, return_tensors="pt").pixel_values
     generated_ids = model.generate(pixel_values)
     generated_text = processor.batch_decode(generated_ids, skip_special_tokens=True)[0]
     return generated_text
 # Create the Gradio interface
-with gr.Blocks() as demo:
-    gr.Markdown("# Handwriting Recognition")
-    with gr.Row():
-        with gr.Column():
-            image_input = gr.Image(tool="editor", type="numpy", label="Draw or Upload an Image")
-            recognize_button = gr.Button("Recognize Handwriting")
-        with gr.Column():
-            output_text = gr.Textbox(label="Recognized Text")
-    recognize_button.click(fn=recognize_handwriting, inputs=image_input, outputs=output_text)
-# Launch the Gradio app
-demo.launch()

 import gradio as gr
 from transformers import TrOCRProcessor, VisionEncoderDecoderModel
+from PIL import Image
+import numpy as np
+# Load the model and processor
+processor = TrOCRProcessor.from_pretrained('microsoft/trocr-large-handwritten')
+model = VisionEncoderDecoderModel.from_pretrained('microsoft/trocr-large-handwritten')
+# Define the prediction function
 def recognize_handwriting(image):
+    if isinstance(image, dict):
+        image = Image.fromarray(image['image'])
+    elif isinstance(image, np.ndarray):
+        image = Image.fromarray(image)
+    else:
+        image = Image.open(image)
+    pixel_values = processor(image, return_tensors="pt").pixel_values
     generated_ids = model.generate(pixel_values)
     generated_text = processor.batch_decode(generated_ids, skip_special_tokens=True)[0]
     return generated_text
 # Create the Gradio interface
+image_input = gr.Image(type="numpy", label="Draw or Upload an Image")
+output_text = gr.Textbox(label="Recognized Text")
+gr.Interface(
+    fn=recognize_handwriting,
+    inputs=image_input,
+    outputs=output_text,
+    title="Handwritten Text Recognition",
+    description="Draw or upload an image of handwritten text to recognize it.",
+).launch()