ipvikas commited on
Commit
2b636b0
·
verified ·
1 Parent(s): 2c804fd

Create OCR_Image_to_Text.py

Browse files
Files changed (1) hide show
  1. OCR_Image_to_Text.py +69 -0
OCR_Image_to_Text.py ADDED
@@ -0,0 +1,69 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # # First uninstall existing packages to avoid conflicts
2
+ # # !pip uninstall -y httpx googletrans gradio easyocr
3
+
4
+ # !pip install httpx==0.24.1
5
+ # !pip install googletrans-py==4.0.0
6
+ # !pip install gradio==3.50.2
7
+ # !pip install easyocr==1.7.1
8
+
9
+ # !pip install numpy Pillow easyocr gradio googletrans==3.1.0a0
10
+
11
+ import gradio as gr
12
+ import os
13
+ from googletrans import Translator
14
+ import easyocr
15
+ from PIL import Image
16
+ from PIL import ImageDraw
17
+ import numpy as np
18
+
19
+ def Get_OCR_demo(image):
20
+ try:
21
+ # Initialize EasyOCR reader
22
+ reader = easyocr.Reader(['en'])
23
+ translator = Translator()
24
+
25
+ # Convert image to numpy array if it isn't already
26
+ if isinstance(image, str):
27
+ # If image is a file path
28
+ image_array = np.array(Image.open(image))
29
+ elif isinstance(image, np.ndarray):
30
+ # If image is already a numpy array
31
+ image_array = image
32
+ else:
33
+ raise ValueError("Unsupported image format")
34
+
35
+ # Perform OCR
36
+ text_list = reader.readtext(
37
+ image_array,
38
+ add_margin=0.55,
39
+ width_ths=0.7,
40
+ link_threshold=0.8,
41
+ decoder='beamsearch',
42
+ blocklist='=-',
43
+ detail=0
44
+ )
45
+
46
+ # Combine text results
47
+ text_comb = ' '.join(text_list) if text_list else "No text detected"
48
+ return text_comb
49
+
50
+ except Exception as e:
51
+ return f"Error processing image: {str(e)}"
52
+
53
+ # Create Gradio interface
54
+ title = "Upload an image and extract Text from it"
55
+ description = "OCR tool for text extraction"
56
+ examples=[["english.png"],["Parag_Letter_j.jpg"]]
57
+
58
+ get_OCR_demo = gr.Interface(
59
+ fn=Get_OCR_demo,
60
+ inputs=gr.Image(label="Upload Image"), # Removed type="filepath"
61
+ outputs=gr.Textbox(label="Extracted Text"),
62
+ title=title,
63
+ description=description,
64
+ cache_examples=False,
65
+ examples=examples
66
+ )
67
+
68
+ # if __name__ == "__main__":
69
+ # get_OCR_demo.launch()