Genzo1010 commited on
Commit
2748615
·
verified ·
1 Parent(s): 669720d

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +56 -5
app.py CHANGED
@@ -1,7 +1,58 @@
1
- import gradio as gr
 
 
 
 
 
 
2
 
3
- def greet(name):
4
- return "Hello " + name + "!!"
5
 
6
- demo = gr.Interface(fn=greet, inputs="text", outputs="text")
7
- demo.launch()
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from fastapi import FastAPI, File, UploadFile
2
+ import numpy as np
3
+ from PIL import Image
4
+ from paddleocr import PaddleOCR
5
+ from doctr.io import DocumentFile
6
+ from doctr.models import ocr_predictor
7
+ import io
8
 
9
+ app = FastAPI()
 
10
 
11
+ # Load the doctr OCR model
12
+ ocr_model = ocr_predictor(pretrained=True)
13
+
14
+ def ocr_with_doctr(file):
15
+ text_output = ''
16
+
17
+ # Load the document
18
+ doc = DocumentFile.from_pdf(file)
19
+
20
+ # Perform OCR
21
+ result = ocr_model(doc)
22
+
23
+ # Extract text from OCR result
24
+ for page in result.pages:
25
+ for block in page.blocks:
26
+ for line in block.lines:
27
+ text_output += " ".join([word.value for word in line.words]) + "\n"
28
+
29
+ return text_output
30
+
31
+ def ocr_with_paddle(img):
32
+ finaltext = ''
33
+ ocr = PaddleOCR(lang='en', use_angle_cls=True)
34
+ result = ocr.ocr(img)
35
+
36
+ for i in range(len(result[0])):
37
+ text = result[0][i][1][0]
38
+ finaltext += ' ' + text
39
+ return finaltext
40
+
41
+
42
+ def generate_text_from_image(img):
43
+ text_output = ''
44
+ text_output = ocr_with_paddle(img)
45
+ return text_output
46
+
47
+ @app.post("/ocr/")
48
+ async def perform_ocr(file: UploadFile = File(...)):
49
+
50
+ file_bytes = await file.read()
51
+
52
+ if file.filename.endswith('.pdf'):
53
+ text_output = ocr_with_doctr(io.BytesIO(file_bytes))
54
+ else:
55
+ img = np.array(Image.open(io.BytesIO(file_bytes)))
56
+ text_output = generate_text_from_image(img)
57
+
58
+ return {"ocr_text": text_output}