pragnakalp
committed on
Commit
•
03ceac8
1
Parent(s):
f84a87f
Update app.py
Browse files
app.py
CHANGED
@@ -16,22 +16,32 @@ import socket
|
|
16 |
# from send_email_user import send_user_email
|
17 |
from huggingface_hub import HfApi
|
18 |
import smtplib
|
19 |
-
|
20 |
-
#
|
21 |
-
#
|
22 |
-
#
|
23 |
-
|
24 |
-
|
25 |
-
|
26 |
-
|
27 |
-
|
28 |
-
|
29 |
-
|
30 |
-
|
31 |
-
|
32 |
-
|
33 |
-
|
34 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
35 |
def get_device_ip_address():
|
36 |
|
37 |
if os.name == "nt":
|
@@ -55,7 +65,6 @@ def get_device_ip_address():
|
|
55 |
return result
|
56 |
|
57 |
|
58 |
-
|
59 |
"""
|
60 |
Paddle OCR
|
61 |
"""
|
@@ -115,6 +124,15 @@ def generate_ocr(Method,img):
|
|
115 |
text_output = ocr_with_keras(img)
|
116 |
if Method == 'PaddleOCR':
|
117 |
text_output = ocr_with_paddle(img)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
118 |
# save_details(Method,text_output,img)
|
119 |
# sender="[email protected]"
|
120 |
# password="httscgatatbbxxur"
|
@@ -197,11 +215,10 @@ demo = gr.Interface(
|
|
197 |
[method,image],
|
198 |
output,
|
199 |
title="Optical Character Recognition",
|
200 |
-
description="Try OCR with different methods",
|
201 |
-
theme="darkpeach",
|
202 |
css=".gradio-container {background-color: lightgray} #radio_div {background-color: #FFD8B4; font-size: 40px;}",
|
203 |
allow_flagging = "manual",
|
204 |
-
flagging_dir = "flagged",
|
205 |
-
flagging_callback=hf_writer
|
206 |
)
|
207 |
demo.launch(enable_queue = False)
|
|
|
16 |
# from send_email_user import send_user_email
|
17 |
from huggingface_hub import HfApi
|
18 |
import smtplib
|
19 |
+
|
20 |
+
# HF_TOKEN = os.getenv('HF_TOKEN')
|
21 |
+
# print("$$$$$$$$$$$$$$$$$$$$$$$$$$$$",type(HF_TOKEN))
|
22 |
+
# hf_writer = gr.HuggingFaceDatasetSaver(HF_TOKEN,'OCR-image-to-text',True,True)
|
23 |
+
|
24 |
+
|
25 |
+
DATASET_REPO_URL = "https://huggingface.co/datasets/pragnakalp/OCR-img-to-text"
|
26 |
+
DATA_FILENAME = "ocr_data.csv"
|
27 |
+
DATA_FILE = os.path.join("ocr_data", DATA_FILENAME)
|
28 |
+
HF_TOKEN = os.environ.get("HF_TOKEN")
|
29 |
+
DATASET_REPO_ID = "pragnakalp/OCR-img-to-text"
|
30 |
+
print("is none?", HF_TOKEN is None)
|
31 |
+
try:
|
32 |
+
hf_hub_download(
|
33 |
+
repo_id=DATASET_REPO_ID,
|
34 |
+
filename=DATA_FILENAME,
|
35 |
+
cache_dir=DATA_DIRNAME,
|
36 |
+
force_filename=DATA_FILENAME
|
37 |
+
)
|
38 |
+
except:
|
39 |
+
print("file not found")
|
40 |
+
|
41 |
+
repo = Repository(
|
42 |
+
local_dir="ocr_data", clone_from=DATASET_REPO_URL, use_auth_token=HF_TOKEN
|
43 |
+
)
|
44 |
+
|
45 |
def get_device_ip_address():
|
46 |
|
47 |
if os.name == "nt":
|
|
|
65 |
return result
|
66 |
|
67 |
|
|
|
68 |
"""
|
69 |
Paddle OCR
|
70 |
"""
|
|
|
124 |
text_output = ocr_with_keras(img)
|
125 |
if Method == 'PaddleOCR':
|
126 |
text_output = ocr_with_paddle(img)
|
127 |
+
|
128 |
+
with open(DATA_FILE, "a") as csvfile:
|
129 |
+
writer = csv.DictWriter(csvfile, fieldnames=["method", "image", "generated_text"])
|
130 |
+
writer.writerow(
|
131 |
+
{"method": Method, "image": img, "generated_text": text_output}
|
132 |
+
)
|
133 |
+
commit_url = repo.push_to_hub()
|
134 |
+
print(commit_url)
|
135 |
+
|
136 |
# save_details(Method,text_output,img)
|
137 |
# sender="[email protected]"
|
138 |
# password="httscgatatbbxxur"
|
|
|
215 |
[method,image],
|
216 |
output,
|
217 |
title="Optical Character Recognition",
|
218 |
+
description="Try OCR with different methods",
|
|
|
219 |
css=".gradio-container {background-color: lightgray} #radio_div {background-color: #FFD8B4; font-size: 40px;}",
|
220 |
allow_flagging = "manual",
|
221 |
+
# flagging_dir = "flagged",
|
222 |
+
# flagging_callback=hf_writer
|
223 |
)
|
224 |
demo.launch(enable_queue = False)
|