Spaces:
Sleeping
Sleeping
Merge pull request #2 from NicBonetto/streamlit-app
Browse files- .gitattributes +3 -0
- README.md +11 -0
- app.py +24 -0
- model/config.json +3 -0
- model/generation_config.json +3 -0
- model/model.safetensors +3 -0
- model/preprocessor_config.json +3 -0
- requirements.txt +2 -1
.gitattributes
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
trocr-ocr/* filter=lfs diff=lfs merge=lfs -text
|
2 |
+
trocr-ocr/** filter=lfs diff=lfs merge=lfs -text
|
3 |
+
model/** filter=lfs diff=lfs merge=lfs -text
|
README.md
CHANGED
@@ -1,2 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
# light-doc-ocr
|
2 |
Lightweight Transformer-based OCR model for document text recognition, fine-tuned with PyTorch and Hugging Face.
|
|
|
1 |
+
---
|
2 |
+
title: Light OCR Finetuned
|
3 |
+
emoji: "📝"
|
4 |
+
colorFrom: "purple"
|
5 |
+
colorTo: "blue"
|
6 |
+
sdk: streamlit
|
7 |
+
sdk_version: "1.25.0"
|
8 |
+
app_file: app.py
|
9 |
+
pinned: true
|
10 |
+
---
|
11 |
+
|
12 |
# light-doc-ocr
|
13 |
Lightweight Transformer-based OCR model for document text recognition, fine-tuned with PyTorch and Hugging Face.
|
app.py
ADDED
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import streamlit
|
2 |
+
from PIL import Image
|
3 |
+
import torch
|
4 |
+
from transformers import TrOCRProcessor, VisionEncoderDecoderModel
|
5 |
+
|
6 |
+
MODEL_NAME = 'model/'


@streamlit.cache_resource
def load_model(model_dir=MODEL_NAME):
    """Load the TrOCR processor and model from ``model_dir`` once.

    Streamlit re-executes this script from the top on every widget
    interaction (including each file upload).  Without caching, the
    processor and the model weights would be re-read from disk on every
    rerun; ``cache_resource`` keeps a single shared instance alive across
    reruns and sessions instead.

    Args:
        model_dir: Directory (or model identifier) passed to
            ``from_pretrained`` for both the processor and the model.

    Returns:
        A ``(processor, model)`` tuple.
    """
    return (
        TrOCRProcessor.from_pretrained(model_dir),
        VisionEncoderDecoderModel.from_pretrained(model_dir),
    )


# Module-level names are kept so the rest of the script reads as before.
processor, model = load_model()

streamlit.title('Light OCR')

uploaded_file = streamlit.file_uploader('Choose an image...', type=['png', 'jpg', 'jpeg'])
# file_uploader returns None until the user has picked a file.
if uploaded_file is not None:
    try:
        image = Image.open(uploaded_file).convert("RGB")
    except OSError:
        # Pillow signals unreadable/corrupt image data with an OSError
        # subclass; show a message instead of a raw traceback and end this run.
        streamlit.error('Could not read the uploaded file as an image.')
        streamlit.stop()

    # The same 384x384 image is both displayed and fed to the processor.
    image = image.resize((384, 384))
    streamlit.image(image, caption='Uploaded Image', use_column_width=True)

    pixel_values = processor(images=image, return_tensors='pt').pixel_values
    output_ids = model.generate(pixel_values)
    # A single image was submitted, so the batch holds exactly one string.
    text = processor.batch_decode(output_ids, skip_special_tokens=True)[0]

    streamlit.subheader('Recognized Text')
    streamlit.write(text)
|
24 |
+
|
model/config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:584e4b4106aa735f04ef9d5dd2e89250f3c98f36435a183fe98bd4888c4c5b2b
|
3 |
+
size 1529
|
model/generation_config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66a55c9bff6d80e77c8deb6dba8dd79d867da689c7e0f1e1eddb265f8a92fb1b
|
3 |
+
size 185
|
model/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d77161e6a5564a2d70e53b5dabfad12b67fb2e9bd7c3cc7555b1fe056bc8826
|
3 |
+
size 246430696
|
model/preprocessor_config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5172006ffcaf0f407db91ac4ada30ad6ca86183fa37ce6059f966bfaffb880cb
|
3 |
+
size 411
|
requirements.txt
CHANGED
@@ -5,4 +5,5 @@ datasets
|
|
5 |
evaluate
|
6 |
jiwer
|
7 |
Pillow
|
8 |
-
|
|
|
|
5 |
evaluate
|
6 |
jiwer
|
7 |
Pillow
|
8 |
+
accelerate
|
9 |
+
streamlit
|