Nic Bonetto committed on
Commit
b2acd9d
·
unverified ·
2 Parent(s): 5e17c65 cec3ef2

Merge pull request #2 from NicBonetto/streamlit-app

Browse files
.gitattributes ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ trocr-ocr/* filter=lfs diff=lfs merge=lfs -text
2
+ trocr-ocr/** filter=lfs diff=lfs merge=lfs -text
3
+ model/** filter=lfs diff=lfs merge=lfs -text
README.md CHANGED
@@ -1,2 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
1
  # light-doc-ocr
2
  Lightweight Transformer-based OCR model for document text recognition, fine-tuned with PyTorch and Hugging Face.
 
1
+ ---
2
+ title: Light OCR Finetuned
3
+ emoji: "📝"
4
+ colorFrom: "purple"
5
+ colorTo: "blue"
6
+ sdk: streamlit
7
+ sdk_version: "1.25.0"
8
+ app_file: app.py
9
+ pinned: true
10
+ ---
11
+
12
  # light-doc-ocr
13
  Lightweight Transformer-based OCR model for document text recognition, fine-tuned with PyTorch and Hugging Face.
app.py ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
"""Streamlit front end for the OCR model stored under ``model/``.

The user uploads a PNG/JPEG image; the app shows the image and the text
decoded from the model's generated token ids.
"""

import streamlit
from PIL import Image
import torch
from transformers import TrOCRProcessor, VisionEncoderDecoderModel

MODEL_NAME = 'model/'


@streamlit.cache_resource
def _load_model(model_dir):
    """Return ``(processor, model)`` loaded from *model_dir*.

    Streamlit re-executes this script from the top on every widget
    interaction. Caching the loaded objects as a shared resource keeps the
    weights from being read from disk again on each rerun.
    """
    return (
        TrOCRProcessor.from_pretrained(model_dir),
        VisionEncoderDecoderModel.from_pretrained(model_dir),
    )


processor, model = _load_model(MODEL_NAME)

streamlit.title('Light OCR')

uploaded_file = streamlit.file_uploader('Choose an image...', type=['png', 'jpg', 'jpeg'])
if uploaded_file is not None:
    try:
        image = Image.open(uploaded_file).convert("RGB")
    except OSError:
        # The uploader filters by file extension only, so the payload may
        # still be corrupt or not an image at all. PIL reports that with
        # OSError (UnidentifiedImageError is a subclass).
        streamlit.error('Could not read the uploaded file as an image.')
        streamlit.stop()

    # NOTE(review): this fixed resize ignores the aspect ratio, and the
    # processor applies its own resizing as well -- confirm it matches the
    # preprocessing used during fine-tuning before changing it.
    image = image.resize((384, 384))
    streamlit.image(image, caption='Uploaded Image', use_column_width=True)

    pixel_values = processor(images=image, return_tensors='pt').pixel_values
    output_ids = model.generate(pixel_values)
    # batch_decode returns one string per input image; a single image was
    # passed, so take the first entry.
    text = processor.batch_decode(output_ids, skip_special_tokens=True)[0]

    streamlit.subheader('Recognized Text')
    streamlit.write(text)
24
+
model/config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:584e4b4106aa735f04ef9d5dd2e89250f3c98f36435a183fe98bd4888c4c5b2b
3
+ size 1529
model/generation_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66a55c9bff6d80e77c8deb6dba8dd79d867da689c7e0f1e1eddb265f8a92fb1b
3
+ size 185
model/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d77161e6a5564a2d70e53b5dabfad12b67fb2e9bd7c3cc7555b1fe056bc8826
3
+ size 246430696
model/preprocessor_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5172006ffcaf0f407db91ac4ada30ad6ca86183fa37ce6059f966bfaffb880cb
3
+ size 411
requirements.txt CHANGED
@@ -5,4 +5,5 @@ datasets
5
  evaluate
6
  jiwer
7
  Pillow
8
-
 
 
5
  evaluate
6
  jiwer
7
  Pillow
8
+ accelerate
9
+ streamlit