Spaces:

ml6team
/

byt5_ocr_corrector

Build error

App Files Community

Thomas Dehaene committed on Sep 28, 2021

Commit

af1842e

1 Parent(s): e948df6

Bump streamlit

Browse files

Files changed (1) hide show

app.py +16 -16

app.py CHANGED Viewed

@@ -5,30 +5,30 @@ import nlpaug.augmenter.char as nac
 import subprocess
 import sys
 import logging
 def install():
     subprocess.check_call([sys.executable, "-m", "pip", "install", "streamlit==0.89.0"])
 install()
-import streamlit as st
 logging.warning(st.__version__)
-st.markdown('# ByT5 Dutch OCR Corrector :pill:')
-st.write('This app corrects common dutch OCR mistakes, to showcase how this could be used in an OCR post-processing pipeline.')
-st.markdown("""
 To use this:
 - Enter a text with OCR mistakes and hit 'unscramble':point_down:
 - Or enter a normal text, scramble it :twisted_rightwards_arrows: and then hit 'unscramble' :point_down:""")
-@st.cache(allow_output_mutation=True,
           suppress_st_warning=True,
           show_spinner=False)
 def load_model():
-    with st.spinner('Please wait for the model to load...'):
         ocr_pipeline=pipeline(
             'text2text-generation',
             model='ml6team/byt5-base-dutch-ocr-correction',
@@ -39,10 +39,10 @@ def load_model():
 ocr_pipeline = load_model()
-if 'text' not in st.session_state:
-    st.session_state.text = ""
-left_area, right_area = st.beta_columns(2)
 # Format the left area
 left_area.header("Input")
@@ -58,16 +58,16 @@ right_area.header("Output")
 if scramble_button:
     aug = nac.OcrAug()
-    st.session_state.text = st.session_state.input_text
-    base_text = st.session_state.text
     augmented_data = aug.augment(base_text)
-    st.session_state.text = augmented_data
-    del st.session_state.input_text
     placeholder.empty()
-    input_text = placeholder.text_area(value=st.session_state.text, label='Insert text:', key='input_text')
 if submit_button:
-    base_text = st.session_state.input_text
     output_text = " ".join([x['generated_text'] for x in ocr_pipeline(wrap(base_text, 128))])
     right_area.markdown('#####')
     right_area.text_area(value=output_text, label="Corrected text:")

 import subprocess
 import sys
 import logging
+import importlib
 def install():
     subprocess.check_call([sys.executable, "-m", "pip", "install", "streamlit==0.89.0"])
 install()
+importlib.reload(streamlit)
 logging.warning(st.__version__)
+streamlit.markdown('# ByT5 Dutch OCR Corrector :pill:')
+streamlit.write('This app corrects common dutch OCR mistakes, to showcase how this could be used in an OCR post-processing pipeline.')
+streamlit.markdown("""
 To use this:
 - Enter a text with OCR mistakes and hit 'unscramble':point_down:
 - Or enter a normal text, scramble it :twisted_rightwards_arrows: and then hit 'unscramble' :point_down:""")
+@streamlit.cache(allow_output_mutation=True,
           suppress_st_warning=True,
           show_spinner=False)
 def load_model():
+    with streamlit.spinner('Please wait for the model to load...'):
         ocr_pipeline=pipeline(
             'text2text-generation',
             model='ml6team/byt5-base-dutch-ocr-correction',
 ocr_pipeline = load_model()
+if 'text' not in streamlit.session_state:
+    streamlit.session_state.text = ""
+left_area, right_area = streamlit.beta_columns(2)
 # Format the left area
 left_area.header("Input")
 if scramble_button:
     aug = nac.OcrAug()
+    streamlit.session_state.text = streamlit.session_state.input_text
+    base_text = streamlit.session_state.text
     augmented_data = aug.augment(base_text)
+    streamlit.session_state.text = augmented_data
+    del streamlit.session_state.input_text
     placeholder.empty()
+    input_text = placeholder.text_area(value=streamlit.session_state.text, label='Insert text:', key='input_text')
 if submit_button:
+    base_text = streamlit.session_state.input_text
     output_text = " ".join([x['generated_text'] for x in ocr_pipeline(wrap(base_text, 128))])
     right_area.markdown('#####')
     right_area.text_area(value=output_text, label="Corrected text:")