mciancone committed on
Commit
82c01c8
·
verified ·
1 Parent(s): 0272d78

Upload app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -51,7 +51,6 @@ def get_parser(fileext : str) -> AbstractParser:
51
  parser = PdfParser(
52
  use_ocr="never",
53
  )
54
- log("For the purpose of this demo, OCR on .pdf documents is deactivated.", "info")
55
  case ".docx":
56
  parser = DocxParser()
57
  case ".xls" | ".xlsx" | ".xlsm" | ".xlsb" | ".odf" | ".ods" | ".odt":
@@ -82,7 +81,6 @@ def parse_and_chunk(uploaded_file : UploadedFile):
82
  log("Parsing and chunking...", "info")
83
 
84
  try:
85
- print(uploaded_file)
86
  fileext = Path(uploaded_file.name).suffix.lower()
87
  parser = get_parser(fileext)
88
  start_time = time.perf_counter()
@@ -265,6 +263,8 @@ with col1:
265
  mime="text/markdown",
266
  use_container_width=True,
267
  )
 
 
268
  with st.expander("Parsed document", expanded=True):
269
  with st.container(height=600, border=False):
270
  st.markdown(ss.parsed_md)
 
51
  parser = PdfParser(
52
  use_ocr="never",
53
  )
 
54
  case ".docx":
55
  parser = DocxParser()
56
  case ".xls" | ".xlsx" | ".xlsm" | ".xlsb" | ".odf" | ".ods" | ".odt":
 
81
  log("Parsing and chunking...", "info")
82
 
83
  try:
 
84
  fileext = Path(uploaded_file.name).suffix.lower()
85
  parser = get_parser(fileext)
86
  start_time = time.perf_counter()
 
263
  mime="text/markdown",
264
  use_container_width=True,
265
  )
266
+ if Path(uploaded_file.name).suffix.lower() == ".pdf":
267
+ st.info("For the purpose of this demo, OCR on pdf documents is deactivated.", icon="ℹ️")
268
  with st.expander("Parsed document", expanded=True):
269
  with st.container(height=600, border=False):
270
  st.markdown(ss.parsed_md)