Spaces:
Running
Running
Upload app.py
Browse files
app.py
CHANGED
@@ -51,7 +51,6 @@ def get_parser(fileext : str) -> AbstractParser:
|
|
51 |
parser = PdfParser(
|
52 |
use_ocr="never",
|
53 |
)
|
54 |
-
log("For the purpose of this demo, OCR on .pdf documents is deactivated.", "info")
|
55 |
case ".docx":
|
56 |
parser = DocxParser()
|
57 |
case ".xls" | ".xlsx" | ".xlsm" | ".xlsb" | ".odf" | ".ods" | ".odt":
|
@@ -82,7 +81,6 @@ def parse_and_chunk(uploaded_file : UploadedFile):
|
|
82 |
log("Parsing and chunking...", "info")
|
83 |
|
84 |
try:
|
85 |
-
print(uploaded_file)
|
86 |
fileext = Path(uploaded_file.name).suffix.lower()
|
87 |
parser = get_parser(fileext)
|
88 |
start_time = time.perf_counter()
|
@@ -265,6 +263,8 @@ with col1:
|
|
265 |
mime="text/markdown",
|
266 |
use_container_width=True,
|
267 |
)
|
|
|
|
|
268 |
with st.expander("Parsed document", expanded=True):
|
269 |
with st.container(height=600, border=False):
|
270 |
st.markdown(ss.parsed_md)
|
|
|
51 |
parser = PdfParser(
|
52 |
use_ocr="never",
|
53 |
)
|
|
|
54 |
case ".docx":
|
55 |
parser = DocxParser()
|
56 |
case ".xls" | ".xlsx" | ".xlsm" | ".xlsb" | ".odf" | ".ods" | ".odt":
|
|
|
81 |
log("Parsing and chunking...", "info")
|
82 |
|
83 |
try:
|
|
|
84 |
fileext = Path(uploaded_file.name).suffix.lower()
|
85 |
parser = get_parser(fileext)
|
86 |
start_time = time.perf_counter()
|
|
|
263 |
mime="text/markdown",
|
264 |
use_container_width=True,
|
265 |
)
|
266 |
+
if Path(uploaded_file.name).suffix.lower() == ".pdf":
|
267 |
+
st.info("For the purpose of this demo, OCR on pdf documents is deactivated.", icon="ℹ️")
|
268 |
with st.expander("Parsed document", expanded=True):
|
269 |
with st.container(height=600, border=False):
|
270 |
st.markdown(ss.parsed_md)
|