Spaces:
Running
Running
APPLE
committed on
Commit
·
a454e1c
1
Parent(s):
a5ad985
default
Browse files
app.py
CHANGED
@@ -1,25 +1,57 @@
|
|
1 |
from pathlib import Path
|
2 |
import streamlit as st
|
3 |
import os
|
|
|
4 |
|
5 |
-
from form16_parser import build_parser
|
|
|
|
|
|
|
|
|
|
|
|
|
6 |
|
7 |
def main():
|
8 |
st.title("Form16 Parser")
|
9 |
|
|
|
|
|
10 |
uploaded_file = st.file_uploader("Upload a PDF file", type="pdf")
|
11 |
Path("temp_files").mkdir(exist_ok=True, parents=True)
|
12 |
|
13 |
-
if uploaded_file is
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
14 |
# Save the uploaded file to a temporary directory
|
15 |
with open(os.path.join("temp_files", uploaded_file.name), "wb") as f:
|
16 |
f.write(uploaded_file.getvalue())
|
17 |
|
18 |
filepath = os.path.join("temp_files", uploaded_file.name)
|
19 |
parser = build_parser()
|
20 |
-
parsed = parser.parse(filepath, return_output=True)
|
21 |
|
22 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
23 |
|
24 |
|
25 |
|
|
|
1 |
from pathlib import Path
|
2 |
import streamlit as st
|
3 |
import os
|
4 |
+
import requests
|
5 |
|
6 |
+
from form16_parser import build_parser, UnsupportedForm16Error
|
7 |
+
|
8 |
+
badges = """[](https://github.com/INF800/form16-parser)
|
9 |
+
[](https://github.com/mkenney/software-guides/blob/master/STABILITY-BADGES.md#alpha)
|
10 |
+
[](https://github.com/INF800/form16-parser)
|
11 |
+
[]()
|
12 |
+
"""
|
13 |
|
14 |
def main():
|
15 |
st.title("Form16 Parser")
|
16 |
|
17 |
+
st.markdown(f"{badges}")
|
18 |
+
st.write("Source code available @ https://github.com/INF800/form16-parser")
|
19 |
uploaded_file = st.file_uploader("Upload a PDF file", type="pdf")
|
20 |
Path("temp_files").mkdir(exist_ok=True, parents=True)
|
21 |
|
22 |
+
if uploaded_file is None:
|
23 |
+
# If no file is uploaded, load the default PDF file
|
24 |
+
default_pdf_url = "https://assets1.cleartax-cdn.com/cleartax/images/1655725194_sampleform16.pdf"
|
25 |
+
path = Path("temp_files/sampleform16.pdf")
|
26 |
+
# if not path.exists():
|
27 |
+
default_pdf_response = requests.get(default_pdf_url)
|
28 |
+
|
29 |
+
with open(str(path), "wb") as f:
|
30 |
+
f.write(default_pdf_response.content)
|
31 |
+
|
32 |
+
st.write(f"Parsing {default_pdf_url}.")
|
33 |
+
st.write("Try your own form 16 by uploading above.")
|
34 |
+
|
35 |
+
parser = build_parser()
|
36 |
+
parsed = parser.parse(str(path), return_output=True)
|
37 |
+
|
38 |
+
st.write("Parsed data (structured):")
|
39 |
+
st.write(parsed)
|
40 |
+
else:
|
41 |
# Save the uploaded file to a temporary directory
|
42 |
with open(os.path.join("temp_files", uploaded_file.name), "wb") as f:
|
43 |
f.write(uploaded_file.getvalue())
|
44 |
|
45 |
filepath = os.path.join("temp_files", uploaded_file.name)
|
46 |
parser = build_parser()
|
|
|
47 |
|
48 |
+
try:
|
49 |
+
parsed = parser.parse(filepath, return_output=True)
|
50 |
+
st.write("Parsed data (structured):")
|
51 |
+
st.write(parsed)
|
52 |
+
except UnsupportedForm16Error as e:
|
53 |
+
st.write(e)
|
54 |
+
|
55 |
|
56 |
|
57 |
|