form16-parser / app.py
APPLE
default
a454e1c
from pathlib import Path
import streamlit as st
import os
import requests
from form16_parser import build_parser, UnsupportedForm16Error
badges = """[![](https://img.shields.io/static/v1?label=Licence&message=MIT&color=darkgreen)](https://github.com/INF800/form16-parser)
[![stability-alpha](https://img.shields.io/badge/stability-alpha-f4d03f.svg)](https://github.com/mkenney/software-guides/blob/master/STABILITY-BADGES.md#alpha)
[![](https://img.shields.io/static/v1?label=Python&message=3.10+&color=indigo)](https://github.com/INF800/form16-parser)
[![im](https://img.shields.io/github/stars/INF800/form16-parser.svg?style=social&)]()
"""
def main():
st.title("Form16 Parser")
st.markdown(f"{badges}")
st.write("Source code available @ https://github.com/INF800/form16-parser")
uploaded_file = st.file_uploader("Upload a PDF file", type="pdf")
Path("temp_files").mkdir(exist_ok=True, parents=True)
if uploaded_file is None:
# If no file is uploaded, load the default PDF file
default_pdf_url = "https://assets1.cleartax-cdn.com/cleartax/images/1655725194_sampleform16.pdf"
path = Path("temp_files/sampleform16.pdf")
# if not path.exists():
default_pdf_response = requests.get(default_pdf_url)
with open(str(path), "wb") as f:
f.write(default_pdf_response.content)
st.write(f"Parsing {default_pdf_url}.")
st.write("Try your own form 16 by uploading above.")
parser = build_parser()
parsed = parser.parse(str(path), return_output=True)
st.write("Parsed data (structured):")
st.write(parsed)
else:
# Save the uploaded file to a temporary directory
with open(os.path.join("temp_files", uploaded_file.name), "wb") as f:
f.write(uploaded_file.getvalue())
filepath = os.path.join("temp_files", uploaded_file.name)
parser = build_parser()
try:
parsed = parser.parse(filepath, return_output=True)
st.write("Parsed data (structured):")
st.write(parsed)
except UnsupportedForm16Error as e:
st.write(e)
if __name__ == "__main__":
main()