# Spaces: Sleeping  (Hugging Face page banner captured with the file; not part of the program)
import streamlit as st | |
import pandas as pd | |
from PIL import Image | |
import io | |
from pdf_processing import process_comparison_data, extract_text_with_pypdf | |
def simulate_processing(pdf1, pdf2, tags):
    """Return fixed sample comparison rows (placeholder for real processing).

    The arguments are accepted but never read; the same rows are returned
    for every call.

    Args:
        pdf1: First PDF input (ignored).
        pdf2: Second PDF input (ignored).
        tags: Tags to compare (ignored).

    Returns:
        A list of two 3-tuples of strings: a label followed by two sample
        values.
    """
    # Placeholder data. Replace with actual processing logic.
    return [
        ('key', 'Sample Data 1', 'Sample Data 2'),
        ('index', 'More Sample Data 1', 'More Sample Data 2'),
    ]
# App title
st.title("PDF Tag Processing")

# Sidebar: the two PDFs to compare and the tags to look up in them.
st.sidebar.header("Input Configuration")
uploaded_file1 = st.sidebar.file_uploader("Upload First PDF", type="pdf")
uploaded_file2 = st.sidebar.file_uploader("Upload Second PDF", type="pdf")
# Free-text field holding the tags as a single comma-separated string.
tags_input = st.sidebar.text_area("Enter Tags (comma-separated)")
# Process button: validate the inputs, then run the comparison and show it.
if st.button("Process"):
    # Parse before validating so that input made only of commas and/or
    # whitespace (e.g. " , ,") is reported as missing tags instead of
    # reaching the comparison with an empty tag list.
    tags = [tag.strip() for tag in tags_input.split(',') if tag.strip()]

    if not uploaded_file1:
        st.error("Please upload a PDF file in the first pdf space")
    elif not uploaded_file2:
        st.error("Please upload a PDF file in the second pdf space")
    elif not tags:
        st.error("Please add some tags in the text area")
    else:
        # NOTE(review): presumably returns a pandas DataFrame; confirm
        # against pdf_processing.process_comparison_data.
        df = process_comparison_data(uploaded_file1, uploaded_file2, tags)

        # Display results in a table
        st.subheader("Results")
        st.dataframe(df)
# Display instructions
st.write("""
This app allows you to upload two PDF files and enter tags. When you click "Process",
it extracts information related to the tags from both the pdfs and compares the information
in each pdf for each tag and displays the results in a table.
""")

# Add an image to illustrate the concept.
# The path is relative to the working directory; replace the file with your
# own image. A missing illustration is reported as a warning so it does not
# abort the rest of the page.
try:
    image = Image.open('doaz_image.png')
except FileNotFoundError:
    st.warning("Image 'doaz_image.png' was not found.")
else:
    # Image.open keeps the file open until the data is read; the context
    # manager releases the handle once the image has been rendered.
    with image:
        st.image(image, caption='Doaz')