rvritesh167 committed on
Commit
a0cce57
·
1 Parent(s): a45b3b8

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +9 -9
app.py CHANGED
@@ -2,21 +2,21 @@ import streamlit as st
2
  from langchain.document_loaders import UnstructuredFileLoader
3
 
4
  def extract_text_from_pdf(uploaded_file):
5
- loader = UnstructuredFileLoader(uploaded_file)
6
- data = loader.load()
7
- txt = ''
8
- for item in data:
9
- txt += item.page_content
10
- return txt
11
 
12
  def main():
13
  st.title("PDF Text Extractor")
14
-
15
  uploaded_file = st.file_uploader("Upload a PDF file", type=["pdf"])
16
-
17
  if uploaded_file is not None:
18
  st.subheader("PDF Content:")
19
- text_content = extract_text_from_pdf(uploaded_file)
 
 
 
 
 
20
  st.text(text_content)
21
 
22
  if __name__ == "__main__":
 
2
  from langchain.document_loaders import UnstructuredFileLoader
3
 
4
  def extract_text_from_pdf(uploaded_file):
5
+
 
 
 
 
 
6
 
7
  def main():
8
  st.title("PDF Text Extractor")
9
+
10
  uploaded_file = st.file_uploader("Upload a PDF file", type=["pdf"])
11
+
12
  if uploaded_file is not None:
13
  st.subheader("PDF Content:")
14
+ loader = UnstructuredFileLoader(uploaded_file)
15
+ data = loader.load()
16
+ txt = ''
17
+ for item in data:
18
+ txt += item.page_content
19
+ text_content = txt
20
  st.text(text_content)
21
 
22
  if __name__ == "__main__":