robertselvam commited on
Commit
95a02ef
·
verified ·
1 Parent(s): 85a2286

Update summary_extractor.py

Browse files
Files changed (1) hide show
  1. summary_extractor.py +3 -3
summary_extractor.py CHANGED
@@ -8,8 +8,8 @@ from langchain.chains.mapreduce import MapReduceChain
8
  from langchain.text_splitter import CharacterTextSplitter
9
  from langchain.chains.summarize import load_summarize_chain
10
  from langchain.prompts import PromptTemplate
11
- from langchain_community.document_loaders import UnstructuredFileLoader
12
-
13
 
14
  class Extractor:
15
 
@@ -35,7 +35,7 @@ class Extractor:
35
  List[str]: List of text content from each page.
36
  """
37
  try:
38
- loader = UnstructuredFileLoader(pdf_file_path.name)
39
  pages = loader.load_and_split()
40
  return pages
41
 
 
8
  from langchain.text_splitter import CharacterTextSplitter
9
  from langchain.chains.summarize import load_summarize_chain
10
  from langchain.prompts import PromptTemplate
11
+ # from langchain_community.document_loaders import UnstructuredFileLoader
12
+ from langchain_community.document_loaders import PyPDFLoader
13
 
14
  class Extractor:
15
 
 
35
  List[str]: List of text content from each page.
36
  """
37
  try:
38
+ loader = PyPDFLoader(pdf_file_path.name)
39
  pages = loader.load_and_split()
40
  return pages
41