sourabhzanwar committed on
Commit
684322b
·
1 Parent(s): 1dbfcd2

Temporarily removed the additional PDF-to-text conversion function

Browse files
Files changed (1) hide show
  1. utils/haystack.py +2 -6
utils/haystack.py CHANGED
@@ -5,15 +5,11 @@ from haystack import Pipeline
5
  from haystack.schema import Answer
6
  from haystack.document_stores import BaseDocumentStore
7
  from haystack.document_stores import InMemoryDocumentStore, OpenSearchDocumentStore, WeaviateDocumentStore
8
- from haystack.nodes import EmbeddingRetriever, FARMReader, PromptNode, PreProcessor, TextConverter, FileTypeClassifier, PDFToTextConverter
 
9
  from milvus_haystack import MilvusDocumentStore
10
  #Use this file to set up your Haystack pipeline and querying
11
 
12
- file_type_classifier = FileTypeClassifier()
13
-
14
- text_converter = TextConverter()
15
- pdf_converter = PDFToTextConverter()
16
-
17
  @st.cache_resource(show_spinner=False)
18
  def start_preprocessor_node():
19
  print('initializing preprocessor node')
 
5
  from haystack.schema import Answer
6
  from haystack.document_stores import BaseDocumentStore
7
  from haystack.document_stores import InMemoryDocumentStore, OpenSearchDocumentStore, WeaviateDocumentStore
8
+ from haystack.nodes import EmbeddingRetriever, FARMReader, PromptNode, PreProcessor
9
+ #from haystack.nodes import TextConverter, FileTypeClassifier, PDFToTextConverter
10
  from milvus_haystack import MilvusDocumentStore
11
  #Use this file to set up your Haystack pipeline and querying
12
 
 
 
 
 
 
13
  @st.cache_resource(show_spinner=False)
14
  def start_preprocessor_node():
15
  print('initializing preprocessor node')