Kathirsci commited on
Commit
895f085
·
verified ·
1 Parent(s): 620a8a5

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -3
app.py CHANGED
@@ -3,7 +3,8 @@ import tempfile
3
  import logging
4
  from typing import List
5
  from langchain_community.document_loaders import PyPDFLoader
6
- from langchain_community.embeddings import HuggingFaceEmbeddings
 
7
  from langchain_community.vectorstores import FAISS
8
  from langchain_community.llms import HuggingFacePipeline
9
  from langchain.chains.summarize import load_summarize_chain
@@ -18,7 +19,7 @@ logger = logging.getLogger(__name__)
18
 
19
  # Constants
20
  EMBEDDING_MODEL = 'sentence-transformers/all-MiniLM-L6-v2'
21
- DEFAULT_MODEL = "llava-v1.6-mistral-7b"
22
 
23
  @st.cache_resource
24
  def load_embeddings():
@@ -50,7 +51,7 @@ def process_pdf(file) -> List[Document]:
50
 
51
  loader = PyPDFLoader(file_path=temp_file_path)
52
  pages = loader.load()
53
- text_splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=200)
54
  documents = text_splitter.split_documents(pages)
55
  return documents
56
  except Exception as e:
 
3
  import logging
4
  from typing import List
5
  from langchain_community.document_loaders import PyPDFLoader
6
+ #from langchain_community.embeddings import HuggingFaceEmbeddings
7
+ from langchain_huggingface import HuggingFaceEmbeddings
8
  from langchain_community.vectorstores import FAISS
9
  from langchain_community.llms import HuggingFacePipeline
10
  from langchain.chains.summarize import load_summarize_chain
 
19
 
20
  # Constants
21
  EMBEDDING_MODEL = 'sentence-transformers/all-MiniLM-L6-v2'
22
+ DEFAULT_MODEL = "llava-v1.6-mistral-7b-hf"
23
 
24
  @st.cache_resource
25
  def load_embeddings():
 
51
 
52
  loader = PyPDFLoader(file_path=temp_file_path)
53
  pages = loader.load()
54
+ text_splitter = RecursiveCharacterTextSplitter(chunk_size=4000, chunk_overlap=200)
55
  documents = text_splitter.split_documents(pages)
56
  return documents
57
  except Exception as e: