demoPOC committed on
Commit
ce04a13
·
1 Parent(s): 0cbb22a

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +17 -5
app.py CHANGED
@@ -24,7 +24,9 @@ import openai
24
  from langchain.llms import OpenAI
25
 
26
  from langchain.embeddings.openai import OpenAIEmbeddings
27
- #from langchain.embeddings.sentence_transformer import SentenceTransformerEmbeddings
 
 
28
 
29
  from langchain.document_loaders import SeleniumURLLoader, PyPDFLoader
30
 
@@ -61,10 +63,20 @@ def pretty_print_docs(docs):
61
 
62
 
63
  def getEmbeddingModel(embeddingId):
64
- # if (embeddingId == 1):
65
- # embeddings = SentenceTransformerEmbeddings(model_name="all-MiniLM-L6-v2")
66
- # else:
67
- # embeddings = OpenAIEmbeddings()
 
 
 
 
 
 
 
 
 
 
68
  return OpenAIEmbeddings()
69
 
70
 
 
24
  from langchain.llms import OpenAI
25
 
26
  from langchain.embeddings.openai import OpenAIEmbeddings
27
+ from langchain.embeddings import HuggingFaceBgeEmbeddings
28
+ from langchain.embeddings import HuggingFaceInstructEmbeddings
29
+ from langchain.embeddings import SentenceTransformerEmbeddings
30
 
31
  from langchain.document_loaders import SeleniumURLLoader, PyPDFLoader
32
 
 
63
 
64
 
65
  def getEmbeddingModel(embeddingId):
66
+ if (embeddingId == 1):
67
+ embeddings = SentenceTransformerEmbeddings(model_name="all-MiniLM-L6-v2")
68
+ elif (embeddingId == 2):
69
+ model_name = "hkunlp/instructor-large"
70
+ model_kwargs = {'device': 'cpu'}
71
+ encode_kwargs = {'normalize_embeddings': True}
72
+ embeddings = HuggingFaceInstructEmbeddings(model_name=model_name,model_kwargs=model_kwargs,encode_kwargs=encode_kwargs)
73
+ elif (embeddingId == 2):
74
+ model_name = "BAAI/bge-large-en-v1.5"
75
+ model_kwargs = {'device': 'cuda'}
76
+ encode_kwargs = {'normalize_embeddings': True} # set True to compute cosine similarity
77
+ model = HuggingFaceBgeEmbeddings(model_name=model_name,model_kwargs=model_kwargs,encode_kwargs=encode_kwargs)
78
+ else:
79
+ embeddings = OpenAIEmbeddings()
80
  return OpenAIEmbeddings()
81
 
82