eliot-hub committed on
Commit
9c5d425
·
1 Parent(s): 543c1bb
Files changed (1) hide show
  1. app.py +9 -1
app.py CHANGED
@@ -22,6 +22,9 @@ from langchain_huggingface import HuggingFaceEmbeddings
22
  import os
23
  from chroma_datasets.utils import import_into_chroma
24
  from datasets import load_dataset
 
 
 
25
 
26
  # Global params
27
  CHROMA_PATH = "chromadb_mem10_mxbai_800_complete"
@@ -31,11 +34,16 @@ LLM_NAME = "gpt-4o-mini"
31
  OPENAI_API_KEY = os.environ.get("OPENAI_API_KEY")
32
  MXBAI_API_KEY = os.environ.get("MXBAI_API_KEY")
33
  HF_TOKEN = os.environ.get("HF_TOKEN")
 
34
 
35
  # Load the reranker model
36
  device = "cuda:0" if torch.cuda.is_available() else "cpu"
37
  mxbai_client = MixedbreadAI(api_key=MXBAI_API_KEY)
38
  model_emb = "mixedbread-ai/mxbai-embed-large-v1"
 
 
 
 
39
 
40
  # Set up ChromaDB
41
  client = chromadb.Client()
@@ -46,7 +54,7 @@ dataset = load_dataset("eliot-hub/memoires_vec_800", split="data", token=HF_TOKE
46
  db = import_into_chroma(
47
  chroma_client=client,
48
  dataset=dataset,
49
- embedding_function=HuggingFaceEmbeddings(model_name=model_emb)
50
  )
51
  # db = Chroma(
52
  # client=client,
 
22
  import os
23
  from chroma_datasets.utils import import_into_chroma
24
  from datasets import load_dataset
25
+ import chromadb.utils.embedding_functions as embedding_functions
26
+
27
+
28
 
29
  # Global params
30
  CHROMA_PATH = "chromadb_mem10_mxbai_800_complete"
 
34
  OPENAI_API_KEY = os.environ.get("OPENAI_API_KEY")
35
  MXBAI_API_KEY = os.environ.get("MXBAI_API_KEY")
36
  HF_TOKEN = os.environ.get("HF_TOKEN")
37
+ HF_API_KEY = os.environ.get("HF_API_KEY")
38
 
39
  # Load the reranker model
40
  device = "cuda:0" if torch.cuda.is_available() else "cpu"
41
  mxbai_client = MixedbreadAI(api_key=MXBAI_API_KEY)
42
  model_emb = "mixedbread-ai/mxbai-embed-large-v1"
43
+ huggingface_ef = embedding_functions.HuggingFaceEmbeddingFunction(
44
+ api_key=HF_API_KEY,
45
+ model_name=model_emb
46
+ )
47
 
48
  # Set up ChromaDB
49
  client = chromadb.Client()
 
54
  db = import_into_chroma(
55
  chroma_client=client,
56
  dataset=dataset,
57
+ embedding_function=huggingface_ef
58
  )
59
  # db = Chroma(
60
  # client=client,