Spaces:
Sleeping
Sleeping
emb_func
Browse files
app.py
CHANGED
@@ -22,6 +22,9 @@ from langchain_huggingface import HuggingFaceEmbeddings
|
|
22 |
import os
|
23 |
from chroma_datasets.utils import import_into_chroma
|
24 |
from datasets import load_dataset
|
|
|
|
|
|
|
25 |
|
26 |
# Global params
|
27 |
CHROMA_PATH = "chromadb_mem10_mxbai_800_complete"
|
@@ -31,11 +34,16 @@ LLM_NAME = "gpt-4o-mini"
|
|
31 |
OPENAI_API_KEY = os.environ.get("OPENAI_API_KEY")
|
32 |
MXBAI_API_KEY = os.environ.get("MXBAI_API_KEY")
|
33 |
HF_TOKEN = os.environ.get("HF_TOKEN")
|
|
|
34 |
|
35 |
# Load the reranker model
|
36 |
device = "cuda:0" if torch.cuda.is_available() else "cpu"
|
37 |
mxbai_client = MixedbreadAI(api_key=MXBAI_API_KEY)
|
38 |
model_emb = "mixedbread-ai/mxbai-embed-large-v1"
|
|
|
|
|
|
|
|
|
39 |
|
40 |
# Set up ChromaDB
|
41 |
client = chromadb.Client()
|
@@ -46,7 +54,7 @@ dataset = load_dataset("eliot-hub/memoires_vec_800", split="data", token=HF_TOKE
|
|
46 |
db = import_into_chroma(
|
47 |
chroma_client=client,
|
48 |
dataset=dataset,
|
49 |
-
embedding_function=
|
50 |
)
|
51 |
# db = Chroma(
|
52 |
# client=client,
|
|
|
22 |
import os
|
23 |
from chroma_datasets.utils import import_into_chroma
|
24 |
from datasets import load_dataset
|
25 |
+
import chromadb.utils.embedding_functions as embedding_functions
|
26 |
+
|
27 |
+
|
28 |
|
29 |
# Global params
|
30 |
CHROMA_PATH = "chromadb_mem10_mxbai_800_complete"
|
|
|
34 |
OPENAI_API_KEY = os.environ.get("OPENAI_API_KEY")
|
35 |
MXBAI_API_KEY = os.environ.get("MXBAI_API_KEY")
|
36 |
HF_TOKEN = os.environ.get("HF_TOKEN")
|
37 |
+
HF_API_KEY = os.environ.get("HF_API_KEY")
|
38 |
|
39 |
# Load the reranker model
|
40 |
device = "cuda:0" if torch.cuda.is_available() else "cpu"
|
41 |
mxbai_client = MixedbreadAI(api_key=MXBAI_API_KEY)
|
42 |
model_emb = "mixedbread-ai/mxbai-embed-large-v1"
|
43 |
+
huggingface_ef = embedding_functions.HuggingFaceEmbeddingFunction(
|
44 |
+
api_key=HF_API_KEY,
|
45 |
+
model_name=model_emb
|
46 |
+
)
|
47 |
|
48 |
# Set up ChromaDB
|
49 |
client = chromadb.Client()
|
|
|
54 |
db = import_into_chroma(
|
55 |
chroma_client=client,
|
56 |
dataset=dataset,
|
57 |
+
embedding_function=huggingface_ef
|
58 |
)
|
59 |
# db = Chroma(
|
60 |
# client=client,
|