File size: 1,071 Bytes
c498106
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
from config import *
import chromadb
from chromadb.utils import embedding_functions
from config import OPENAI_API_KEY
from utils import generate_uuid

# OpenAI embedding model name and the Chroma embedding function built on it.
# NOTE(review): openai_ef is not passed to the collections created below in
# this file -- confirm whether other modules use it (e.g. to embed queries).
emmbedding_model = "text-embedding-3-large"
openai_ef = embedding_functions.OpenAIEmbeddingFunction(
    api_key=OPENAI_API_KEY,
    model_name=emmbedding_model,
)

# `deploy` is not defined in this file; presumably it comes from the
# `from config import *` above. It selects between a path relative to the
# working directory and a fixed absolute path for the on-disk store.
chroma_client = chromadb.PersistentClient(
    path="./data/emeddeings" if deploy else "/home/ubuntu/research/data/emeddeings"
)

# Two collections, opened if present and created otherwise: one named for
# document-level entries and one for paragraph-level entries.
collection_doc = chroma_client.get_or_create_collection(
    name="2024_main_document_lvl",
)
collection_para = chroma_client.get_or_create_collection(
    name="2024_main_paragraph_lvl",
)

def add_document_chroma_collection(collection_object, document_list, embedding_list, metadata) -> bool:
    """Add documents with precomputed embeddings to a collection.

    Every document is stored with the same ``metadata`` object and a fresh
    ID obtained from ``generate_uuid()``.

    Args:
        collection_object: Object exposing an
            ``add(embeddings=, documents=, metadatas=, ids=)`` method.
        document_list: Sized sequence of documents to store.
        embedding_list: Embeddings passed through unchanged to ``add``;
            presumably one per document -- this is not checked here.
        metadata: Single metadata value attached to every document.

    Returns:
        ``True`` once ``add`` has returned; ``False`` when ``document_list``
        is empty and nothing was written.

    Raises:
        Whatever ``collection_object.add`` raises; errors are not caught.
    """
    doc_count = len(document_list)
    if doc_count == 0:
        # Nothing to store: skip the call rather than send an empty batch.
        # NOTE(review): Chroma is expected to reject empty id lists --
        # confirm against the pinned chromadb version.
        return False

    # The same metadata object is referenced for every document, not copied.
    metadata_list = [metadata] * doc_count
    ids_gen = [generate_uuid() for _ in range(doc_count)]
    collection_object.add(
        embeddings=embedding_list,
        documents=document_list,
        metadatas=metadata_list,
        ids=ids_gen,
    )
    # Reaching this point means add() did not raise, so report success
    # explicitly instead of depending on the collection's truthiness.
    return True