import chromadb | |
from chromadb.config import Settings | |
from fastapi import APIRouter | |
router = APIRouter() | |
chroma_settings = Settings( | |
anonymized_telemetry=False, | |
persist_directory="db", | |
allow_reset=False, | |
is_persistent=True, | |
) | |
client = chromadb.Client(chroma_settings) | |
async def get_all_collections(): | |
# Currently only works for ChromaDB but can be extended easily | |
# for other vector stores as well | |
collections = client.list_collections() | |
responses = [c.dict() for c in collections] | |
return responses | |
# TODO(deshraj): Add pagination and make this endpoint agnostic to the vector store | |
async def get_collection_details(collection_name: str): | |
collection = client.get_collection(collection_name) | |
collection_data = collection.get() | |
metadatas, documents = collection_data['metadatas'], collection_data['documents'] | |
collated_data = [] | |
for i in zip(metadatas, documents): | |
collated_data.append({ | |
"metadata": i[0], | |
"document": i[1] | |
}) | |
response = {"details": collection.model_dump(), "data": collated_data} | |
return response | |