File size: 647 Bytes
fb85888
 
 
 
 
d9b98b5
 
fb85888
 
 
 
d9b98b5
 
 
fb85888
d9b98b5
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
# File: scripts/reindex.py
import yaml
from orchestrator.client import MCPClient
from orchestrator.provenance import init_db, Paper

if __name__ == '__main__':
    # Re-insert the title + abstract text of every Paper row into the
    # service configured under cfg['mcp_servers']['chroma'].

    # Read the config through a context manager so the file handle is
    # closed deterministically instead of being left to the garbage collector.
    with open('config.yaml') as config_file:
        cfg = yaml.safe_load(config_file)

    chroma = MCPClient(cfg['mcp_servers']['chroma'])
    # Falls back to a local SQLite file when the config has no 'db_url'.
    Session = init_db(cfg.get('db_url', 'sqlite:///embeddings.db'))
    session = Session()

    # NOTE(review): assumes Session() yields a SQLAlchemy-style session that
    # exposes close() -- confirm against orchestrator.provenance.init_db.
    try:
        papers = session.query(Paper).all()
        print(f'Reindexing {len(papers)} papers...')
        for paper in papers:
            # Either field may be None; treat a missing one as empty text.
            text = (paper.title or '') + ' ' + (paper.abstract or '')
            chroma.call('chroma.insert', {'id': paper.id, 'text': text, 'metadata': {}})
        print('Reindex complete!')
    finally:
        # Release the DB connection even if a query or insert call raised.
        session.close()