File size: 526 Bytes
49e32ea
 
275393f
49e32ea
 
275393f
49e32ea
ae4a7ec
49e32ea
 
0c818aa
49e32ea
41ed1b7
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
import ingest as ing

# Script: parse the Lambeth 2030 borough plan PDF, convert the parsed text to
# docs, then embed those docs and save the result under "faiss_embedding".
# All heavy lifting is delegated to the project-local `ingest` module (`ing`).

# Open the PDF in a context manager so the handle is always closed, even if
# parsing raises. The handle is passed inside a list, exactly as before.
# NOTE(review): the file is still opened in the default text mode, as in the
# original call; presumably ing.parse_file only needs the handle (or its
# .name) rather than reading from it directly - confirm against ingest.py.
with open("Lambeth_2030-Our_Future_Our_Lambeth.pdf") as borough_plan_file:
    borough_plan_text, file_names = ing.parse_file([borough_plan_file])
print("Borough plan text created")

# Dump the parsed output so it can be inspected by eye.
print(borough_plan_text)

borough_plan_docs = ing.text_to_docs(borough_plan_text)
print("Borough plan docs created")

# Embedding model identifier, used both for loading and for the save step.
embedding_model = "BAAI/bge-base-en-v1.5"  # alternative: "mixedbread-ai/mxbai-embed-xsmall-v1"

# NOTE(review): `embeddings` is not referenced again in this script; the call
# is kept in case ing.load_embeddings has side effects the save step relies
# on - confirm before removing.
embeddings = ing.load_embeddings(model_name=embedding_model)
ing.embed_faiss_save_to_zip(borough_plan_docs, save_to="faiss_embedding", model_name=embedding_model)