File size: 811 Bytes
f437f2a
 
 
 
 
 
 
 
 
 
1d55d4a
f437f2a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
969e642
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
# Index a PDF into a persistent Chroma vector store and launch a Gradio demo.
#
# Steps: load the PDF -> split it into overlapping chunks -> embed the chunks
# and store them in Chroma -> expose a retriever -> launch the Gradio UI.
import gradio as gr
from langchain.document_loaders import PyPDFLoader
from langchain.text_splitter import RecursiveCharacterTextSplitter
from langchain.vectorstores import Chroma
from langchain_community.embeddings import HuggingFaceEmbeddings

# --- 1. Load the source document -------------------------------------------
# NOTE(review): this path looks like a fragment of a repository URL
# ("<repo>/blob/main/..."); confirm the PDF really lives at this relative
# location on disk, otherwise loading will fail.
loader = PyPDFLoader("Test/blob/main/Footcare.pdf")
pages = loader.load()

# --- 2. Split into chunks ---------------------------------------------------
# A small overlap keeps sentences that straddle a chunk boundary retrievable
# from either side.
splitter = RecursiveCharacterTextSplitter(chunk_size=512, chunk_overlap=30)
docs = splitter.split_documents(pages)

# --- 3. Embedding model -----------------------------------------------------
# The class is `HuggingFaceEmbeddings` (plural), matching the import; the
# previous singular spelling raised NameError.
embedding_model = HuggingFaceEmbeddings(model_name="all-MiniLM-L6-v2")
# No separate encode pass is done here: the earlier `model.encode(docs)` call
# used an undefined name, and Chroma.from_documents() below embeds the chunks
# itself through the `embedding` argument.

# --- 4. Build and persist the vector store ----------------------------------
persist_directory = 'docs/chroma/'
vectordb = Chroma.from_documents(
    documents=docs,
    embedding=embedding_model,  # was the undefined name `embedding`
    persist_directory=persist_directory,
)

# --- 5. Retriever and UI ----------------------------------------------------
retriever = vectordb.as_retriever()

# NOTE(review): `retriever` is not connected to the Gradio app below; the UI
# serves the hosted model as-is, without retrieval over the indexed PDF.
gr.load("models/HuggingFaceH4/zephyr-7b-beta").launch()