"""Index a PDF into a persistent Chroma vector store and launch a Gradio demo.

The script runs top to bottom:

1. Load the PDF into LangChain documents.
2. Split the documents into overlapping chunks.
3. Embed the chunks with a Hugging Face sentence-embedding model.
4. Store the chunks in a Chroma collection persisted under ``docs/chroma/``.
5. Expose the store as a retriever and launch a Gradio app for a hosted model.
"""

import gradio as gr
from langchain.document_loaders import PyPDFLoader
from langchain.text_splitter import RecursiveCharacterTextSplitter
from langchain.vectorstores import Chroma
from langchain_community.embeddings import HuggingFaceEmbeddings

# --- 1. Load the source PDF -------------------------------------------------
# NOTE(review): this is resolved as a path relative to the working directory;
# it looks like a fragment of a repository URL - confirm the file exists there.
loader = PyPDFLoader("Test/blob/main/Footcare.pdf")
pages = loader.load()

# --- 2. Split into overlapping chunks ---------------------------------------
splitter = RecursiveCharacterTextSplitter(chunk_size=512, chunk_overlap=30)
docs = splitter.split_documents(pages)

# --- 3. Embed the chunks ----------------------------------------------------
# The imported class is ``HuggingFaceEmbeddings`` (plural); the wrapper embeds
# plain strings via ``embed_documents``, so pass each chunk's text rather than
# the Document objects themselves.
embedding_model = HuggingFaceEmbeddings(model_name="all-MiniLM-L6-v2")
chunk_texts = [doc.page_content for doc in docs]
# NOTE: nothing below reads ``embeddings``; ``Chroma.from_documents`` is given
# the embedding model and the documents, not these precomputed vectors.
embeddings = embedding_model.embed_documents(chunk_texts)

# --- 4. Build the persistent vector store -----------------------------------
persist_directory = 'docs/chroma/'
vectordb = Chroma.from_documents(
    documents=docs,
    embedding=embedding_model,
    persist_directory=persist_directory,
)

# --- 5. Retriever and UI ----------------------------------------------------
retriever = vectordb.as_retriever()

# NOTE(review): ``retriever`` is not passed to the Gradio app below, so the
# launched interface does not use the indexed PDF - confirm this is intended.
gr.load("models/HuggingFaceH4/zephyr-7b-beta").launch()