File size: 2,243 Bytes
7d587fb
eb8aef0
 
f0a5e1c
eb8aef0
 
 
 
d304a46
7d587fb
 
 
eb8aef0
 
7d587fb
eb8aef0
 
ac6cd22
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7d587fb
f0a5e1c
 
 
 
 
 
7d587fb
f0a5e1c
7d587fb
 
 
 
15d6540
eb5eb52
f0a5e1c
 
 
eb5eb52
7d587fb
 
 
eb8aef0
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
import gradio as gr
from langchain.embeddings import SentenceTransformerEmbeddings
from langchain.vectorstores import Chroma
from huggingface_hub import InferenceClient

# Embedding model; must match the model used when the "embeddings" store was built.
embeddings = SentenceTransformerEmbeddings(model_name="msmarco-distilbert-base-v4")
# Persisted Chroma vector store loaded from the local "embeddings" directory.
db = Chroma(persist_directory="embeddings", embedding_function=embeddings)

# Bug fix: the org name was misspelled "gmistralai" — no such HF repo exists, so
# every generation call would fail. The correct repo id is
# "mistralai/Mixtral-8x7B-Instruct-v0.1".
client = InferenceClient(model="mistralai/Mixtral-8x7B-Instruct-v0.1")


def respond(
        message,
        history: list[tuple[str, str]],
):
    """Answer *message* with retrieval-augmented generation over the Chroma store.

    Args:
        message: The user's query string.
        history: Prior (user, assistant) turns; supplied by gr.ChatInterface
            but not used by this implementation.

    Yields:
        The model's generated answer as a single string.
    """
    # Retrieve the documents most similar to the query.
    matching_docs = db.similarity_search(message)

    if not matching_docs:
        # Bug fix: the original prompt referred to "the following query" but
        # never included it — interpolate the user's message.
        prompt = (
            "You are an expert in generating responses when there is no information available. "
            "Unfortunately, there are no relevant documents available to answer the following query:\n\n"
            f"Query: {message}\n\n"
            "Please provide a polite and original response to inform the user that the requested information is not "
            "available."
        )
    else:
        # Number and concatenate the retrieved documents. (The original also
        # accumulated a word count that was never used — removed as dead code.)
        context = "".join(
            f"Document {i + 1}:\n{doc.page_content}\n\n"
            for i, doc in enumerate(matching_docs)
        )

        # Bug fix: the original adjacent string parts concatenated to
        # "...grammatically correct.Please provide..." with no separating space.
        prompt = (
            "You are an expert in summarizing and answering questions based on given documents. "
            "You're an expert in English grammar at the same time. "
            "This means that your texts are flawless, correct and grammatically correct. "
            "Please provide a detailed and well-explained answer to the following query in 4-6 sentences:\n\n"
            f"Query: {message}\n\n"
            f"Based on the following documents:\n{context}\n\n"
            "Answer:"
        )

    # Remote call to the HF Inference API; parameters unchanged from original.
    response = client.text_generation(
        prompt,
        max_new_tokens=250,
        temperature=0.7,
        top_p=0.95,
    )

    yield response


# Canned example queries shown in the chat UI.
example_queries = [
    ["What types of roles are in the system?"],
    ["How to import records into stock receipts in Boost.space?"],
    ["Is it possible to create a PDF export from the product?"],
]

# Wire the RAG responder into a Gradio chat interface.
demo = gr.ChatInterface(
    respond,
    title="Boost.space Docs LLM",
    examples=example_queries,
)

if __name__ == "__main__":
    demo.launch()