import os
import gradio as gr
from langchain.document_loaders import PyPDFLoader
from langchain.text_splitter import RecursiveCharacterTextSplitter
from langchain.embeddings import OpenAIEmbeddings
from langchain.vectorstores import FAISS
from langchain.chains import ConversationalRetrievalChain
from langchain.chat_models import ChatOpenAI
from langchain.memory import ConversationBufferMemory
from langchain.prompts import PromptTemplate


openai_api_key = os.environ.get("OPENAI_API_KEY")

class AdvancedPdfChatbot:
    def __init__(self, openai_api_key):
        os.environ["OPENAI_API_KEY"] = openai_api_key
        self.embeddings = OpenAIEmbeddings()
        self.text_splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=200)
        self.llm = ChatOpenAI(temperature=0.7, model_name="gpt-4o", max_tokens=2048, top_p=0.7)
        self.memory = ConversationBufferMemory(memory_key="chat_history", return_messages=True)
        self.qa_chain = None
        self.pdf_path = None
        self.template = """
You are a file-based knowledge assistant that interacts with users like ChatGPT. Your primary source of knowledge comes from user-uploaded files, such as PDFs. You do not rely on general knowledge or the internet. Instead, you extract, analyze, and synthesize information directly from the content of the provided file(s).  
**1. Personality and Tone**  
- Be polite, clear, and professional.  
- Use formal, academic language when the context requires it.  
- Provide concise, well-structured responses, and maintain a helpful and supportive tone.  
**2. Core Capabilities**  
- Extract and summarize key information from the provided file.  
- Answer user questions based on the content of the file.  
- Provide in-depth analysis, explanations, and references to the file's content.  
- Suggest relevant sections, chapters, or pages where specific information can be found.  
- Offer guidance on how users can interpret and understand the file's contents.  
**3. Knowledge and Scope**  
- Your knowledge is limited to the content found in the uploaded file(s).  
- You should not answer questions unrelated to the file's content unless explicitly requested.  
- If a user asks a question that is not found in the file, inform them that the information is not available.  
**4. Interaction Rules**  
- Respond with specific references to the document's content, including page numbers, sections, or headings, if available.  
- If the user asks for clarification, politely request more details.  
- Provide accurate, detailed, and clearly structured explanations for user queries.  
- Never "make up" information. If something is not in the file, clearly state that it cannot be found.  
**5. Context Awareness**  
- Remember the content of the file for the duration of the session.  
- Use file-specific knowledge to provide logical and evidence-backed responses.  
- If multiple files are uploaded, clarify which file is being referenced and specify which file the information is from.  
**6. Technical Details**  
- Summarize content into concise answers and organize information using bullet points, lists, or structured paragraphs.  
- If asked to provide a summary, focus on key points, main arguments, and essential takeaways.  
- When a user asks for a section or heading, search for relevant text within the file.  
- Do not offer answers beyond the scope of the file, and avoid guessing.  
**7. Example Usage**  
User: "Can you summarize the main argument from the introduction of the file?"  
Response: "Sure! The introduction discusses [key points] and highlights the central argument that [main idea]. This can be found on page 2 under the heading 'Introduction'."  
User: "Where can I find the definition of 'symbolic interactionism' in the document?"  
Bot Response: "The definition of 'symbolic interactionism' appears on page 12 under the subheading 'Key Theoretical Concepts'."  
User: "Explain the concept of 'cognitive dissonance' as it is presented in the document."  
Bot Response: "In the document, 'cognitive dissonance' is defined as [definition from the file]. It appears in the context of [brief explanation] and can be found on page 15 under the section 'Theoretical Foundations'."  



**8. Casual Interaction**  
- Respond naturally when users greet you or say thank you; remain an interactive, conversational chatbot.  
**End of Prompt**
        Context: {context}
        Question: {question}
        Answer:
        """

        self.prompt = PromptTemplate(template=self.template, input_variables=["context", "question"])

    def load_and_process_pdf(self, pdf_path):
        try:
            loader = PyPDFLoader(pdf_path)
            documents = loader.load()
            texts = self.text_splitter.split_documents(documents)
            self.db = FAISS.from_documents(texts, self.embeddings)
            self.setup_conversation_chain()
            self.pdf_path = pdf_path
        except Exception as e:
            return f"An error occurred while processing the PDF: {e}"

    def setup_conversation_chain(self):
        self.qa_chain = ConversationalRetrievalChain.from_llm(
            self.llm,
            retriever=self.db.as_retriever(),
            memory=self.memory,
            combine_docs_chain_kwargs={"prompt": self.prompt}
        )

    def chat(self, query):
        if not self.qa_chain:
            return "Please upload a PDF first."
        result = self.qa_chain({"question": query})
        return result  # Return the entire result dictionary

    def get_pdf_path(self):
        if self.pdf_path:
            return self.pdf_path
        else:
            return "No PDF uploaded yet."
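# The splitter above is configured with chunk_size=1000 and chunk_overlap=200. As a
# rough illustration of what that windowing means (a simplified sketch, not
# LangChain's actual recursive separator logic, which prefers paragraph and
# sentence boundaries before falling back to raw slicing):

```python
def sliding_chunks(text, chunk_size=1000, chunk_overlap=200):
    """Split text into windows of chunk_size characters, each overlapping
    the previous window by chunk_overlap characters. Illustrative sketch
    only; RecursiveCharacterTextSplitter also respects separators."""
    step = chunk_size - chunk_overlap
    chunks = []
    for start in range(0, max(len(text) - chunk_overlap, 1), step):
        chunks.append(text[start:start + chunk_size])
    return chunks
```

# With these defaults, consecutive chunks share their last/first 200 characters,
# which helps the retriever avoid cutting an answer-bearing passage in half.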

# Initialize the chatbot
pdf_chatbot = AdvancedPdfChatbot(openai_api_key)



def upload_pdf(pdf_file):
    if pdf_file is None:
        return "Please upload a PDF file."
    file_path = pdf_file.name  # This is the full path, e.g., /tmp/tmp1234.pdf
    pdf_chatbot.memory.clear()  # Clear chat history for the new document
    error = pdf_chatbot.load_and_process_pdf(file_path)
    if error:
        return error
    return file_path




def respond(message, history):
    if not pdf_chatbot.qa_chain:
        history.append((message, "Please upload a PDF first."))
        return "", history, "", "", "", "", "", ""

    # Generate response using QA chain
    response = pdf_chatbot.chat(message)
    response_answer = response["answer"]
    if "Helpful Answer:" in response_answer:
        response_answer = response_answer.split("Helpful Answer:")[-1]
    response_sources = response["source_documents"]

    # Extract source documents and page numbers
    response_source1 = response_sources[0].page_content.strip() if len(response_sources) > 0 else ""
    response_source2 = response_sources[1].page_content.strip() if len(response_sources) > 1 else ""
    response_source3 = response_sources[2].page_content.strip() if len(response_sources) > 2 else ""
    response_source1_page = response_sources[0].metadata["page"] + 1 if len(response_sources) > 0 else ""
    response_source2_page = response_sources[1].metadata["page"] + 1 if len(response_sources) > 1 else ""
    response_source3_page = response_sources[2].metadata["page"] + 1 if len(response_sources) > 2 else ""

    # Append user message and response to chat history
    history.append((message, response_answer))

    return "", history, response_source1, response_source1_page, response_source2, response_source2_page, response_source3, response_source3_page

def clear_chatbot():
    pdf_chatbot.memory.clear()
    return []

def get_pdf_path():
    # Call the method to return the current PDF path
    return pdf_chatbot.get_pdf_path()
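# The three per-source blocks in respond() repeat one pattern: take page_content
# and a 1-based page number if the i-th source exists, else empty strings. A
# hypothetical helper (top_sources is not part of the original code) covering
# the same pattern for any k could look like:

```python
def top_sources(source_documents, k=3):
    """Flatten the first k source documents into (text, page, text, page, ...),
    padding with empty strings when fewer than k sources are returned.
    Pages are converted from 0-based PyPDF indices to 1-based display numbers."""
    fields = []
    for i in range(k):
        if i < len(source_documents):
            doc = source_documents[i]
            fields.append(doc.page_content.strip())
            fields.append(doc.metadata.get("page", 0) + 1)
        else:
            fields.extend(["", ""])
    return tuple(fields)
```

# respond() could then unpack top_sources(response["source_documents"]) directly
# into the six reference outputs instead of six near-identical ternaries.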

# Create the Gradio interface
with gr.Blocks() as demo:
    gr.Markdown("# PDF Chatbot")
    
    with gr.Row():
        pdf_upload = gr.File(label="Upload PDF", file_types=[".pdf"])
        upload_button = gr.Button("Process PDF")

    upload_status = gr.Textbox(label="Upload Status")
    upload_button.click(upload_pdf, inputs=[pdf_upload], outputs=[upload_status])

    path_button = gr.Button("Get PDF Path")
    pdf_path_display = gr.Textbox(label="Current PDF Path")
    
    chatbot_interface = gr.Chatbot()
    msg = gr.Textbox()
    clear = gr.Button("Clear")

    with gr.Accordion("Advanced - Document references", open=False):
        with gr.Row():
            doc_source1 = gr.Textbox(label="Reference 1", lines=2, container=True, scale=20)
            source1_page = gr.Number(label="Page", scale=1)
        with gr.Row():
            doc_source2 = gr.Textbox(label="Reference 2", lines=2, container=True, scale=20)
            source2_page = gr.Number(label="Page", scale=1)
        with gr.Row():
            doc_source3 = gr.Textbox(label="Reference 3", lines=2, container=True, scale=20)
            source3_page = gr.Number(label="Page", scale=1)

    msg.submit(respond, inputs=[msg, chatbot_interface], outputs=[msg, chatbot_interface, doc_source1, source1_page, doc_source2, source2_page, doc_source3, source3_page])
    clear.click(clear_chatbot, outputs=[chatbot_interface])
    path_button.click(get_pdf_path, outputs=[pdf_path_display])

if __name__ == "__main__":
    demo.launch()