Spaces:

bukalapak
/

allofresh-assistant

Runtime error

App Files Files Community

ar-dy committed on May 10, 2023

Commit

cad351c

1 Parent(s): 26e0866

initial push from existing

Browse files

Files changed (8) hide show

.gitignore +3 -0
allofresh_chatbot.py +173 -0
app.py +41 -0
prompts/ans_prompt.py +58 -0
prompts/mod_prompt.py +17 -0
prompts/reco_prompt.py +44 -0
requirements.txt +3 -0
utils.py +44 -0

.gitignore ADDED Viewed

	@@ -0,0 +1,3 @@

+.env
+**__init__.py
+__pycache__

allofresh_chatbot.py ADDED Viewed

	@@ -0,0 +1,173 @@

+import os
+from dotenv import load_dotenv
+from langchain import PromptTemplate, LLMChain
+from langchain.agents import initialize_agent, Tool
+from langchain.chat_models import AzureChatOpenAI
+from langchain.agents import ZeroShotAgent, AgentExecutor
+from langchain.chains.conversation.memory import ConversationBufferMemory
+from langchain.callbacks import get_openai_callback
+from langchain.chains.llm import LLMChain
+from langchain.llms import AzureOpenAI
+from langchain.prompts import PromptTemplate
+from utils import lctool_search_allo_api, cut_dialogue_history
+from prompts.mod_prompt import MOD_PROMPT
+from prompts.ans_prompt import ANS_PREFIX, ANS_FORMAT_INSTRUCTIONS, ANS_SUFFIX
+from prompts.reco_prompt import RECO_PREFIX, RECO_FORMAT_INSTRUCTIONS, RECO_SUFFIX
+load_dotenv()
+class AllofreshChatbot():
+    """Allofresh shopping assistant assembled from three LangChain components.
+
+    A query is first classified by a moderation chain. Accepted queries are
+    answered by a conversational agent that has a product-search tool, and a
+    second agent then decides whether to add product recommendations.
+    """
+    def __init__(self, debug=False):
+        """Build the LLM clients, the moderation chain and both agents.
+
+        Args:
+            debug: passed as ``verbose`` to both agents; also enables a
+                diagnostic print when trimming the chat history fails.
+        """
+        self.ans_memory = None
+        self.debug = debug
+        # init llm
+        self.llms = self.init_llm()
+        # init moderation chain
+        self.mod_chain = self.init_mod_chain()
+        # init answering agent (the memory must exist before the agent is built, it is wired into it)
+        self.ans_memory = self.init_ans_memory()
+        self.ans_agent = self.init_ans_agent()
+        # init reco agent
+        self.reco_agent = self.init_reco_agent()
+    def init_llm(self):
+        """Return the Azure OpenAI clients keyed by model family.
+
+        All deployment names, endpoints and credentials are read from
+        environment variables; every client uses temperature 0.
+        """
+        return {
+            "gpt-4": AzureChatOpenAI(
+                temperature=0,
+                deployment_name = os.getenv("DEPLOYMENT_NAME_GPT4"),
+                model_name = os.getenv("MODEL_NAME_GPT4"),
+                openai_api_type = os.getenv("OPENAI_API_TYPE"),
+                openai_api_base = os.getenv("OPENAI_API_BASE"),
+                openai_api_version = os.getenv("OPENAI_API_VERSION"),
+                openai_api_key = os.getenv("OPENAI_API_KEY"),
+                openai_organization = os.getenv("OPENAI_ORGANIZATION")
+            ),
+            "gpt-3.5": AzureChatOpenAI(
+                temperature=0,
+                deployment_name = os.getenv("DEPLOYMENT_NAME_GPT3.5"),
+                model_name = os.getenv("MODEL_NAME_GPT3.5"),
+                openai_api_type = os.getenv("OPENAI_API_TYPE"),
+                openai_api_base = os.getenv("OPENAI_API_BASE"),
+                openai_api_version = os.getenv("OPENAI_API_VERSION"),
+                openai_api_key = os.getenv("OPENAI_API_KEY"),
+                openai_organization = os.getenv("OPENAI_ORGANIZATION")
+            ),
+            "gpt-3": AzureOpenAI(
+                temperature=0,
+                deployment_name = os.getenv("DEPLOYMENT_NAME_GPT3"),
+                model_name = os.getenv("MODEL_NAME_GPT3"),
+                openai_api_base = os.getenv("OPENAI_API_BASE"),
+                openai_api_key = os.getenv("OPENAI_API_KEY"),
+                openai_organization = os.getenv("OPENAI_ORGANIZATION")
+            ),
+        }
+    def init_mod_chain(self):
+        """Return the moderation chain: MOD_PROMPT (one variable, ``query``) run on the "gpt-4" client."""
+        mod_prompt = PromptTemplate(
+            template=MOD_PROMPT,
+            input_variables=["query"]
+        )
+        return LLMChain(llm=self.llms["gpt-4"], prompt=mod_prompt)
+    def init_ans_memory(self):
+        """Return the conversation memory used by the answering agent (exposed to the prompt as ``chat_history``)."""
+        return ConversationBufferMemory(memory_key="chat_history", output_key='output')
+    def init_ans_agent(self):
+        """Return the conversational answering agent with its single "Product Search" tool."""
+        ans_tools = [
+            Tool(
+                name="Product Search",
+                func=lctool_search_allo_api,
+                description="""
+                    To search for products in Allofresh's Database.
+                    Always use this to verify product names.
+                    Outputs product names and prices
+                """
+            )
+        ]
+        return initialize_agent(
+            ans_tools,
+            self.llms["gpt-4"],
+            agent="conversational-react-description",
+            verbose=self.debug,
+            memory=self.ans_memory,
+            return_intermediate_steps=True,
+            agent_kwargs={
+                'prefix': ANS_PREFIX,
+                # 'format_instructions': ANS_FORMAT_INSTRUCTIONS, # only needed for below gpt-4
+                'suffix': ANS_SUFFIX
+            }
+        )
+    def ans_pipeline(self, text, debug_cost=False, keep_last_n_words=500):
+        """Run the answering agent on ``text`` and return its reply.
+
+        Args:
+            text: the user's message; surrounding whitespace is stripped.
+            debug_cost: when true, print the token counts and cost reported
+                by the OpenAI callback.
+            keep_last_n_words: word budget handed to ``cut_dialogue_history``
+                when trimming the stored conversation.
+
+        Returns:
+            The agent's ``output`` string with backslashes replaced by ``/``.
+
+        Raises:
+            Whatever the agent call raises; only the history trim is best-effort.
+        """
+        try:
+            # NOTE(review): whether `memory.buffer` can be assigned depends on the installed
+            # LangChain version. If it is read-only this raises and the history is never trimmed -- confirm.
+            self.ans_agent.memory.buffer = cut_dialogue_history(
+                self.ans_agent.memory.buffer, keep_last_n_words=keep_last_n_words
+            )
+        except Exception as exc:
+            # Trimming is an optimisation only; a failure must not block the answer.
+            if self.debug:
+                print(f"Skipping chat-history trim: {exc!r}")
+        # The agent call sits outside any `finally` so its exceptions propagate normally.
+        with get_openai_callback() as openai_cb:
+            res = self.ans_agent({"input": text.strip()})
+            response = res['output'].replace("\\", "/")
+            if debug_cost:
+                print(f"Total Tokens: {openai_cb.total_tokens}")
+                print(f"Prompt Tokens: {openai_cb.prompt_tokens}")
+                print(f"Completion Tokens: {openai_cb.completion_tokens}")
+                print(f"Total Cost (USD): ${openai_cb.total_cost}")
+        return response
+    def init_reco_agent(self):
+        """Return the recommendation agent (zero-shot agent with a search tool and an explicit opt-out tool)."""
+        reco_tools = [
+            Tool(
+                name="Product Search",
+                func=lctool_search_allo_api,
+                description="""
+                    To search for products in Allofresh's Database.
+                    Always use this to verify product names.
+                    Outputs product names and prices
+                """
+            ),
+            Tool(
+                name="No Recommendation",
+                func=lambda x: "No recommendation",
+                description="""
+                    Use this if based on the context you don't need to recommend any products
+                """
+            )
+        ]
+        prompt = ZeroShotAgent.create_prompt(
+            reco_tools,
+            prefix=RECO_PREFIX,
+            format_instructions=RECO_FORMAT_INSTRUCTIONS,
+            suffix=RECO_SUFFIX,
+            input_variables=["input", "agent_scratchpad"]
+        )
+        llm_chain_reco = LLMChain(llm=self.llms["gpt-4"], prompt=prompt)
+        agent_reco = ZeroShotAgent(llm_chain=llm_chain_reco, allowed_tools=[tool.name for tool in reco_tools])
+        return AgentExecutor.from_agent_and_tools(agent=agent_reco, tools=reco_tools, verbose=self.debug)
+    @staticmethod
+    def _passed_moderation(verdict):
+        """Return True when the moderation reply reads as "True", ignoring case, whitespace, brackets, quotes and a trailing period."""
+        return str(verdict).strip().strip("[]\"'.").strip().lower() == "true"
+    def answer(self, query):
+        """Moderate ``query``, answer it, and optionally add recommendations.
+
+        Returns:
+            A ``(answer, recommendation)`` tuple of strings. The second item
+            is ``""`` when moderation rejects the query or when the
+            recommendation agent has nothing to add.
+        """
+        # moderate; the reply is free-form LLM text, so it is normalised before comparing
+        mod_verdict = self.mod_chain.run({"query": query})
+        if not self._passed_moderation(mod_verdict):
+            return (
+                "Maaf saya tidak bisa membantu Anda untuk itu..., tapi silakan tanya Allofresh-Assistant apa saja terkait kebutuhan berbelanja Anda!",
+                ""
+            )
+        # answer question
+        answer = self.ans_pipeline(query)
+        # recommend, using the whole stored conversation as context
+        reco = (self.reco_agent.run({"input": self.ans_agent.memory.buffer}) or "").strip()
+        if reco:
+            # keep the recommendation in memory so later turns can refer to it
+            self.ans_agent.memory.chat_memory.add_ai_message(reco)
+        # construct output
+        return (answer, reco)

app.py ADDED Viewed

	@@ -0,0 +1,41 @@

+import gradio as gr
+from loguru import logger
+from pydantic import BaseModel
+from allofresh_chatbot import AllofreshChatbot
+# One chatbot instance is created at import time and used by every call to predict().
+# NOTE(review): the instance owns a single conversation memory, so all callers share one chat history -- confirm this is intended.
+allo_chatbot = AllofreshChatbot(debug=False)
+class Message(BaseModel):
+    """One chat message: who sent it (``role``) and its text (``content``).
+
+    Not referenced elsewhere in this file; predict() stores plain dicts with the same two keys.
+    """
+    role: str
+    content: str
+async def predict(input, history):
+    """
+    Answer one user message and return the updated chat transcript.
+
+    Args:
+        input: text submitted by the user. Blank or whitespace-only text is
+            ignored, so no model call is made for it.
+        history: running list of ``{"role", "content"}`` dicts; it is extended
+            in place with the new user/assistant turns.
+
+    Returns:
+        ``(messages, history)`` where ``messages`` is the list of
+        ``(user_text, assistant_text)`` pairs built from consecutive history entries.
+    """
+    if input and input.strip():
+        history.append({"role": "user", "content": input})
+        answer, reco = allo_chatbot.answer(input)
+        history.append({"role": "assistant", "content": answer})
+        if reco:
+            # The recommendation is shown as a second assistant turn; an empty user
+            # entry keeps the history in strict user/assistant pairs.
+            history.append({"role": "user", "content": ""})
+            history.append({"role": "assistant", "content": reco})
+    # Even positions hold user turns, odd positions the matching assistant turns.
+    messages = [
+        (user_turn["content"], bot_turn["content"])
+        for user_turn, bot_turn in zip(history[::2], history[1::2])
+    ]
+    return messages, history
+"""
+Gradio Blocks low-level API that allows to create custom web applications (here our chat app)
+"""
+# Build the UI: a chat display, a state object holding the history list, and one text input.
+with gr.Blocks() as demo:
+    logger.info("Starting Demo...")
+    chatbot = gr.Chatbot(label="Allofresh Assistant")
+    # History list that is passed into predict() and replaced by its second return value.
+    state = gr.State([])
+    with gr.Row():
+        # NOTE(review): `.style(...)` depends on the installed Gradio version, and none is pinned in requirements.txt -- confirm it is still available.
+        txt = gr.Textbox(show_label=False, placeholder="Enter text, then press enter").style(container=False)
+    # Submitting the textbox calls predict(txt, state); its two results update the chat display and the state.
+    txt.submit(predict, [txt, state], [chatbot, state])
+# Runs at import time; there is no `if __name__ == "__main__"` guard.
+demo.launch()

prompts/ans_prompt.py ADDED Viewed

	@@ -0,0 +1,58 @@

+# Opening instructions for the answering agent; passed as `prefix` in allofresh_chatbot.py.
+ANS_PREFIX = """
+You are Allofresh-Assistant, an AI language model that has been trained to serve Allofresh,
+an online e-grocery platform selling supermarket products with a focus on fresh produces.
+Your primary function is to assist customers with their shopping needs,
+including but not limited to answering questions on products and services offered Allofresh.
+You can answer questions regarding what people can do with the products they buy at Allofresh.
+e.g. food and recipes as it will nudge people to buy products
+If a customer asks you a question that falls outside of your function or knowledge as an online supermarket assistant,
+you must politely decline to answer and redirect the conversation back to your area of expertise.
+You have access to the supermarket's knowledge base (products, vouchers, etc.).
+You should use this information to provide accurate and helpful responses to customer inquiries.
+You must remember the name and description of each tool.
+Customers might give you questions which you can answer without tools,
+but questions which requires specific knowledge regarding the supermarket must be validated to the knowledge base.
+If you can't answer a question with or without tools, politely apologize that you don't know.
+You must answer in formal yet friendly bahasa Indonesia.
+TOOLS:
+------
+"""
+# Tool-use format with `{tool_names}` and `{ai_prefix}` placeholders.
+# Imported by allofresh_chatbot.py, but its only use there is commented out.
+ANS_FORMAT_INSTRUCTIONS = """
+To use a tool, please use the following format:
+```
+Thought: Do I need to use a tool? Yes
+Action: the action to take, should be one of [{tool_names}]
+Action Input: the input to the action
+Observation: the result of the action
+```
+When you have a response to say to the Human, or if you do not need to use a tool, you MUST use the format:
+```
+Thought: Do I need to use a tool? No
+```
+Finally, whether you used the tool or not, output the answer
+{ai_prefix}: [your response here]
+"""
+# Closing part of the answering prompt; passed as `suffix` in allofresh_chatbot.py.
+# Placeholders: `{chat_history}`, `{input}`, `{agent_scratchpad}`.
+ANS_SUFFIX = """
+You are very strict on correctness and will never fake an information regarding the supermarket (product names, location, price, vouchers, etc.).
+Therefore you must validate every information related to Allofresh to Allofresh's knowledge base
+You must answer the user's question as informative as possible
+Take into account the previous conversation history:
+{chat_history}
+Begin! Remember you must give the final answer in bahasa indonesia
+New Input: {input}
+{agent_scratchpad}
+...
+"""

prompts/mod_prompt.py ADDED Viewed

	@@ -0,0 +1,17 @@

+# Prompt for the moderation chain. `{query}` is its only template variable, and the model
+# is asked to reply with True or False; the caller treats a True reply as "query accepted".
+MOD_PROMPT = """
+You are MODERATOR.
+MODERATOR MUST ONLY classify whether a certain passage belongs to a certain topic.
+INPUT: {query}
+INSTRUCTIONS:
+Classify WHETHER OR NOT input is RELATED to EITHER of the following:
+- greetings
+- supermarket shopping
+- general questions/inquiry on foods/recipe
+NOTES:
+- the query might be in bahasa indonesia, english, or a combination of both. you must take into account for both languages
+ONLY ANSWER with either [True, False]
+"""

prompts/reco_prompt.py ADDED Viewed

	@@ -0,0 +1,44 @@

+# Opening instructions for the recommendation agent; passed as `prefix` to ZeroShotAgent.create_prompt.
+RECO_PREFIX = """
+    You are Recobot, an LLM trained to recommend products.
+    You are serving Allofresh, an online e-grocery platform selling supermarket products with a focus on fresh produces.
+    You have the capability to assess the context and determine whether it's appropriate to recommend a product or not
+    You are to evaluate another LLM's output and determine what products to recommend to user based on the output.
+    You NEVER make up product names, and will always check the product database for available products
+    You must answer in formal yet friendly bahasa Indonesia.
+"""
+# Output format for the recommendation agent (`{tool_names}` placeholder).
+# NOTE(review): allofresh_chatbot.py passes this to ZeroShotAgent.create_prompt unconditionally,
+# and that agent runs on the "gpt-4" client, so it is not limited to gpt-3.5-turbo and below.
+RECO_FORMAT_INSTRUCTIONS = """
+You must use the following format:
+Context: the input context you must assess
+Thought: Do I need to recommend products? If based on context, recommendation related to the last HumanMessage has been given by AI, then no need to recommend. Yes or No?
+Action: What should I do? must be one of [{tool_names}]
+Action Input: If you want to recommend products, pass the list of products you want to search, else input empty string
+Observation: the result of the action
+... (this Thought/Action/Action Input/Observation can repeat N times)
+Thought: I now know the final answer
+Final Answer: if no need to recommend product, only output empty string, else recommend all relevant products based on observation result
+"""
+# Two worked examples (recommend / do not recommend) in the recommendation agent's output format.
+# Not imported by allofresh_chatbot.py. The tool names used here must match the registered tools
+# ("Product Search", "No Recommendation"), and every Action is followed by an Action Input line
+# as the format instructions require.
+RECO_GPT3_ADD_FORMAT_INSTRUCTIONS = """
+Example of recommending products
+Context: Human: Human: gw pengen makanan sehat pake ayam, rendah kalori, rendah karbo, gimana caranya? bagi resep dan cara masak dong'?\nAI: Untuk makanan sehat rendah kalori dan rendah karbohidrat, Anda bisa mencoba resep Ayam Panggang dengan Sayuran. Bahan-bahan yang dibutuhkan adalah ayam fillet, paprika, brokoli, bawang bombay, bawang putih, garam, merica, dan minyak zaitun. Pertama, potong ayam fillet menjadi beberapa bagian dan lumuri dengan garam dan merica. Kemudian panggang ayam di dalam oven selama 20-25 menit. Sementara itu, tumis bawang bombay dan bawang putih dengan sedikit minyak zaitun hingga harum. Tambahkan paprika dan brokoli yang sudah dipotong-potong, lalu tumis hingga sayuran matang. Sajikan ayam panggang dengan sayuran sebagai pelengkap. Selamat mencoba!
+Thought: Yes
+Action: Product Search
+Action Input: ayam fillet, paprika, brokoli
+Observation: [reco_result_from_tools]
+Thought: I now know the final answer
+Final Answer: [your_final_answer]
+Example of NOT recommending products:
+Context: Human: hi, ada ayam gak?\nAI: Ya, kami memiliki Ayam Broiler Daging Giling seharga Rp 19.300, Ayam Broiler Paha Tanpa Tulang seharga Rp 16.825, dan Ayam Broiler Paha Atas seharga Rp 17.875. Apakah ada yang ingin Anda beli?
+Thought: No
+Action: No Recommendation
+Action Input:
+Observation: [observation_result]
+Thought: I now know the final answer
+Final Answer: [your_final_answer]
+"""
+# Closing part of the recommendation prompt; `{input}` receives the conversation text and
+# `{agent_scratchpad}` is the second declared input variable (see init_reco_agent).
+RECO_SUFFIX = """
+    Begin!
+    Context: {input}
+    {agent_scratchpad}
+"""

requirements.txt ADDED Viewed

	@@ -0,0 +1,3 @@

+langchain==0.0.163
+loguru==0.6.0
+openai==0.27.4

utils.py ADDED Viewed

	@@ -0,0 +1,44 @@

+import requests
+import json
+from dotenv import load_dotenv
+import os
+load_dotenv()
+ALLOFRESH_SEARCH_API_BASE = os.getenv("ALLOFRESH_SEARCH_API_BASE")
+def search_allo_api(query, limit=3, timeout=10):
+    """Call the Allofresh search endpoint and return the decoded JSON response.
+
+    Args:
+        query: search keyword; sent as the ``keyword`` query parameter and
+            URL-encoded by ``requests`` (spaces, ``&``, ``#`` etc. are safe).
+        limit: maximum number of products requested.
+        timeout: seconds to wait for the server before giving up, so a stalled
+            endpoint cannot hang the caller indefinitely.
+
+    Returns:
+        The parsed JSON body.
+
+    Raises:
+        requests.RequestException: on connection errors, timeouts or a non-2xx status.
+        ValueError: if the body is not valid JSON.
+    """
+    response = requests.get(
+        ALLOFRESH_SEARCH_API_BASE,
+        params={"keyword": query, "limit": limit, "p": 1},
+        timeout=timeout,
+    )
+    # Fail loudly on HTTP errors instead of trying to parse an error page.
+    response.raise_for_status()
+    return response.json()
+def lctool_search_allo_api(queries):
+    """Tool entry point: search for several comma-separated product names.
+
+    Args:
+        queries: product names separated by commas, e.g. ``"ayam, brokoli"``.
+            Whitespace around each name is ignored and empty names are skipped.
+
+    Returns:
+        ``str()`` of a list with one ``{name_searched: [{"name": ..., "price": ...}, ...]}``
+        dict per term, or a ``"Product search failed: ..."`` message. A string is
+        always returned (never an exception) because the result is fed back to the agent.
+    """
+    wanted_fields = ("name", "price")
+    terms = [term.strip() for term in (queries or "").split(",")]
+    terms = [term for term in terms if term]
+    if not terms:
+        # Nothing to look up; avoid hitting the API with an empty keyword.
+        return str([])
+    try:
+        all_results = [
+            {
+                term: [
+                    {k: v for k, v in prod_dict.items() if k in wanted_fields}
+                    for prod_dict in search_allo_api(term)["products"]
+                ]
+            }
+            for term in terms
+        ]
+        return str(all_results)
+    except Exception as e:
+        # Deliberately broad: this is the tool boundary. Name the exception type so that
+        # e.g. a KeyError does not surface as the bare text 'products'.
+        return f"Product search failed: {type(e).__name__}: {e}"
+def cut_dialogue_history(history_memory, keep_last_n_words=500):
+    """Drop the oldest lines of a transcript until fewer than ``keep_last_n_words`` words remain.
+
+    Args:
+        history_memory: transcript text with one utterance per line, or ``None``.
+        keep_last_n_words: word budget; a transcript already under it is returned unchanged.
+
+    Returns:
+        ``history_memory`` unchanged when it is empty, ``None`` or under the budget.
+        Otherwise a newline followed by the retained trailing lines (just ``"\\n"``
+        if every line had to be dropped).
+    """
+    if not history_memory:
+        return history_memory
+    remaining_words = len(history_memory.split())
+    if remaining_words < keep_last_n_words:
+        return history_memory
+    paragraphs = history_memory.split('\n')
+    first_kept = 0
+    # Words are counted with split() both in total and per line so the two tallies agree
+    # (tabs and repeated spaces included); the bounds check stops once every line is dropped.
+    while first_kept < len(paragraphs) and remaining_words >= keep_last_n_words:
+        remaining_words -= len(paragraphs[first_kept].split())
+        first_kept += 1
+    return '\n' + '\n'.join(paragraphs[first_kept:])