Spaces:

deddoggo
/

chatbot_demo

Paused

App Files Files Community

deddoggo committed on Jun 29

Commit

8860136

1 Parent(s): a53f1d8

multi-turns chatbot

Browse files

Files changed (2) hide show

app.py +1 -1
rag_pipeline.py +25 -13

app.py CHANGED Viewed

@@ -38,7 +38,7 @@ with gr.Blocks(theme=gr.themes.Soft(), title="Chatbot Luật Giao thông Việt
     clear = gr.ClearButton([msg, chatbot])
     def respond(message, chat_history):
-        bot_message = chat_interface(message, chat_history)
         chat_history.append((message, bot_message))
         return "", chat_history

     clear = gr.ClearButton([msg, chatbot])
     def respond(message, chat_history):
+        bot_message = chat_interface(message, COMPONENTS, chat_history)
         chat_history.append((message, bot_message))
         return "", chat_history

rag_pipeline.py CHANGED Viewed

@@ -79,7 +79,29 @@ def initialize_components(data_path):
         "bm25_model": bm25_model
     }
-def generate_response(query, components):
     """
     Tạo câu trả lời cho một query bằng cách sử dụng các thành phần đã được khởi tạo.
     """
@@ -96,7 +118,7 @@ def generate_response(query, components):
         faiss_index=components["faiss_index"],
         chunks_data=components["chunks_data"],
         bm25_model=components["bm25_model"],
-        k=5,
         initial_k_multiplier=18
     )
@@ -113,17 +135,7 @@ def generate_response(query, components):
         context = "\n\n---\n\n".join(context_parts)
     # 3. Xây dựng Prompt và tạo câu trả lời
-    prompt = f"""Dưới đây là một số thông tin trích dẫn từ văn bản luật giao thông đường bộ Việt Nam.
-Hãy SỬ DỤNG CÁC THÔNG TIN NÀY để trả lời câu hỏi một cách chính xác và đầy đủ.
-Nếu câu hỏi đưa ra nhiều đáp án thì chọn 1 đáp án đúng nhất.
-### Thông tin luật:
-{context}
-### Câu hỏi:
-{query}
-### Trả lời:"""
     print("--- Bắt đầu tạo câu trả lời từ LLM ---")
     inputs = tokenizer(prompt, return_tensors="pt").to("cuda" if torch.cuda.is_available() else "cpu")

         "bm25_model": bm25_model
     }
+def build_multiturn_prompt(chat_history, current_query, retrieved_context):  # Build a single prompt string from prior turns, the retrieved law context, and the current question.
+    # Keep at most the N most recent turns (avoids an overly long token sequence)
+    max_turns = 5
+    history_text = ""
+    for i, (user_msg, bot_msg) in enumerate(chat_history[-max_turns:]):  # each history item is unpacked as a (user message, bot message) pair; NOTE(review): index `i` is unused
+        history_text += f"[Người dùng]: {user_msg}\n[Chatbot]: {bot_msg}\n"
+    full_prompt = f"""Bạn là một chatbot trợ lý luật giao thông Việt Nam. Dưới đây là các đoạn hội thoại trước đó, và trích dẫn luật phù hợp để trả lời câu hỏi tiếp theo.
+### Lịch sử hội thoại:
+{history_text}
+### Thông tin luật:
+{retrieved_context}
+### Câu hỏi hiện tại:
+{current_query}
+### Trả lời:"""
+    return full_prompt  # prompt sections in order: conversation history, law excerpts, current question, answer cue
+def generate_response(query, components, chat_history=None):
     """
     Tạo câu trả lời cho một query bằng cách sử dụng các thành phần đã được khởi tạo.
     """
         faiss_index=components["faiss_index"],
         chunks_data=components["chunks_data"],
         bm25_model=components["bm25_model"],
+        k=3,
         initial_k_multiplier=18
     )
         context = "\n\n---\n\n".join(context_parts)
     # 3. Xây dựng Prompt và tạo câu trả lời
+    prompt = build_multiturn_prompt(chat_history or [], query, context)
     print("--- Bắt đầu tạo câu trả lời từ LLM ---")
     inputs = tokenizer(prompt, return_tensors="pt").to("cuda" if torch.cuda.is_available() else "cpu")