Chris4K committed on
Commit
ca6ed76
·
verified ·
1 Parent(s): 4c2be05

Update services/chat_service.py

Browse files
Files changed (1) hide show
  1. services/chat_service.py +97 -114
services/chat_service.py CHANGED
@@ -1,8 +1,10 @@
1
- # services/chat_service.py
 
2
  from typing import List, Dict, Any, Optional, Tuple
3
  from datetime import datetime
4
  import logging
5
  from config.config import settings
 
6
 
7
  logger = logging.getLogger(__name__)
8
 
@@ -29,7 +31,6 @@ class ConversationManager:
29
  'context': context
30
  })
31
 
32
- # Trim history if needed
33
  if len(self.conversations[session_id]) > self.max_history:
34
  self.conversations[session_id] = self.conversations[session_id][-self.max_history:]
35
 
@@ -41,8 +42,6 @@ class ConversationManager:
41
  del self.conversations[session_id]
42
 
43
  class ChatService:
44
- """Main chat service that coordinates responses"""
45
- """Main chat service that coordinates responses"""
46
  def __init__(
47
  self,
48
  model_service,
@@ -57,6 +56,33 @@ class ChatService:
57
  self.faq_service = faq_service
58
  self.conversation_manager = ConversationManager()
59
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
60
  def construct_system_prompt(self, context: str) -> str:
61
  """Constructs the system message."""
62
  return (
@@ -73,72 +99,68 @@ class ChatService:
73
  chat_history: List[Tuple[str, str]],
74
  max_history_turns: int = 1
75
  ) -> str:
76
- """Constructs the full prompt."""
77
- # System message
78
- system_message = self.construct_system_prompt(context)
79
-
80
- # Start with system message
81
- prompt = f"<|begin_of_text|><|start_header_id|>system<|end_header_id|>\n\n{system_message}<|eot_id|>"
82
-
83
- # Add chat history (limit to last `max_history_turns` interactions)
84
- for user_msg, assistant_msg in chat_history[-max_history_turns:]:
85
- prompt += f"<|start_header_id|>user<|end_header_id|>\n\n{user_msg}<|eot_id|>"
86
- prompt += f"<|start_header_id|>assistant<|end_header_id|>\n\n{assistant_msg}<|eot_id|>"
87
-
88
- # Add the current user input
89
- prompt += f"<|start_header_id|>user<|end_header_id|>\n\n{user_input}<|eot_id|>"
90
- prompt += "<|start_header_id|>assistant<|end_header_id|>\n\n"
91
-
92
- return prompt
93
 
94
  def build_context(
95
- self,
96
- search_results: Dict[str, List[Dict[str, Any]]],
97
- chat_history: List[Dict[str, Any]]
98
- ) -> str:
99
- """Build context for the model from search results and chat history"""
100
- context_parts = []
101
-
102
- # Add relevant products
103
- if search_results.get('products'):
104
- products = search_results['products'][:2] # Limit to top 2 products
105
- for product in products:
106
- context_parts.append(
107
- f"Produkt: {product['Name']}\n"
108
- f"Beschreibung: {product['Description']}\n"
109
- f"Preis: {product['Price']}€\n"
110
- f"Kategorie: {product['ProductCategory']}"
111
- )
112
-
113
- # Add relevant PDF content
114
- if search_results.get('documents'):
115
- docs = search_results['documents'][:2]
116
- for doc in docs:
117
- context_parts.append(
118
- f"Aus Dokument '{doc['source']}' (Seite {doc['page']}):\n"
119
- f"{doc['text']}"
120
- )
121
-
122
- # Add relevant FAQs
123
- if search_results.get('faqs'):
124
- faqs = search_results['faqs'][:2]
125
- for faq in faqs:
126
- context_parts.append(
127
- f"FAQ:\n"
128
- f"Frage: {faq['question']}\n"
129
- f"Antwort: {faq['answer']}"
130
- )
131
-
132
- # Add recent chat history
133
- if chat_history:
134
- recent_history = chat_history[-3:] # Last 3 interactions
135
- history_text = "\n".join(
136
- f"User: {h['user_input']}\nAssistant: {h['response']}"
137
- for h in recent_history
138
  )
139
- context_parts.append(f"Letzte Interaktionen:\n{history_text}")
140
- print("\n\n".join(context_parts))
141
- return "\n\n".join(context_parts)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
142
 
143
  async def chat(
144
  self,
@@ -148,29 +170,21 @@ class ChatService:
148
  ) -> Tuple[str, List[Tuple[str, str]], Dict[str, List[Dict[str, Any]]]]:
149
  """Main chat method that coordinates the entire conversation flow."""
150
  try:
151
- # Ensure session_id is a string
152
  if not isinstance(session_id, str):
153
  session_id = str(session_id)
154
 
155
- # Get chat history
156
  chat_history_raw = self.conversation_manager.get_history(session_id)
157
  chat_history = [
158
  (entry['user_input'], entry['response']) for entry in chat_history_raw
159
  ]
160
 
161
- # Search all sources
162
- search_results = await self.search_all_sources(user_input)
163
  print(search_results)
164
- # Build context
165
  context = self.build_context(search_results, chat_history_raw)
166
-
167
- # Construct the prompt
168
  prompt = self.construct_prompt(user_input, context, chat_history)
 
169
 
170
- # Generate response
171
- response = await self.generate_response(prompt, max_length)
172
-
173
- # Store interaction
174
  self.conversation_manager.add_interaction(
175
  session_id,
176
  user_input,
@@ -178,9 +192,9 @@ class ChatService:
178
  {'search_results': search_results}
179
  )
180
 
181
- # Prepare the chat history for Gradio
182
  formatted_history = [
183
- (entry['user_input'], entry['response']) for entry in self.conversation_manager.get_history(session_id)
 
184
  ]
185
 
186
  return response, formatted_history, search_results
@@ -189,36 +203,7 @@ class ChatService:
189
  logger.error(f"Error in chat: {e}")
190
  raise
191
 
192
-
193
- async def search_all_sources(
194
- self,
195
- query: str,
196
- top_k: int = 3
197
- ) -> Dict[str, List[Dict[str, Any]]]:
198
- """Search across all available data sources"""
199
- try:
200
- print("-----------------------------")
201
- print("starting searches .... ")
202
-
203
- products = self.data_service.search(query, top_k)
204
- pdfs = self.pdf_service.search(query, top_k)
205
- faqs = self.faq_service.search_faqs(query, top_k)
206
-
207
-
208
- results = {
209
- 'products': products or [],
210
- 'documents': pdfs or [],
211
- 'faqs': faqs or []
212
- }
213
-
214
- print("Search results:", results)
215
- return results
216
-
217
- except Exception as e:
218
- logger.error(f"Error searching sources: {e}")
219
- return {'products': [], 'documents': [], 'faqs': []}
220
-
221
- async def generate_response(
222
  self,
223
  prompt: str,
224
  max_length: int = 1000
@@ -241,8 +226,7 @@ class ChatService:
241
  top_p=0.9,
242
  do_sample=True,
243
  no_repeat_ngram_size=3,
244
- early_stopping=False, # True num_beams=3, # Increase number of beams if beam search is needed
245
- #pad_token_id=self.tokenizer.eos_token_id, #eos_token_id
246
  )
247
 
248
  response = self.tokenizer.decode(
@@ -254,5 +238,4 @@ class ChatService:
254
 
255
  except Exception as e:
256
  logger.error(f"Error generating response: {e}")
257
- raise
258
-
 
1
+
2
+ #chat_service.py
3
  from typing import List, Dict, Any, Optional, Tuple
4
  from datetime import datetime
5
  import logging
6
  from config.config import settings
7
+ import asyncio
8
 
9
  logger = logging.getLogger(__name__)
10
 
 
31
  'context': context
32
  })
33
 
 
34
  if len(self.conversations[session_id]) > self.max_history:
35
  self.conversations[session_id] = self.conversations[session_id][-self.max_history:]
36
 
 
42
  del self.conversations[session_id]
43
 
44
  class ChatService:
 
 
45
  def __init__(
46
  self,
47
  model_service,
 
56
  self.faq_service = faq_service
57
  self.conversation_manager = ConversationManager()
58
 
59
def search_all_sources(
    self,
    query: str,
    top_k: int = 3
) -> Dict[str, List[Dict[str, Any]]]:
    """Search products, PDF documents and FAQs for entries matching *query*.

    Args:
        query: Free-text search string.
        top_k: Maximum number of hits requested from each source.

    Returns:
        Dict with keys 'products', 'documents' and 'faqs'; each value is a
        (possibly empty) list of result dicts. On any search failure the
        error is logged and all three lists come back empty, so callers
        never have to handle an exception from this method.
    """
    try:
        products = self.data_service.search(query, top_k)
        pdfs = self.pdf_service.search(query, top_k)
        faqs = self.faq_service.search_faqs(query, top_k)

        # Normalise None (source returned "no hits") to an empty list so
        # downstream code can iterate each bucket unconditionally.
        return {
            'products': products or [],
            'documents': pdfs or [],
            'faqs': faqs or []
        }

    except Exception as e:
        # Best-effort: a failing source must not break the chat flow.
        logger.error(f"Error searching sources: {e}")
        return {'products': [], 'documents': [], 'faqs': []}
85
+
86
  def construct_system_prompt(self, context: str) -> str:
87
  """Constructs the system message."""
88
  return (
 
99
  chat_history: List[Tuple[str, str]],
100
  max_history_turns: int = 1
101
  ) -> str:
102
+ """Constructs the full prompt."""
103
+ system_message = self.construct_system_prompt(context)
104
+ prompt = f"<|begin_of_text|><|start_header_id|>system<|end_header_id|>\n\n{system_message}<|eot_id|>"
105
+
106
+ for user_msg, assistant_msg in chat_history[-max_history_turns:]:
107
+ prompt += f"<|start_header_id|>user<|end_header_id|>\n\n{user_msg}<|eot_id|>"
108
+ prompt += f"<|start_header_id|>assistant<|end_header_id|>\n\n{assistant_msg}<|eot_id|>"
109
+
110
+ prompt += f"<|start_header_id|>user<|end_header_id|>\n\n{user_input}<|eot_id|>"
111
+ prompt += "<|start_header_id|>assistant<|end_header_id|>\n\n"
112
+
113
+ return prompt
 
 
 
 
 
114
 
115
def build_context(
    self,
    search_results: Dict[str, List[Dict[str, Any]]],
    chat_history: List[Dict[str, Any]]
) -> str:
    """Assemble the German-language context string fed to the model.

    Args:
        search_results: Mapping with optional 'products', 'documents' and
            'faqs' lists, as produced by search_all_sources(). Product
            dicts need 'Name'/'Description'/'Price'/'ProductCategory',
            document dicts 'source'/'page'/'text', FAQ dicts
            'question'/'answer' — TODO confirm against the data services.
        chat_history: Raw history entries; each needs 'user_input' and
            'response' keys.

    Returns:
        Sections separated by blank lines: up to 2 products, up to 2
        document snippets, up to 2 FAQs, then the last 3 chat turns.
        Empty string when there is nothing to include.
    """
    context_parts = []

    # Limit every bucket to the top 2 hits to keep the prompt short.
    for product in (search_results.get('products') or [])[:2]:
        context_parts.append(
            f"Produkt: {product['Name']}\n"
            f"Beschreibung: {product['Description']}\n"
            f"Preis: {product['Price']}€\n"
            f"Kategorie: {product['ProductCategory']}"
        )

    for doc in (search_results.get('documents') or [])[:2]:
        context_parts.append(
            f"Aus Dokument '{doc['source']}' (Seite {doc['page']}):\n"
            f"{doc['text']}"
        )

    for faq in (search_results.get('faqs') or [])[:2]:
        context_parts.append(
            f"FAQ:\n"
            f"Frage: {faq['question']}\n"
            f"Antwort: {faq['answer']}"
        )

    # Recent conversation turns give the model short-term memory.
    if chat_history:
        recent_history = chat_history[-3:]  # last 3 interactions
        history_text = "\n".join(
            f"User: {h['user_input']}\nAssistant: {h['response']}"
            for h in recent_history
        )
        context_parts.append(f"Letzte Interaktionen:\n{history_text}")

    return "\n\n".join(context_parts)
164
 
165
  async def chat(
166
  self,
 
170
  ) -> Tuple[str, List[Tuple[str, str]], Dict[str, List[Dict[str, Any]]]]:
171
  """Main chat method that coordinates the entire conversation flow."""
172
  try:
 
173
  if not isinstance(session_id, str):
174
  session_id = str(session_id)
175
 
 
176
  chat_history_raw = self.conversation_manager.get_history(session_id)
177
  chat_history = [
178
  (entry['user_input'], entry['response']) for entry in chat_history_raw
179
  ]
180
 
181
+ search_results = self.search_all_sources(user_input)
 
182
  print(search_results)
183
+
184
  context = self.build_context(search_results, chat_history_raw)
 
 
185
  prompt = self.construct_prompt(user_input, context, chat_history)
186
+ response = self.generate_response(prompt, max_length)
187
 
 
 
 
 
188
  self.conversation_manager.add_interaction(
189
  session_id,
190
  user_input,
 
192
  {'search_results': search_results}
193
  )
194
 
 
195
  formatted_history = [
196
+ (entry['user_input'], entry['response'])
197
+ for entry in self.conversation_manager.get_history(session_id)
198
  ]
199
 
200
  return response, formatted_history, search_results
 
203
  logger.error(f"Error in chat: {e}")
204
  raise
205
 
206
+ def generate_response(
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
207
  self,
208
  prompt: str,
209
  max_length: int = 1000
 
226
  top_p=0.9,
227
  do_sample=True,
228
  no_repeat_ngram_size=3,
229
+ early_stopping=False
 
230
  )
231
 
232
  response = self.tokenizer.decode(
 
238
 
239
  except Exception as e:
240
  logger.error(f"Error generating response: {e}")
241
+ raise