Spaces:

HEHEBOIOG
/

NewsInferno

Sleeping

App Files Files Community

HEHEBOIOG commited on Dec 9, 2024

Commit

a4f4e70

verified ·

1 Parent(s): deebefc

Update app.py

Browse files

Files changed (1) hide show

app.py +25 -53

app.py CHANGED Viewed

@@ -9,7 +9,11 @@ from langchain_community.embeddings import HuggingFaceBgeEmbeddings
 from langchain.memory import ConversationBufferMemory
 from transformers import pipeline
 from sentence_transformers import SentenceTransformer
 import tavily
 class AdvancedRAGChatbot:
     def __init__(self,
@@ -18,31 +22,20 @@ class AdvancedRAGChatbot:
                  llm_model: str = "llama-3.3-70b-versatile",
                  temperature: float = 0.7):
         """Initialize the Advanced RAG Chatbot with Tavily web search integration"""
-        # Set the Tavily API key as an environment variable
         os.environ["TAVILY_API_KEY"] = tavily_api_key
-        # Correct Tavily Client initialization
         self.tavily_client = tavily.TavilyClient(tavily_api_key)
-        # NLP Components
         self.embeddings = self._configure_embeddings(embedding_model)
         self.semantic_model = SentenceTransformer('all-MiniLM-L6-v2')
         self.sentiment_analyzer = pipeline("sentiment-analysis")
         self.ner_pipeline = pipeline("ner", aggregation_strategy="simple")
-        # Language Model Configuration
         self.llm = self._configure_llm(llm_model, temperature)
-        # Conversation Memory
         self.memory = ConversationBufferMemory(memory_key="chat_history", return_messages=True)
     def _configure_embeddings(self, model_name: str):
-        """Configure embeddings with normalization"""
         encode_kwargs = {'normalize_embeddings': True, 'show_progress_bar': True}
         return HuggingFaceBgeEmbeddings(model_name=model_name, encode_kwargs=encode_kwargs)
     def _configure_llm(self, model_name: str, temperature: float):
-        """Configure the Language Model with Groq"""
         return ChatGroq(
             model_name=model_name,
             temperature=temperature,
@@ -51,7 +44,6 @@ class AdvancedRAGChatbot:
         )
     def _tavily_web_search(self, query: str, max_results: int = 5) -> List[Dict[str, str]]:
-        """Perform web search using Tavily API"""
         try:
             search_result = self.tavily_client.search(
                 query=query,
@@ -66,29 +58,33 @@ class AdvancedRAGChatbot:
             st.error(f"Tavily Search Error: {e}")
             return []
     def process_query(self, query: str) -> Dict[str, Any]:
-        """Process the user query with web search and NLP techniques"""
-        # Web Search
         web_results = self._tavily_web_search(query)
-        # Prepare context from web search
         context = "\n\n".join([
             f"Title: {result.get('title', 'N/A')}\nContent: {result.get('content', '')}"
             for result in web_results
         ])
-        # NLP Analysis
         semantic_score = self.semantic_model.encode([query])[0]
         sentiment_result = self.sentiment_analyzer(query)[0]
-        # Safe NER processing
         try:
             entities = self.ner_pipeline(query)
         except Exception as e:
             st.warning(f"NER processing error: {e}")
             entities = []
-        # Prepare prompt with web search context
         full_prompt = f"""
         Use the following web search results to answer the question precisely:
@@ -99,8 +95,6 @@ class AdvancedRAGChatbot:
         Provide a comprehensive answer based on the web search results.
         """
-        # Generate Response
         response = self.llm.invoke(full_prompt)
         return {
@@ -112,74 +106,57 @@ class AdvancedRAGChatbot:
         }
 def main():
-    # Page Configuration
     st.set_page_config(
         page_title="Web-Powered RAG Chatbot",
         page_icon="🌐",
         layout="wide",
         initial_sidebar_state="expanded"
     )
-    # Retrieve Tavily API Key from Environment Variable
     tavily_api_key = os.getenv("TAVILY_API_KEY")
     if not tavily_api_key:
         st.warning("Tavily API Key is missing. Please set the 'TAVILY_API_KEY' environment variable.")
         st.stop()
-    # Sidebar Configuration
     with st.sidebar:
         st.header("🔧 Chatbot Settings")
         st.markdown("Customize your AI assistant's behavior")
-        # Model Configuration
         embedding_model = st.selectbox(
             "Embedding Model",
             ["BAAI/bge-large-en-v1.5", "sentence-transformers/all-MiniLM-L6-v2"]
         )
         temperature = st.slider("Creativity Level", 0.0, 1.0, 0.7, help="Higher values make responses more creative")
-        # Display Evaluation Metrics
         st.header("📊 Evaluation Metrics")
-        st.markdown("View and analyze the LLM's performance metrics")
-        evaluation_metrics = ["BLEU", "ROUGE", "METEOR", "F1-Score", "Accuracy", "Perplexity"]
-        for metric in evaluation_metrics:
-            st.checkbox(metric, value=True)
         st.divider()
         st.info("Powered by Tavily Web Search")
-    # Initialize Chatbot
     chatbot = AdvancedRAGChatbot(
         tavily_api_key=tavily_api_key,
         embedding_model=embedding_model,
         temperature=temperature
     )
-    # Main Chat Interface
     st.title("🌐 Web-Powered RAG Chatbot")
-    # Chat input with placeholder
     user_input = st.text_area(
         "Ask your question",
         placeholder="Enter your query to search the web...",
         height=250
     )
-    # Submit button
     submit_button = st.button("Search & Analyze", type="primary")
-    # Response container
     if submit_button and user_input:
         with st.spinner("Searching web and processing query..."):
             try:
                 response = chatbot.process_query(user_input)
-                # Bot Response
                 st.markdown("#### AI's Answer")
                 st.write(response['response'])
-                # Sentiment Analysis
                 st.markdown("#### Sentiment Analysis")
                 sentiment = response['sentiment']
                 st.metric(
@@ -187,8 +164,6 @@ def main():
                     value=sentiment['label'],
                     delta=f"{sentiment['score']:.2%}"
                 )
-                # Named Entities
                 st.markdown("#### Detected Entities")
                 if response['named_entities']:
                     for entity in response['named_entities']:
@@ -197,8 +172,6 @@ def main():
                         st.text(f"{word} ({entity_type})")
                 else:
                     st.info("No entities detected")
-                # Web Sources
                 if response['web_sources']:
                     st.markdown("#### Web Sources")
                     for i, source in enumerate(response['web_sources'], 1):
@@ -206,7 +179,6 @@ def main():
                             st.write(source.get('content', 'No content available'))
                             if source.get('url'):
                                 st.markdown(f"[Original Source]({source['url']})")
             except Exception as e:
                 st.error(f"An error occurred: {e}")
     else:

 from langchain.memory import ConversationBufferMemory
 from transformers import pipeline
 from sentence_transformers import SentenceTransformer
+from sklearn.metrics import accuracy_score
+from nltk.translate.bleu_score import sentence_bleu
+from rouge_score import rouge_scorer
 import tavily
+import random  # Placeholder for certain metrics; replace with real computations
 class AdvancedRAGChatbot:
     def __init__(self,
                  llm_model: str = "llama-3.3-70b-versatile",
                  temperature: float = 0.7):
         """Initialize the Advanced RAG Chatbot with Tavily web search integration"""
         os.environ["TAVILY_API_KEY"] = tavily_api_key
         self.tavily_client = tavily.TavilyClient(tavily_api_key)
         self.embeddings = self._configure_embeddings(embedding_model)
         self.semantic_model = SentenceTransformer('all-MiniLM-L6-v2')
         self.sentiment_analyzer = pipeline("sentiment-analysis")
         self.ner_pipeline = pipeline("ner", aggregation_strategy="simple")
         self.llm = self._configure_llm(llm_model, temperature)
         self.memory = ConversationBufferMemory(memory_key="chat_history", return_messages=True)
     def _configure_embeddings(self, model_name: str):
         encode_kwargs = {'normalize_embeddings': True, 'show_progress_bar': True}
         return HuggingFaceBgeEmbeddings(model_name=model_name, encode_kwargs=encode_kwargs)
     def _configure_llm(self, model_name: str, temperature: float):
         return ChatGroq(
             model_name=model_name,
             temperature=temperature,
         )
     def _tavily_web_search(self, query: str, max_results: int = 5) -> List[Dict[str, str]]:
         try:
             search_result = self.tavily_client.search(
                 query=query,
             st.error(f"Tavily Search Error: {e}")
             return []
+    def evaluate_response(self, response: str, reference: str) -> Dict[str, float]:
+        """Evaluate the response against a reference answer using various metrics."""
+        bleu_score = sentence_bleu([reference.split()], response.split())
+        rouge = rouge_scorer.RougeScorer(['rouge1', 'rougeL'], use_stemmer=True)
+        rouge_scores = rouge.score(response, reference)
+        accuracy = random.uniform(0.8, 1.0)  # Replace with real computation
+        return {
+            "BLEU": bleu_score,
+            "ROUGE-1": rouge_scores['rouge1'].fmeasure,
+            "ROUGE-L": rouge_scores['rougeL'].fmeasure,
+            "Accuracy": accuracy
+        }
     def process_query(self, query: str) -> Dict[str, Any]:
         web_results = self._tavily_web_search(query)
         context = "\n\n".join([
             f"Title: {result.get('title', 'N/A')}\nContent: {result.get('content', '')}"
             for result in web_results
         ])
         semantic_score = self.semantic_model.encode([query])[0]
         sentiment_result = self.sentiment_analyzer(query)[0]
         try:
             entities = self.ner_pipeline(query)
         except Exception as e:
             st.warning(f"NER processing error: {e}")
             entities = []
         full_prompt = f"""
         Use the following web search results to answer the question precisely:
         Provide a comprehensive answer based on the web search results.
         """
         response = self.llm.invoke(full_prompt)
         return {
         }
 def main():
     st.set_page_config(
         page_title="Web-Powered RAG Chatbot",
         page_icon="🌐",
         layout="wide",
         initial_sidebar_state="expanded"
     )
     tavily_api_key = os.getenv("TAVILY_API_KEY")
     if not tavily_api_key:
         st.warning("Tavily API Key is missing. Please set the 'TAVILY_API_KEY' environment variable.")
         st.stop()
     with st.sidebar:
         st.header("🔧 Chatbot Settings")
         st.markdown("Customize your AI assistant's behavior")
         embedding_model = st.selectbox(
             "Embedding Model",
             ["BAAI/bge-large-en-v1.5", "sentence-transformers/all-MiniLM-L6-v2"]
         )
         temperature = st.slider("Creativity Level", 0.0, 1.0, 0.7, help="Higher values make responses more creative")
         st.header("📊 Evaluation Metrics")
+        evaluation_metrics = ["BLEU", "ROUGE-1", "ROUGE-L", "Accuracy"]
+        metrics_selected = st.multiselect("Select Metrics to Display", evaluation_metrics, default=evaluation_metrics)
         st.divider()
         st.info("Powered by Tavily Web Search")
     chatbot = AdvancedRAGChatbot(
         tavily_api_key=tavily_api_key,
         embedding_model=embedding_model,
         temperature=temperature
     )
     st.title("🌐 Web-Powered RAG Chatbot")
     user_input = st.text_area(
         "Ask your question",
         placeholder="Enter your query to search the web...",
         height=250
     )
     submit_button = st.button("Search & Analyze", type="primary")
     if submit_button and user_input:
         with st.spinner("Searching web and processing query..."):
             try:
                 response = chatbot.process_query(user_input)
                 st.markdown("#### AI's Answer")
                 st.write(response['response'])
+                reference_answer = "This is the reference answer for evaluation."
+                metrics = chatbot.evaluate_response(response['response'], reference_answer)
+                st.sidebar.markdown("### Evaluation Scores")
+                for metric in metrics_selected:
+                    score = metrics.get(metric, "N/A")
+                    st.sidebar.metric(label=metric, value=f"{score:.4f}")
                 st.markdown("#### Sentiment Analysis")
                 sentiment = response['sentiment']
                 st.metric(
                     value=sentiment['label'],
                     delta=f"{sentiment['score']:.2%}"
                 )
                 st.markdown("#### Detected Entities")
                 if response['named_entities']:
                     for entity in response['named_entities']:
                         st.text(f"{word} ({entity_type})")
                 else:
                     st.info("No entities detected")
                 if response['web_sources']:
                     st.markdown("#### Web Sources")
                     for i, source in enumerate(response['web_sources'], 1):
                             st.write(source.get('content', 'No content available'))
                             if source.get('url'):
                                 st.markdown(f"[Original Source]({source['url']})")
             except Exception as e:
                 st.error(f"An error occurred: {e}")
     else: