Spaces:

Reality123b
/

XylariaDeepReason

Sleeping

App Files Files Community

Reality123b committed on Feb 17

Commit

fcf4ade

verified ·

1 Parent(s): 48a64eb

Update app.py

Browse files

Files changed (1) hide show

app.py +144 -86

app.py CHANGED Viewed

@@ -17,8 +17,7 @@ import arxiv
 import scholarly
 import pymed
 import wikipedia
-#from newspaper3k import Article  # Removed newspaper3k
-import trafilatura  # Import trafilatura
 from trafilatura import extract, fetch_url
 import pickle
 import faiss
@@ -38,18 +37,20 @@ client = InferenceClient(provider="hf-inference", api_key=HF_API_KEY)
 MAIN_LLM_MODEL = "mistralai/Mistral-Nemo-Instruct-2407"
 REASONING_LLM_MODEL = "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B"
 CRITIC_LLM_MODEL = "Qwen/QwQ-32B-Preview"
-ENSEMBLE_MODELS = [MAIN_LLM_MODEL, REASONING_LLM_MODEL, CRITIC_LLM_MODEL]
-MAX_ITERATIONS = 20
-TIMEOUT = 120
-RETRY_DELAY = 5
-NUM_RESULTS = 15
 SIMILARITY_THRESHOLD = 0.15
-MAX_CONTEXT_ITEMS = 30
-MAX_HISTORY_ITEMS = 8
-MAX_FULL_TEXT_LENGTH = 10000
 FAISS_INDEX_PATH = "research_index.faiss"
 RESEARCH_DATA_PATH = "research_data.pkl"
 try:
     main_similarity_model = SentenceTransformer('sentence-transformers/all-mpnet-base-v2')
@@ -61,7 +62,7 @@ try:
         index = faiss.read_index(FAISS_INDEX_PATH)
         logger.info(f"Loaded FAISS index from {FAISS_INDEX_PATH}")
     else:
-        index = faiss.IndexFlatIP(embedding_dim)
         logger.info("Created a new FAISS index.")
 except Exception as e:
     logger.error(f"Failed to load models or initialize FAISS: {e}")
@@ -97,6 +98,29 @@ def load_research_data():
         logger.info("No existing research data found.")
         return {}
 def hf_inference(model_name, prompt, max_tokens=2000, retries=5):
     for attempt in range(retries):
         try:
@@ -137,11 +161,11 @@ def ensemble_inference(prompt, models=ENSEMBLE_MODELS, max_tokens=1500):
     for result in results:
         synthesis_prompt += f"Expert {results.index(result) + 1} ({result['model'].split('/')[-1]}):\n{result['text']}\n\n"
-    synthesis = hf_inference(MAIN_LLM_MODEL, synthesis_prompt)
     if "generated_text" in synthesis:
         return synthesis
     else:
-        return {"generated_text": max(results, key=lambda x: len(x["text"]))["text"]}
 def tool_search_web(query: str, num_results: int = NUM_RESULTS, safesearch: str = "moderate",
                    time_filter: Optional[str] = None, region: str = "wt-wt", language: str = "en-us") -> list:
@@ -170,19 +194,6 @@ def tool_search_web(query: str, num_results: int = NUM_RESULTS, safesearch: str
                 return []
     except Exception as e:
         logger.error(f"DuckDuckGo search error: {e}")
-        try:
-            with DDGS() as ddgs:
-                results = [r for r in ddgs.text(
-                    keywords=query,
-                    max_results=num_results,
-                    safesearch=safesearch,
-                    region=region,
-                    hreflang=language
-                )]
-                if results:
-                    return [{"title": r["title"], "snippet": r["body"], "url": r["href"]} for r in results]
-        except Exception as e2:
-            logger.error(f"Fallback DuckDuckGo search also failed: {e2}")
         return []
 def tool_search_arxiv(query: str, max_results: int = 5) -> list:
@@ -284,9 +295,9 @@ def tool_search_scholar(query: str, max_results: int = 5) -> list:
 def extract_article_content(url: str) -> str:
     """Download ``url`` and return its extracted main text.

     Args:
         url: Address of the page to fetch.

     Returns:
         The text produced by ``extract`` (called with
         ``favor_precision=True``), or an empty string when the download
         yields nothing, when no text is extracted, or when any exception
         is raised along the way.
     """
     try:
         downloaded = fetch_url(url)
         if downloaded is None:
             # Nothing was downloaded, so there is nothing to extract.
             return ""
         # extract() can return None when it finds no usable content;
         # coerce to "" so the declared ``str`` return type always holds.
         return extract(downloaded, favor_precision=True) or ""
     except Exception as e:
         # Best-effort helper: log the failure and fall back to "".
         logger.error(f"Failed to extract article content from {url}: {e}")
         return ""
@@ -304,7 +315,7 @@ def tool_reason(prompt: str, search_results: list, reasoning_context: list = [],
     results_by_source = {}
     for i, result in enumerate(search_results):
-        source = result.get('source', 'Web Search')
         if source not in results_by_source:
             results_by_source[source] = []
         results_by_source[source].append((i, result))
@@ -320,15 +331,15 @@ def tool_reason(prompt: str, search_results: list, reasoning_context: list = [],
             reasoning_input += "\n"
     if reasoning_context:
-        recent_context = reasoning_context[-MAX_HISTORY_ITEMS:]
         reasoning_input += "\nPrevious Reasoning Context:\n" + "\n".join(recent_context)
     if critique:
         reasoning_input += f"\n\nRecent critique to address: {critique}\n"
-    reasoning_input += "\nProvide a thorough, nuanced analysis that builds upon previous reasoning if applicable. Consider multiple perspectives, potential contradictions in the search results, and the reliability of different sources."
-    reasoning_output = ensemble_inference(reasoning_input)
     if isinstance(reasoning_output, dict) and "generated_text" in reasoning_output:
         return reasoning_output["generated_text"].strip()
@@ -342,7 +353,7 @@ def tool_summarize(insights: list, prompt: str, contradictions: list = []) -> st
     summarization_input = f"Synthesize the following insights into a cohesive and comprehensive summary regarding: '{prompt}'\n\n"
-    max_tokens = 12000
     selected_insights = []
     token_count = get_token_count(summarization_input) + get_token_count("\n\n".join(contradictions))
@@ -403,7 +414,7 @@ def tool_critique_reasoning(reasoning_output: str, prompt: str,
     critique_input += "Identify any flaws, biases, logical fallacies, unsupported claims, or areas for improvement. Be specific and constructive. Suggest concrete ways to enhance the reasoning. Also evaluate the strength of evidence and whether conclusions are proportionate to the available information."
-    critique_output = hf_inference(CRITIC_LLM_MODEL, critique_input)
     if isinstance(critique_output, dict) and "generated_text" in critique_output:
         return critique_output["generated_text"].strip()
@@ -415,7 +426,7 @@ def tool_identify_contradictions(insights: list) -> list:
     if len(insights) < 2:
         return []
-    max_tokens = 12000
     selected_insights = []
     token_count = 0
@@ -430,13 +441,13 @@ def tool_identify_contradictions(insights: list) -> list:
     contradiction_input = "Identify specific contradictions in these insights:\n\n" + "\n\n".join(selected_insights)
     contradiction_input += "\n\nList each contradiction as a separate numbered point. For each contradiction, cite the specific claims that are in tension and evaluate which claim is better supported. If no contradictions exist, respond with 'No contradictions found.'"
-    contradiction_output = hf_inference(CRITIC_LLM_MODEL, contradiction_input)
     if isinstance(contradiction_output, dict) and "generated_text" in contradiction_output:
         result = contradiction_output["generated_text"].strip()
         if result == "No contradictions found.":
             return []
         contradictions = re.findall(r'\d+\.\s+(.*?)(?=\d+\.|$)', result, re.DOTALL)
         return [c.strip() for c in contradictions if c.strip()]
@@ -456,10 +467,11 @@ def tool_identify_focus_areas(prompt: str, insights: list = [],
     focus_input += "Identify 3-5 specific aspects that should be investigated further to get a complete understanding. Be precise and prioritize underexplored areas. For each suggested area, briefly explain why it's important to investigate."
-    focus_output = hf_inference(MAIN_LLM_MODEL, focus_input)
     if isinstance(focus_output, dict) and "generated_text" in focus_output:
         result = focus_output["generated_text"].strip()
         areas = re.findall(r'(?:^|\n)(?:\d+\.|\*|\-)\s*(.*?)(?=(?:\n(?:\d+\.|\*|\-|$))|$)', result)
         return [area.strip() for area in areas if area.strip()][:5]
@@ -472,7 +484,7 @@ def add_to_faiss_index(text: str):
     if embedding_np.shape[1] != embedding_dim:
         logger.error(f"Embedding dimension mismatch: expected {embedding_dim}, got {embedding_np.shape[1]}")
         return
-    faiss.normalize_L2(embedding_np)
     index.add(embedding_np)
 def search_faiss_index(query: str, top_k: int = 5) -> List[str]:
@@ -497,7 +509,7 @@ def filter_results(search_results, prompt, previous_snippets=None):
         for result in search_results:
             combined_text = result['title'] + " " + result['snippet']
-            if result['snippet'] in seen_snippets:
                 continue
             result_embedding = main_similarity_model.encode(combined_text, convert_to_tensor=True)
@@ -506,16 +518,16 @@ def filter_results(search_results, prompt, previous_snippets=None):
             if cosine_score >= SIMILARITY_THRESHOLD:
                 result['relevance_score'] = cosine_score
                 filtered_results.append(result)
-                seen_snippets.add(result['snippet'])
                 add_to_faiss_index(result['snippet'])
-        filtered_results.sort(key=lambda x: x.get('relevance_score', 0), reverse=True)
         return filtered_results
     except Exception as e:
         logger.error(f"Error during filtering: {e}")
-        return search_results
 def tool_extract_key_entities(prompt: str) -> list:
     entity_input = f"Extract the key entities (people, organizations, concepts, technologies, events, time periods, locations, etc.) from this research prompt that should be investigated individually:\n\n{prompt}\n\nList the 5-7 most important entities, one per line, with a brief explanation (2-3 sentences) of why each is central to the research question."
@@ -525,7 +537,7 @@ def tool_extract_key_entities(prompt: str) -> list:
     if isinstance(entity_output, dict) and "generated_text" in entity_output:
         result = entity_output["generated_text"].strip()
         entities = [e.strip() for e in result.split('\n') if e.strip()]
-        return entities[:7]
     logger.error(f"Failed to extract key entities: {entity_output}")
     return []
@@ -538,11 +550,11 @@ def tool_meta_analyze(entity_insights: Dict[str, list], prompt: str) -> str:
     for entity, insights in entity_insights.items():
         if insights:
-            meta_input += f"\n--- {entity} ---\n" + insights[-1] + "\n"
     meta_input += "\nProvide a high-level synthesis that identifies:\n1. Common themes across entities\n2. Important differences and contradictions\n3. How these entities interact or influence each other\n4. The broader implications for the original research question\n5. A systems-level understanding of how these elements fit together"
-    meta_output = ensemble_inference(meta_input)
     if isinstance(meta_output, dict) and "generated_text" in meta_output:
         return meta_output["generated_text"].strip()
@@ -567,7 +579,7 @@ def tool_draft_research_plan(prompt: str, entities: list, focus_areas: list = []
     plan_input += "5. Potential challenges and how to address them\n"
     plan_input += "6. Criteria for evaluating the quality of findings"
-    plan_output = hf_inference(REASONING_LLM_MODEL, plan_input)
     if isinstance(plan_output, dict) and "generated_text" in plan_output:
         return plan_output["generated_text"].strip()
@@ -576,10 +588,31 @@ def tool_draft_research_plan(prompt: str, entities: list, focus_areas: list = []
     return "Could not generate a research plan due to an error."
 def tool_extract_article(url: str) -> str:
     """Return the article text extracted from ``url``.

     Delegates to ``extract_article_content``; when that yields an empty
     (falsy) result, a human-readable failure message naming the URL is
     returned instead.
     """
     content = extract_article_content(url)
     if content:
         return content
     return f"Could not extract content from {url}"
 tools = {
     "search_web": {
         "function": tool_search_web,
@@ -630,6 +663,13 @@ tools = {
         "parameters": {
             "url": {"type": "string", "description": "The URL of the article to extract"}
         },
     },
     "reason": {
         "function": tool_reason,
@@ -734,16 +774,13 @@ Available Tools:
 Instructions:
 Select the BEST tool and parameters for the current research stage. Output valid JSON. If no tool is appropriate, respond with {}.
 Only use provided tools. Be strategic about which tool to use next based on the research progress so far.
 You MUST be methodical.  Think step-by-step:
 1.  **Plan:** If it's the very beginning, extract key entities, identify focus areas, and then draft a research plan.
 2.  **Search:**  Use a variety of search tools.  Start with broad searches, then narrow down.  Use specific search tools (arXiv, PubMed, Scholar) for relevant topics.
 3.  **Analyze:**  Reason deeply about search results, and critique your reasoning.  Identify contradictions. Filter and use FAISS index for relevant information.
 4.  **Refine:** If results are poor, generate *better* search queries. Adjust focus areas.
 5.  **Iterate:** Repeat steps 2-4, focusing on different entities and aspects.
 6.  **Synthesize:**  Finally, summarize the findings, addressing contradictions.
 Example:
 {"tool": "search_web", "parameters": {"query": "Eiffel Tower location"}}
 Output:
@@ -753,7 +790,8 @@ Output:
 def deep_research(prompt):
     task_description = "You are an advanced research assistant. Use available tools iteratively, focus on different aspects, follow promising leads, critically evaluate your findings, and build up a comprehensive understanding. Utilize the FAISS index to avoid redundant searches and build a persistent knowledge base."
     research_data = load_research_data()
     context = research_data.get('context', [])
     all_insights = research_data.get('all_insights', [])
     entity_specific_insights = research_data.get('entity_specific_insights', {})
@@ -776,47 +814,50 @@ def deep_research(prompt):
         logger.info("Initialized a fresh FAISS Index")
     key_entities_with_descriptions = tool_extract_key_entities(prompt=prompt)
-    key_entities = [e.split(":")[0].strip() for e in key_entities_with_descriptions]
     if key_entities:
         context.append(f"Identified key entities: {key_entities}")
         intermediate_output += f"Identified key entities for focused research: {key_entities_with_descriptions}\n"
     entity_progress = {entity: {'queries': [], 'insights': []} for entity in key_entities}
-    entity_progress['general'] = {'queries': [], 'insights': []}
     for entity in key_entities + ['general']:
-        if entity in research_data:
             entity_progress[entity]['queries'] = research_data[entity]['queries']
             entity_progress[entity]['insights'] = research_data[entity]['insights']
     if not focus_areas:  # Corrected placement: outside the loop
         initial_focus_areas = tool_identify_focus_areas(prompt=prompt)
         research_plan = tool_draft_research_plan(prompt=prompt, entities=key_entities, focus_areas=initial_focus_areas)
-        context.append(f"Initial Research Plan: {research_plan[:200]}...")
         intermediate_output += f"Initial Research Plan:\n{research_plan}\n\n"
         focus_areas = initial_focus_areas
     for i in range(MAX_ITERATIONS):
-        if key_entities and i > 0:
-            entities_to_process = key_entities + ['general']
             current_entity = entities_to_process[i % len(entities_to_process)]
         else:
-            current_entity = 'general'
         context.append(f"Current focus: {current_entity}")
-        if i > 0:
             faiss_results_indices = search_faiss_index(prompt if current_entity == 'general' else f"{prompt} {current_entity}")
             faiss_context = []
             for idx in faiss_results_indices:
-                if idx < len(all_insights):
                     faiss_context.append(f"Previously found insight: {all_insights[idx]}")
             if faiss_context:
-                context.extend(faiss_context)
                 intermediate_output += f"Iteration {i+1} - Retrieved {len(faiss_context)} relevant items from FAISS index.\n"
-        if i == 0:
             initial_query = tool_generate_search_query(prompt=prompt)
             if initial_query:
                 previous_queries.append(initial_query)
@@ -861,6 +902,7 @@ def deep_research(prompt):
                 previous_queries.append(entity_query)
                 entity_progress[current_entity]['queries'].append(entity_query)
                 with ThreadPoolExecutor(max_workers=5) as executor:
                     futures = [
                         executor.submit(tool_search_web, query=entity_query, num_results=NUM_RESULTS//2),
@@ -874,9 +916,10 @@ def deep_research(prompt):
                     for future in as_completed(futures):
                         search_results.extend(future.result())
                 filtered_search_results = filter_results(search_results,
                                                         f"{prompt} {current_entity}",
-                                                        previous_snippets=seen_snippets)
                 if filtered_search_results:
                     context.append(f"Entity Search for {current_entity}: {len(filtered_search_results)} results")
@@ -884,7 +927,7 @@ def deep_research(prompt):
                     entity_reasoning = tool_reason(
                         prompt=f"{prompt} focusing on {current_entity}",
                         search_results=filtered_search_results,
-                        reasoning_context=entity_progress[current_entity]['insights'],
                         focus_areas=focus_areas
                     )
@@ -915,17 +958,17 @@ def deep_research(prompt):
         try:
             response_text = llm_response["generated_text"].strip()
-            response_json = json.loads(response_text)
             intermediate_output += f"Iteration {i+1} - Focus: {current_entity} - Action: {response_text}\n"
         except json.JSONDecodeError:
             intermediate_output += f"Iteration {i+1} - LLM Response (Invalid JSON): {llm_response['generated_text'][:100]}...\n"
-            context.append(f"Invalid JSON: {llm_response['generated_text'][:100]}...")
             continue
         tool_name = response_json.get("tool")
         parameters = response_json.get("parameters", {})
-        if not tool_name:
             if all_insights:
                 if i > MAX_ITERATIONS // 2:
                     break
@@ -947,7 +990,7 @@ def deep_research(prompt):
                 result = tool["function"](**parameters)
                 if current_entity != 'general':
-                    entity_progress[current_entity]['queries'].append(result)
                 previous_queries.append(result)
@@ -959,12 +1002,13 @@ def deep_research(prompt):
                 filtered_result = filter_results(result, search_prompt, previous_snippets=seen_snippets)
-                result = filtered_result
-                if not result and 'query' in parameters:
                     failed_queries.append(parameters['query'])
             elif tool_name == "reason":
                 if current_entity != 'general' and 'reasoning_context' not in parameters:
                     parameters['reasoning_context'] = entity_progress[current_entity]['insights']
                 elif 'reasoning_context' not in parameters:
@@ -977,9 +1021,9 @@ def deep_research(prompt):
                         parameters['prompt'] = prompt
                 if 'search_results' not in parameters:
-                    parameters['search_results'] = []
-                if 'focus_areas' not in parameters and focus_areas:
                     parameters['focus_areas'] = focus_areas
                 result = tool["function"](**parameters)
@@ -987,20 +1031,20 @@ def deep_research(prompt):
                 if current_entity != 'general':
                     entity_progress[current_entity]['insights'].append(result)
                     if current_entity not in entity_specific_insights:
-                        entity_specific_insights[current_entity] = []
                     entity_specific_insights[current_entity].append(result)
                 else:
-                    reasoning_context.append(result)
                 add_to_faiss_index(result)
                 all_insights.append(result)
             elif tool_name == "critique_reasoning":
-                if 'previous_critiques' not in parameters:
                     parameters['previous_critiques'] = previous_critiques
                 if all_insights:
                     if 'reasoning_output' not in parameters:
-                        parameters['reasoning_output'] = all_insights[-1]
                     if 'prompt' not in parameters:
                         parameters['prompt'] = prompt
@@ -1013,7 +1057,7 @@ def deep_research(prompt):
             elif tool_name == "identify_contradictions":
                 result = tool["function"](**parameters)
                 if result:
-                    contradictions = result
                     context.append(f"Identified contradictions: {result}")
             elif tool_name == "identify_focus_areas":
@@ -1022,19 +1066,28 @@ def deep_research(prompt):
                 result = tool["function"](**parameters)
                 if result:
                     old_focus = set(focus_areas)
-                    focus_areas = result
-                    failed_areas.extend([area for area in old_focus if area not in result])
                     context.append(f"New focus areas: {result}")
             elif tool_name == "extract_article":
                 result = tool["function"](**parameters)
                 if result:
                     context.append(f"Extracted article content from {parameters['url']}: {result[:200]}...")
                     reasoning_about_article = tool_reason(prompt=prompt, search_results=[{"title": "Extracted Article", "snippet": result, "url": parameters['url']}])
                     if reasoning_about_article:
                         all_insights.append(reasoning_about_article)
                         add_to_faiss_index(reasoning_about_article)
             elif tool_name == "meta_analyze":
                 if 'entity_insights' not in parameters:
@@ -1043,12 +1096,13 @@ def deep_research(prompt):
                     parameters['prompt'] = prompt
                 result = tool["function"](**parameters)
                 if result:
-                    all_insights.append(result)
                     context.append(f"Meta-analysis across entities: {result[:200]}...")
                     add_to_faiss_index(result)
             elif tool_name == "draft_research_plan":
-                result = "Research plan already generated."
             else:
                 result = tool["function"](**parameters)
@@ -1059,6 +1113,7 @@ def deep_research(prompt):
             intermediate_output += f"Iteration {i+1} - Result: {result_str}\n"
             result_context = result_str
             if len(result_str) > 300:
                 result_context = result_str[:300] + "..."
@@ -1070,6 +1125,7 @@ def deep_research(prompt):
             intermediate_output += f"Iteration {i+1} - Error: {str(e)}\n"
             continue
         research_data = {
             'context': context,
             'all_insights': all_insights,
@@ -1085,22 +1141,24 @@ def deep_research(prompt):
             'research_session_id': research_session_id
         }
         for entity in entity_progress:
-             research_data[entity] = entity_progress[entity]
         save_research_data(research_data, index)
     if len(entity_specific_insights) > 1 and len(all_insights) > 2:
         meta_analysis = tool_meta_analyze(entity_insights=entity_specific_insights, prompt=prompt)
         if meta_analysis:
             all_insights.append(meta_analysis)
             intermediate_output += f"Final Meta-Analysis: {meta_analysis[:500]}...\n"
-            add_to_faiss_index(meta_analysis)
     if all_insights:
-        final_result = tool_summarize(all_insights, prompt, contradictions)
     else:
         final_result = "Could not find meaningful information despite multiple attempts."
     full_output = f"**Research Prompt:** {prompt}\n\n"
     if key_entities_with_descriptions:

 import scholarly
 import pymed
 import wikipedia
+import trafilatura
 from trafilatura import extract, fetch_url
 import pickle
 import faiss
 MAIN_LLM_MODEL = "mistralai/Mistral-Nemo-Instruct-2407"
 REASONING_LLM_MODEL = "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B"
 CRITIC_LLM_MODEL = "Qwen/QwQ-32B-Preview"
+ENSEMBLE_MODELS = [MAIN_LLM_MODEL, REASONING_LLM_MODEL, CRITIC_LLM_MODEL]  # Keep, but expand upon.
+MAX_ITERATIONS = 40  # Increased for deeper research.
+TIMEOUT = 180 # Longer timeout for larger models / complex tasks.
+RETRY_DELAY = 10 # longer delay
+NUM_RESULTS = 20
 SIMILARITY_THRESHOLD = 0.15
+MAX_CONTEXT_ITEMS = 50  # Increased context window.
+MAX_HISTORY_ITEMS = 12
+MAX_FULL_TEXT_LENGTH = 20000 # larger document size
 FAISS_INDEX_PATH = "research_index.faiss"
 RESEARCH_DATA_PATH = "research_data.pkl"
+PAPER_SUMMARIES_PATH = "paper_summaries.pkl" #New path for storing paper summary
 try:
     main_similarity_model = SentenceTransformer('sentence-transformers/all-mpnet-base-v2')
         index = faiss.read_index(FAISS_INDEX_PATH)
         logger.info(f"Loaded FAISS index from {FAISS_INDEX_PATH}")
     else:
+        index = faiss.IndexFlatIP(embedding_dim)  # Use IndexFlatIP for inner product (cosine similarity).
         logger.info("Created a new FAISS index.")
 except Exception as e:
     logger.error(f"Failed to load models or initialize FAISS: {e}")
         logger.info("No existing research data found.")
         return {}
def save_paper_summaries(summaries: Dict[str, str]):
    """Pickle ``summaries`` to ``PAPER_SUMMARIES_PATH``.

    The data is first written to a sibling temporary file and then moved
    over the destination with ``os.replace``, so a failure part-way
    through the dump does not truncate a previously saved file.

    Args:
        summaries: Mapping of paper summaries to persist.

    Returns:
        None. Errors are logged rather than raised (best-effort save).
    """
    tmp_path = f"{PAPER_SUMMARIES_PATH}.tmp"
    try:
        with open(tmp_path, "wb") as f:
            pickle.dump(summaries, f)
        # Swap the fully written file into place in one step.
        os.replace(tmp_path, PAPER_SUMMARIES_PATH)
        logger.info(f"Paper summaries saved to {PAPER_SUMMARIES_PATH}")
    except Exception as e:
        # A stale temp file may remain; the next save overwrites it.
        logger.error(f"Error saving paper summaries: {e}")
def load_paper_summaries() -> Dict[str, str]:
    """Load the pickled paper summaries from ``PAPER_SUMMARIES_PATH``.

    Returns:
        The unpickled object when the file exists and loads cleanly;
        otherwise an empty dict (file missing, or any error while
        reading or unpickling, which is logged).
    """
    if not os.path.exists(PAPER_SUMMARIES_PATH):
        logger.info("No existing paper summaries found.")
        return {}

    try:
        with open(PAPER_SUMMARIES_PATH, "rb") as handle:
            # NOTE(review): pickle.load can execute arbitrary code from the
            # file; presumably this file is only ever written by this app.
            # Confirm before pointing the path at shared storage.
            summaries = pickle.load(handle)
            logger.info(f"Loaded paper summaries from {PAPER_SUMMARIES_PATH}")
            return summaries
    except Exception as err:
        logger.error(f"Error loading paper summaries: {err}")
        return {}
 def hf_inference(model_name, prompt, max_tokens=2000, retries=5):
     for attempt in range(retries):
         try:
     for result in results:
         synthesis_prompt += f"Expert {results.index(result) + 1} ({result['model'].split('/')[-1]}):\n{result['text']}\n\n"
+    synthesis = hf_inference(MAIN_LLM_MODEL, synthesis_prompt) # Use a consistent model for final synthesis
     if "generated_text" in synthesis:
         return synthesis
     else:
+        return {"generated_text": max(results, key=lambda x: len(x["text"]))["text"]} # Fallback
 def tool_search_web(query: str, num_results: int = NUM_RESULTS, safesearch: str = "moderate",
                    time_filter: Optional[str] = None, region: str = "wt-wt", language: str = "en-us") -> list:
                 return []
     except Exception as e:
         logger.error(f"DuckDuckGo search error: {e}")
         return []
 def tool_search_arxiv(query: str, max_results: int = 5) -> list:
 def extract_article_content(url: str) -> str:
     """Download ``url`` and return its extracted main text.

     Args:
         url: Address of the page to fetch.

     Returns:
         The text produced by ``extract`` (called with
         ``favor_precision=True``), or an empty string when the download
         yields nothing, when no text is extracted, or when any exception
         is raised along the way.
     """
     try:
         downloaded = fetch_url(url)
         if downloaded is None:
             # Nothing was downloaded, so there is nothing to extract.
             return ""
         # extract() can return None when it finds no usable content;
         # coerce to "" so the declared ``str`` return type always holds.
         return extract(downloaded, favor_precision=True) or ""
     except Exception as e:
         # Best-effort helper: log the failure and fall back to "".
         logger.error(f"Failed to extract article content from {url}: {e}")
         return ""
     results_by_source = {}
     for i, result in enumerate(search_results):
+        source = result.get('source', 'Web Search') # Default to 'Web Search'
         if source not in results_by_source:
             results_by_source[source] = []
         results_by_source[source].append((i, result))
             reasoning_input += "\n"
     if reasoning_context:
+        recent_context = reasoning_context[-MAX_HISTORY_ITEMS:]  # Limit history
         reasoning_input += "\nPrevious Reasoning Context:\n" + "\n".join(recent_context)
     if critique:
         reasoning_input += f"\n\nRecent critique to address: {critique}\n"
+    reasoning_input += "\nProvide a thorough, nuanced analysis that builds upon previous reasoning if applicable. Consider multiple perspectives, potential contradictions in the search results, and the reliability of different sources.  Address any specific critiques."
+    reasoning_output = ensemble_inference(reasoning_input) # Use ensemble for high-quality reasoning.
     if isinstance(reasoning_output, dict) and "generated_text" in reasoning_output:
         return reasoning_output["generated_text"].strip()
     summarization_input = f"Synthesize the following insights into a cohesive and comprehensive summary regarding: '{prompt}'\n\n"
+    max_tokens = 12000  # Increased token limit
     selected_insights = []
     token_count = get_token_count(summarization_input) + get_token_count("\n\n".join(contradictions))
     critique_input += "Identify any flaws, biases, logical fallacies, unsupported claims, or areas for improvement. Be specific and constructive. Suggest concrete ways to enhance the reasoning. Also evaluate the strength of evidence and whether conclusions are proportionate to the available information."
+    critique_output = hf_inference(CRITIC_LLM_MODEL, critique_input) # Use specialized critique model.
     if isinstance(critique_output, dict) and "generated_text" in critique_output:
         return critique_output["generated_text"].strip()
     if len(insights) < 2:
         return []
+    max_tokens = 12000  # Increased token limit for potentially more contradictions
     selected_insights = []
     token_count = 0
     contradiction_input = "Identify specific contradictions in these insights:\n\n" + "\n\n".join(selected_insights)
     contradiction_input += "\n\nList each contradiction as a separate numbered point. For each contradiction, cite the specific claims that are in tension and evaluate which claim is better supported. If no contradictions exist, respond with 'No contradictions found.'"
+    contradiction_output = hf_inference(CRITIC_LLM_MODEL, contradiction_input)  # Use critique model
     if isinstance(contradiction_output, dict) and "generated_text" in contradiction_output:
         result = contradiction_output["generated_text"].strip()
         if result == "No contradictions found.":
             return []
+        # More robust contradiction extraction, handles multi-sentence contradictions
         contradictions = re.findall(r'\d+\.\s+(.*?)(?=\d+\.|$)', result, re.DOTALL)
         return [c.strip() for c in contradictions if c.strip()]
     focus_input += "Identify 3-5 specific aspects that should be investigated further to get a complete understanding. Be precise and prioritize underexplored areas. For each suggested area, briefly explain why it's important to investigate."
+    focus_output = hf_inference(MAIN_LLM_MODEL, focus_input)  # Consistent model
     if isinstance(focus_output, dict) and "generated_text" in focus_output:
         result = focus_output["generated_text"].strip()
+        # More robust extraction, handles different list formats
         areas = re.findall(r'(?:^|\n)(?:\d+\.|\*|\-)\s*(.*?)(?=(?:\n(?:\d+\.|\*|\-|$))|$)', result)
         return [area.strip() for area in areas if area.strip()][:5]
     if embedding_np.shape[1] != embedding_dim:
         logger.error(f"Embedding dimension mismatch: expected {embedding_dim}, got {embedding_np.shape[1]}")
         return
+    faiss.normalize_L2(embedding_np)  # Normalize for cosine similarity.
     index.add(embedding_np)
 def search_faiss_index(query: str, top_k: int = 5) -> List[str]:
         for result in search_results:
             combined_text = result['title'] + " " + result['snippet']
+            if result['snippet'] in seen_snippets:  # Prevent exact duplicates
                 continue
             result_embedding = main_similarity_model.encode(combined_text, convert_to_tensor=True)
             if cosine_score >= SIMILARITY_THRESHOLD:
                 result['relevance_score'] = cosine_score
                 filtered_results.append(result)
+                seen_snippets.add(result['snippet']) # Add snippets after filtering
                 add_to_faiss_index(result['snippet'])
+        filtered_results.sort(key=lambda x: x.get('relevance_score', 0), reverse=True)  # Sort by relevance.
         return filtered_results
     except Exception as e:
         logger.error(f"Error during filtering: {e}")
+        return search_results  # Return original results on error.
 def tool_extract_key_entities(prompt: str) -> list:
     entity_input = f"Extract the key entities (people, organizations, concepts, technologies, events, time periods, locations, etc.) from this research prompt that should be investigated individually:\n\n{prompt}\n\nList the 5-7 most important entities, one per line, with a brief explanation (2-3 sentences) of why each is central to the research question."
     if isinstance(entity_output, dict) and "generated_text" in entity_output:
         result = entity_output["generated_text"].strip()
         entities = [e.strip() for e in result.split('\n') if e.strip()]
+        return entities[:7] # Limit to top 7 entities
     logger.error(f"Failed to extract key entities: {entity_output}")
     return []
     for entity, insights in entity_insights.items():
         if insights:
+            meta_input += f"\n--- {entity} ---\n" + insights[-1] + "\n"  # Most recent insight for each entity
     meta_input += "\nProvide a high-level synthesis that identifies:\n1. Common themes across entities\n2. Important differences and contradictions\n3. How these entities interact or influence each other\n4. The broader implications for the original research question\n5. A systems-level understanding of how these elements fit together"
+    meta_output = ensemble_inference(meta_input)  # Ensemble for meta-analysis
     if isinstance(meta_output, dict) and "generated_text" in meta_output:
         return meta_output["generated_text"].strip()
     plan_input += "5. Potential challenges and how to address them\n"
     plan_input += "6. Criteria for evaluating the quality of findings"
+    plan_output = hf_inference(REASONING_LLM_MODEL, plan_input) # Use reasoning model
     if isinstance(plan_output, dict) and "generated_text" in plan_output:
         return plan_output["generated_text"].strip()
     return "Could not generate a research plan due to an error."
 def tool_extract_article(url: str) -> str:
     """Return the article text extracted from *url*.

     Delegates to ``extract_article_content``; when that helper yields a
     falsy result, a "Could not extract content" notice naming the URL is
     returned instead.
     """
     article_body = extract_article_content(url)
     if not article_body:
         return f"Could not extract content from {url}"
     return article_body
+# New tool for summarizing a single paper
+def tool_summarize_paper(paper_text: str) -> str:
+  summarization_prompt = f"""Summarize this academic paper, focusing on the following:
+1.  **Main Research Question(s):** What questions does the paper address?
+2.  **Methodology:** Briefly describe the methods used (e.g., experiments, surveys, simulations, theoretical analysis).
+3.  **Key Findings:** What are the most important results or conclusions?
+4.  **Limitations:**  What are the acknowledged limitations of the study?
+5.  **Implications:** What are the broader implications of the findings, according to the authors?
+Paper Text:
+{paper_text[:MAX_FULL_TEXT_LENGTH]}
+"""  # Truncate if necessary
+  summary = hf_inference(REASONING_LLM_MODEL, summarization_prompt, max_tokens=500)
+  if isinstance(summary, dict) and "generated_text" in summary:
+      return summary["generated_text"].strip()
+  else:
+      logger.error(f"Failed to generate summary: {summary}")
+      return "Could not generate a summary due to an error."
 tools = {
     "search_web": {
         "function": tool_search_web,
         "parameters": {
             "url": {"type": "string", "description": "The URL of the article to extract"}
         },
+    },
+        "summarize_paper": {
+        "function": tool_summarize_paper,
+        "description": "Summarizes the content of an academic paper.",
+        "parameters": {
+            "paper_text": {"type": "string", "description": "The full text of the paper to be summarized."},
+        },
     },
     "reason": {
         "function": tool_reason,
 Instructions:
 Select the BEST tool and parameters for the current research stage. Output valid JSON. If no tool is appropriate, respond with {}.
 Only use provided tools. Be strategic about which tool to use next based on the research progress so far.
 You MUST be methodical.  Think step-by-step:
 1.  **Plan:** If it's the very beginning, extract key entities, identify focus areas, and then draft a research plan.
 2.  **Search:**  Use a variety of search tools.  Start with broad searches, then narrow down.  Use specific search tools (arXiv, PubMed, Scholar) for relevant topics.
 3.  **Analyze:**  Reason deeply about search results, and critique your reasoning.  Identify contradictions. Filter and use FAISS index for relevant information.
 4.  **Refine:** If results are poor, generate *better* search queries. Adjust focus areas.
 5.  **Iterate:** Repeat steps 2-4, focusing on different entities and aspects.
 6.  **Synthesize:**  Finally, summarize the findings, addressing contradictions.
 Example:
 {"tool": "search_web", "parameters": {"query": "Eiffel Tower location"}}
 Output:
 def deep_research(prompt):
     task_description = "You are an advanced research assistant. Use available tools iteratively, focus on different aspects, follow promising leads, critically evaluate your findings, and build up a comprehensive understanding. Utilize the FAISS index to avoid redundant searches and build a persistent knowledge base."
     research_data = load_research_data()
+    paper_summaries = load_paper_summaries()  # Load paper summaries
     context = research_data.get('context', [])
     all_insights = research_data.get('all_insights', [])
     entity_specific_insights = research_data.get('entity_specific_insights', {})
         logger.info("Initialized a fresh FAISS Index")
     key_entities_with_descriptions = tool_extract_key_entities(prompt=prompt)
+    key_entities = [e.split(":")[0].strip() for e in key_entities_with_descriptions] # Extract just entity names
     if key_entities:
         context.append(f"Identified key entities: {key_entities}")
         intermediate_output += f"Identified key entities for focused research: {key_entities_with_descriptions}\n"
+    # Initialize progress tracking for each entity.
     entity_progress = {entity: {'queries': [], 'insights': []} for entity in key_entities}
+    entity_progress['general'] = {'queries': [], 'insights': []}  # For general, non-entity-specific searches
     for entity in key_entities + ['general']:
+        if entity in research_data:  # Load existing progress
             entity_progress[entity]['queries'] = research_data[entity]['queries']
             entity_progress[entity]['insights'] = research_data[entity]['insights']
     if not focus_areas:  # Corrected placement: outside the loop
         initial_focus_areas = tool_identify_focus_areas(prompt=prompt)
         research_plan = tool_draft_research_plan(prompt=prompt, entities=key_entities, focus_areas=initial_focus_areas)
+        context.append(f"Initial Research Plan: {research_plan[:200]}...") # Add plan to context
         intermediate_output += f"Initial Research Plan:\n{research_plan}\n\n"
         focus_areas = initial_focus_areas
     for i in range(MAX_ITERATIONS):
+        # Entity-focused iteration strategy
+        if key_entities and i > 0:  # Cycle through entities *after* initial setup
+            entities_to_process = key_entities + ['general']  # Include 'general' for broad searches
             current_entity = entities_to_process[i % len(entities_to_process)]
         else:
+            current_entity = 'general'  # Start with general research.
         context.append(f"Current focus: {current_entity}")
+        # FAISS Retrieval
+        if i > 0:  # Use FAISS *after* the first iteration (once we have data)
             faiss_results_indices = search_faiss_index(prompt if current_entity == 'general' else f"{prompt} {current_entity}")
             faiss_context = []
             for idx in faiss_results_indices:
+                if idx < len(all_insights):  # Check index bounds
                     faiss_context.append(f"Previously found insight: {all_insights[idx]}")
             if faiss_context:
+                context.extend(faiss_context) # Add FAISS context
                 intermediate_output += f"Iteration {i+1} - Retrieved {len(faiss_context)} relevant items from FAISS index.\n"
+        if i == 0: #Initial broad search
             initial_query = tool_generate_search_query(prompt=prompt)
             if initial_query:
                 previous_queries.append(initial_query)
                 previous_queries.append(entity_query)
                 entity_progress[current_entity]['queries'].append(entity_query)
                 with ThreadPoolExecutor(max_workers=5) as executor:
                     futures = [
                         executor.submit(tool_search_web, query=entity_query, num_results=NUM_RESULTS//2),
                     for future in as_completed(futures):
                         search_results.extend(future.result())
                 filtered_search_results = filter_results(search_results,
                                                         f"{prompt} {current_entity}",
+                                                        previous_snippets=seen_snippets) # Pass existing snippets
                 if filtered_search_results:
                     context.append(f"Entity Search for {current_entity}: {len(filtered_search_results)} results")
                     entity_reasoning = tool_reason(
                         prompt=f"{prompt} focusing on {current_entity}",
                         search_results=filtered_search_results,
+                        reasoning_context=entity_progress[current_entity]['insights'], # Use entity-specific context
                         focus_areas=focus_areas
                     )
         try:
             response_text = llm_response["generated_text"].strip()
+            response_json = json.loads(response_text)  # Parse the JSON response.
             intermediate_output += f"Iteration {i+1} - Focus: {current_entity} - Action: {response_text}\n"
         except json.JSONDecodeError:
             intermediate_output += f"Iteration {i+1} - LLM Response (Invalid JSON): {llm_response['generated_text'][:100]}...\n"
+            context.append(f"Invalid JSON: {llm_response['generated_text'][:100]}...") # Add invalid JSON to context
             continue
         tool_name = response_json.get("tool")
         parameters = response_json.get("parameters", {})
+        if not tool_name: #LLM didn't return a tool.  End the process if we are past halfway.
             if all_insights:
                 if i > MAX_ITERATIONS // 2:
                     break
                 result = tool["function"](**parameters)
                 if current_entity != 'general':
+                    entity_progress[current_entity]['queries'].append(result) # Add entity-specific
                 previous_queries.append(result)
                 filtered_result = filter_results(result, search_prompt, previous_snippets=seen_snippets)
+                result = filtered_result  # Work with filtered results
+                if not result and 'query' in parameters: # Add query to failures if nothing returned.
                     failed_queries.append(parameters['query'])
             elif tool_name == "reason":
+                # Ensure correct reasoning context is passed.
                 if current_entity != 'general' and 'reasoning_context' not in parameters:
                     parameters['reasoning_context'] = entity_progress[current_entity]['insights']
                 elif 'reasoning_context' not in parameters:
                         parameters['prompt'] = prompt
                 if 'search_results' not in parameters:
+                    parameters['search_results'] = [] #Avoid errors if no search results.
+                if 'focus_areas' not in parameters and focus_areas: # Avoid overwriting focus_areas if already set
                     parameters['focus_areas'] = focus_areas
                 result = tool["function"](**parameters)
                 if current_entity != 'general':
                     entity_progress[current_entity]['insights'].append(result)
                     if current_entity not in entity_specific_insights:
+                         entity_specific_insights[current_entity] = []
                     entity_specific_insights[current_entity].append(result)
                 else:
+                    reasoning_context.append(result) #Add to general context.
                 add_to_faiss_index(result)
                 all_insights.append(result)
             elif tool_name == "critique_reasoning":
+                if 'previous_critiques' not in parameters: #Pass in the previous critiques.
                     parameters['previous_critiques'] = previous_critiques
                 if all_insights:
                     if 'reasoning_output' not in parameters:
+                        parameters['reasoning_output'] = all_insights[-1]  #Critique the most recent insight.
                     if 'prompt' not in parameters:
                         parameters['prompt'] = prompt
             elif tool_name == "identify_contradictions":
                 result = tool["function"](**parameters)
                 if result:
+                    contradictions = result  # Keep track of contradictions.
                     context.append(f"Identified contradictions: {result}")
             elif tool_name == "identify_focus_areas":
                 result = tool["function"](**parameters)
                 if result:
                     old_focus = set(focus_areas)
+                    focus_areas = result  # Update focus areas
+                    failed_areas.extend([area for area in old_focus if area not in result])  #Track failed areas
                     context.append(f"New focus areas: {result}")
             elif tool_name == "extract_article":
                 result = tool["function"](**parameters)
                 if result:
                     context.append(f"Extracted article content from {parameters['url']}: {result[:200]}...")
+                    # Reason specifically about the extracted article.
                     reasoning_about_article = tool_reason(prompt=prompt, search_results=[{"title": "Extracted Article", "snippet": result, "url": parameters['url']}])
                     if reasoning_about_article:
                         all_insights.append(reasoning_about_article)
                         add_to_faiss_index(reasoning_about_article)
+            elif tool_name == "summarize_paper":
+                result = tool["function"](**parameters)
+                if result:
+                    paper_summaries[parameters['paper_text'][:100]] = result  # Store by a snippet of the text
+                    save_paper_summaries(paper_summaries)
+                    context.append(f"Summarized paper: {result[:200]}...")
+                    add_to_faiss_index(result) # Add the summary itself to FAISS.
+                    all_insights.append(result) #Add summary to insights for later summarization.
             elif tool_name == "meta_analyze":
                 if 'entity_insights' not in parameters:
                     parameters['prompt'] = prompt
                 result = tool["function"](**parameters)
                 if result:
+                    all_insights.append(result)  # Add meta-analysis to overall insights.
                     context.append(f"Meta-analysis across entities: {result[:200]}...")
                     add_to_faiss_index(result)
             elif tool_name == "draft_research_plan":
+                result = "Research plan already generated."  # Avoid re-generating.
             else:
                 result = tool["function"](**parameters)
             intermediate_output += f"Iteration {i+1} - Result: {result_str}\n"
+            # Add tool use to context, limit context length
             result_context = result_str
             if len(result_str) > 300:
                 result_context = result_str[:300] + "..."
             intermediate_output += f"Iteration {i+1} - Error: {str(e)}\n"
             continue
+        #Save data
         research_data = {
             'context': context,
             'all_insights': all_insights,
             'research_session_id': research_session_id
         }
         for entity in entity_progress:
+             research_data[entity] = entity_progress[entity] #save the individual entity
         save_research_data(research_data, index)
+    # Perform meta-analysis *before* final summarization, if we have enough entity-specific insights.
     if len(entity_specific_insights) > 1 and len(all_insights) > 2:
         meta_analysis = tool_meta_analyze(entity_insights=entity_specific_insights, prompt=prompt)
         if meta_analysis:
             all_insights.append(meta_analysis)
             intermediate_output += f"Final Meta-Analysis: {meta_analysis[:500]}...\n"
+            add_to_faiss_index(meta_analysis)  # Add to FAISS
     if all_insights:
+        final_result = tool_summarize(all_insights, prompt, contradictions) # Summarize all insights.
     else:
         final_result = "Could not find meaningful information despite multiple attempts."
     full_output = f"**Research Prompt:** {prompt}\n\n"
     if key_entities_with_descriptions: