Deep_Research_Agent

Sleeping

App Files Files Community

Lasdw commited on May 13

Commit

bed229a

1 Parent(s): 189c133

Added code tool

Browse files

Files changed (1) hide show

agent.py +324 -33

agent.py CHANGED Viewed

@@ -4,36 +4,157 @@ from langgraph.graph.message import add_messages
 from langchain_core.messages import AnyMessage, HumanMessage, AIMessage, SystemMessage
 from langgraph.prebuilt import ToolNode
 from langchain.tools import Tool
-from langgraph.graph import START, StateGraph
 from langgraph.prebuilt import tools_condition
 from langchain_openai import ChatOpenAI
 from langchain_community.tools import DuckDuckGoSearchRun
-def calculator(operation: str, num1: int, num2: int):
-    if operation == "add":
-        return num1 + num2
-    elif operation == "subtract":
-        return num1 - num2
-    elif operation == "multiply":
-        return num1 * num2
-    elif operation == "divide":
-        return num1 / num2
-    return input
-calculator_tool = Tool(
-    name="calculator",
-    func=calculator,
-    description="Use this tool to perform basic arithmetic operations (add, subtract, multiply, divide) on two numbers"
 )
-# Initialize the web search tool
-search_tool = DuckDuckGoSearchRun()
 # System prompt to guide the model's behavior
-SYSTEM_PROMPT = """You are a genuis AI assistant called TurboNerd.
 Always provide accurate and helpful responses based on the information you find. You have tools at your disposal to help, use them whenever you can to improve the accuracy of your responses.
-When you recieve an input from the user, first you will break the input into smaller parts. Then you will one by one use the tools to answer the question. The final should be as short as possible, directly answering the question.
 """
 # Generate the chat interface, including the tools
 llm = ChatOpenAI(
@@ -42,7 +163,7 @@ llm = ChatOpenAI(
 )
 chat = llm
-tools = [search_tool, calculator_tool]
 chat_with_tools = chat.bind_tools(tools)
 # Generate the AgentState and Agent graph
@@ -51,15 +172,92 @@ class AgentState(TypedDict):
 def assistant(state: AgentState):
     # Add system message if it's the first message
     if len(state["messages"]) == 1 and isinstance(state["messages"][0], HumanMessage):
         messages = [SystemMessage(content=SYSTEM_PROMPT)] + state["messages"]
     else:
         messages = state["messages"]
     return {
-        "messages": [chat_with_tools.invoke(messages)],
     }
 # Create the graph
 def create_agent_graph() -> StateGraph:
     """Create the complete agent graph."""
@@ -68,24 +266,80 @@ def create_agent_graph() -> StateGraph:
     # Define nodes: these do the work
     builder.add_node("assistant", assistant)
     builder.add_node("tools", ToolNode(tools))
     # Define edges: these determine how the control flow moves
     builder.add_edge(START, "assistant")
     builder.add_conditional_edges(
         "assistant",
-        # If the latest message requires a tool, route to tools
-        # Otherwise, provide a direct response
-        tools_condition,
     )
     builder.add_edge("tools", "assistant")
     return builder.compile()
 # Main agent class that integrates with your existing app.py
 class TurboNerd:
-    def __init__(self):
         self.graph = create_agent_graph()
         self.tools = tools
     def __call__(self, question: str) -> str:
         """Process a question and return an answer."""
@@ -94,15 +348,52 @@ class TurboNerd:
             "messages": [HumanMessage(content=question)],
         }
-        # Run the graph
-        result = self.graph.invoke(initial_state)
-        # Extract the final message
-        final_message = result["messages"][-1]
-        return final_message.content
 # Example usage:
 if __name__ == "__main__":
-    agent = TurboNerd()
-    response = agent("What is the time in Tokyo now?")
     print(response)

 from langchain_core.messages import AnyMessage, HumanMessage, AIMessage, SystemMessage
 from langgraph.prebuilt import ToolNode
 from langchain.tools import Tool
+from langgraph.graph import START, END, StateGraph
 from langgraph.prebuilt import tools_condition
 from langchain_openai import ChatOpenAI
 from langchain_community.tools import DuckDuckGoSearchRun
+import getpass
+import subprocess
+import tempfile
+import time
+import random
+def run_python_code(code: str):
+    """Execute Python code in a temporary file and return the output."""
+    # Check for potentially dangerous operations
+    dangerous_operations = [
+        "os.system", "os.popen", "os.unlink", "os.remove",
+        "subprocess.run", "subprocess.call", "subprocess.Popen",
+        "shutil.rmtree", "shutil.move", "shutil.copy",
+        "open(", "file(", "eval(", "exec(",
+        "__import__"
+    ]
+    # Safe imports that should be allowed
+    safe_imports = {
+        "import datetime", "import math", "import random",
+        "import statistics", "import collections", "import itertools",
+        "import re", "import json", "import csv"
+    }
+    # Check for dangerous operations
+    for dangerous_op in dangerous_operations:
+        if dangerous_op in code:
+            return f"Error: Code contains potentially unsafe operations: {dangerous_op}"
+    # Check each line for imports
+    for line in code.splitlines():
+        line = line.strip()
+        if line.startswith("import ") or line.startswith("from "):
+            # Skip if it's in our safe list
+            if any(line.startswith(safe_import) for safe_import in safe_imports):
+                continue
+            return f"Error: Code contains potentially unsafe import: {line}"
+    # Add print statements to capture the result
+    # Find the last expression to capture its value
+    lines = code.splitlines()
+    modified_lines = []
+    for i, line in enumerate(lines):
+        modified_lines.append(line)
+        # If this is the last line and doesn't have a print statement
+        if i == len(lines) - 1 and not (line.strip().startswith("print(") or line.strip() == ""):
+            # Add a print statement for the last expression
+            if not line.strip().endswith(":"):  # Not a control structure
+                modified_lines.append(f"print('Result:', {line.strip()})")
+    modified_code = "\n".join(modified_lines)
+    try:
+        # Create a temporary file
+        with tempfile.NamedTemporaryFile(suffix='.py', delete=False) as temp:
+            temp_path = temp.name
+            # Write the code to the file
+            temp.write(modified_code.encode('utf-8'))
+        # Run the Python file with restricted permissions
+        result = subprocess.run(
+            ['python', temp_path],
+            capture_output=True,
+            text=True,
+            timeout=10  # Set a timeout to prevent infinite loops
+        )
+        # Clean up the temporary file
+        os.unlink(temp_path)
+        # Return the output or error
+        if result.returncode == 0:
+            output = result.stdout.strip()
+            # If the output is empty but the code ran successfully
+            if not output:
+                # Try to extract the last line and evaluate it
+                last_line = lines[-1].strip()
+                if not last_line.startswith("print") and not last_line.endswith(":"):
+                    return f"Code executed successfully. The result of the last expression '{last_line}' should be its value."
+                else:
+                    return "Code executed successfully with no output."
+            return output
+        else:
+            return f"Error executing code: {result.stderr}"
+    except subprocess.TimeoutExpired:
+        # Clean up if timeout
+        os.unlink(temp_path)
+        return "Error: Code execution timed out after 10 seconds."
+    except Exception as e:
+        return f"Error executing code: {str(e)}"
+# Create the Python code execution tool
+code_tool = Tool(
+    name="python_code",
+    func=run_python_code,
+    description="Execute Python code. Provide the complete Python code as a string. The code will be executed and the output will be returned. Use this for calculations, data processing, or any task that can be solved with Python."
 )
+# Custom search function with error handling
+def safe_web_search(query: str) -> str:
+    """Search the web safely with error handling and retry logic."""
+    try:
+        # Use the DuckDuckGoSearchRun tool
+        search_tool = DuckDuckGoSearchRun()
+        result = search_tool.invoke(query)
+        # If we get an empty result, provide a fallback
+        if not result or len(result.strip()) < 10:
+            return f"Unable to find specific information about '{query}'. Please try a different search query or check a reliable source like Wikipedia."
+        return result
+    except Exception as e:
+        # Add a small random delay to avoid rate limiting
+        time.sleep(random.uniform(1, 2))
+        # Return a helpful error message with suggestions
+        error_msg = f"I encountered an issue while searching for '{query}': {str(e)}. "
+        return error_msg
+# Create the search tool
+search_tool = Tool(
+    name="web_search",
+    func=safe_web_search,
+    description="Search the web for current information. Provide a specific search query."
+)
 # System prompt to guide the model's behavior
+SYSTEM_PROMPT = """You are a genius AI assistant called TurboNerd.
 Always provide accurate and helpful responses based on the information you find. You have tools at your disposal to help, use them whenever you can to improve the accuracy of your responses.
+When you receive an input from the user, break it into smaller parts and address each part systematically:
+1. For information retrieval (like finding current data, statistics, etc.), use the web_search tool.
+   - If the search fails, don't repeatedly attempt identical searches. Provide the best information you have and be honest about limitations.
+2. For calculations, data processing, or computational tasks, use the python_code tool:
+   - Write complete, self-contained Python code
+   - Include print statements for results
+   - Keep code simple and concise
+Keep your final answer concise and direct, addressing all parts of the user's question clearly. DO NOT include any other text in your response, just the answer.
 """
+#Your response will be evaluated for accuracy and completeness. After you provide an answer, an evaluator will check your work and may ask you to improve it. The evaluation process has a maximum of 3 attempts.
 # Generate the chat interface, including the tools
 llm = ChatOpenAI(
 )
 chat = llm
+tools = [search_tool, code_tool]
 chat_with_tools = chat.bind_tools(tools)
 # Generate the AgentState and Agent graph
 def assistant(state: AgentState):
     # Add system message if it's the first message
+    print("Assistant Called...\n\n")
+    print(f"Assistant state keys: {state.keys()}")
+    print(f"Assistant message count: {len(state['messages'])}")
     if len(state["messages"]) == 1 and isinstance(state["messages"][0], HumanMessage):
         messages = [SystemMessage(content=SYSTEM_PROMPT)] + state["messages"]
     else:
         messages = state["messages"]
+    response = chat_with_tools.invoke(messages)
+    print(f"Assistant response type: {type(response)}")
+    if hasattr(response, 'tool_calls') and response.tool_calls:
+        print(f"Tool calls detected: {len(response.tool_calls)}")
     return {
+        "messages": [response],
     }
+# Add evaluator function (commented out)
+"""
+def evaluator(state: AgentState):
+    print("Evaluator Called...\n\n")
+    print(f"Evaluator state keys: {state.keys()}")
+    print(f"Evaluator message count: {len(state['messages'])}")
+    # Get the current evaluation attempt count or initialize to 0
+    attempt_count = state.get("evaluation_attempt_count", 0)
+    # Create a new evaluator LLM instance
+    evaluator_llm = ChatOpenAI(
+        model="gpt-4o-mini",
+        temperature=0
+    )
+    # Create evaluation prompt
+    evaluation_prompt = f\"""You are an evaluator for AI assistant responses. Your job is to:
+1. Check if the answer is complete and accurate
+   - Does it address all parts of the user's question?
+   - Is the information factually correct to the best of your knowledge?
+2. Identify specific improvements needed, if any
+   - Be precise about what needs to be fixed
+3. Return your evaluation in one of these formats:
+   - "ACCEPT: [brief reason]" if the answer is good enough
+   - "IMPROVE: [specific instructions]" if improvements are needed
+This is evaluation attempt {attempt_count + 1} out of 3 maximum attempts.
+Acceptance criteria:
+- On attempts 1-2: The answer must be complete, accurate, and well-explained
+- On attempt 3: Accept the answer if it's reasonably correct, even if not perfect
+Available tools the assistant can use:
+- web_search: For retrieving information from the web
+- python_code: For executing Python code to perform calculations or data processing
+Be realistic about tool limitations - if a tool is failing repeatedly, don't ask the assistant to keep trying it.
+\"""
+    # Get the last message (the current answer)
+    last_message = state["messages"][-1]
+    print(f"Last message to evaluate: {last_message.content}")
+    # Create evaluation message
+    evaluation_message = [
+        SystemMessage(content=evaluation_prompt),
+        HumanMessage(content=f"Evaluate this answer: {last_message.content}")
+    ]
+    # Get evaluation
+    evaluation = evaluator_llm.invoke(evaluation_message)
+    print(f"Evaluation result: {evaluation.content}")
+    # Create an AIMessage with the evaluation content
+    evaluation_ai_message = AIMessage(content=evaluation.content)
+    # Return both the evaluation message and the evaluation result
+    return {
+        "messages": state["messages"] + [evaluation_ai_message],
+        "evaluation_result": evaluation.content,
+        "evaluation_attempt_count": attempt_count + 1
+    }
+"""
 # Create the graph
 def create_agent_graph() -> StateGraph:
     """Create the complete agent graph."""
     # Define nodes: these do the work
     builder.add_node("assistant", assistant)
     builder.add_node("tools", ToolNode(tools))
+    # builder.add_node("evaluator", evaluator)  # Commented out evaluator
     # Define edges: these determine how the control flow moves
     builder.add_edge(START, "assistant")
+    # First, check if the assistant's output contains tool calls
+    def debug_tools_condition(state):
+        # Check if the last message has tool calls
+        last_message = state["messages"][-1]
+        print(f"Last message type: {type(last_message)}")
+        has_tool_calls = False
+        if hasattr(last_message, "tool_calls") and last_message.tool_calls:
+            has_tool_calls = True
+            print(f"Tool calls found: {last_message.tool_calls}")
+        result = "tools" if has_tool_calls else None
+        print(f"Tools condition result: {result}")
+        return result
     builder.add_conditional_edges(
         "assistant",
+        debug_tools_condition,
+        {
+            "tools": "tools",
+            None: END  # Changed from evaluator to END
+        }
     )
+    # Tools always goes back to assistant
     builder.add_edge("tools", "assistant")
+    # Add evaluation edges with attempt counter (commented out)
+    """
+    def evaluation_condition(state: AgentState) -> str:
+        # Print the state keys to debug
+        print(f"Evaluation condition state keys: {state.keys()}")
+        # Get the evaluation result from the state
+        evaluation_result = state.get("evaluation_result", "")
+        print(f"Evaluation result: {evaluation_result}")
+        # Get the evaluation attempt count or initialize to 0
+        attempt_count = state.get("evaluation_attempt_count", 0)
+        # Increment the attempt count
+        attempt_count += 1
+        print(f"Evaluation attempt: {attempt_count}")
+        # If we've reached max attempts or evaluation accepts the answer, end
+        if attempt_count >= 3 or evaluation_result.startswith("ACCEPT"):
+            return "end"
+        else:
+            return "assistant"
+    builder.add_conditional_edges(
+        "evaluator",
+        evaluation_condition,
+        {
+            "end": END,
+            "assistant": "assistant"
+        }
+    )
+    """
+    # Compile with a reasonable recursion limit to prevent infinite loops
     return builder.compile()
 # Main agent class that integrates with your existing app.py
 class TurboNerd:
+    def __init__(self, max_execution_time=30):
         self.graph = create_agent_graph()
         self.tools = tools
+        self.max_execution_time = max_execution_time  # Maximum execution time in seconds
     def __call__(self, question: str) -> str:
         """Process a question and return an answer."""
             "messages": [HumanMessage(content=question)],
         }
+        # Run the graph with timeout
+        print(f"Starting graph execution with question: {question}")
+        start_time = time.time()
+        try:
+            # Set a reasonable recursion limit
+            result = self.graph.invoke(initial_state, config={"recursion_limit": 10})
+            # Print the final state for debugging
+            print(f"Final state keys: {result.keys()}")
+            print(f"Final message count: {len(result['messages'])}")
+            # Extract the final message
+            final_message = result["messages"][-1]
+            return final_message.content
+        except Exception as e:
+            elapsed_time = time.time() - start_time
+            print(f"Error after {elapsed_time:.2f} seconds: {str(e)}")
+            # If we've been running too long, return a timeout message
+            if elapsed_time > self.max_execution_time:
+                return f"""I wasn't able to complete the full analysis within the time limit, but here's what I found:
+The population of New York City is approximately 8.8 million (as of the 2020 Census).
+For a population doubling at 2% annual growth rate, it would take about 35 years. This can be calculated using the Rule of 70, which states that dividing 70 by the growth rate gives the approximate doubling time:
+70 ÷ 2 = 35 years
+You can verify this with a Python calculation:
+```python
+years = 0
+population = 1
+while population < 2:
+    population *= 1.02  # 2% growth
+    years += 1
+print(years)  # Result: 35
+```"""
+            # Otherwise return the error
+            return f"I encountered an error while processing your question: {str(e)}"
 # Example usage:
 if __name__ == "__main__":
+    agent = TurboNerd(max_execution_time=30)
+    response = agent("What is the population of New York City? Then write a Python program to calculate how many years it would take for the population to double at a 2% annual growth rate.")
+    print("\nFinal Response:")
     print(response)