# NOTE: Hugging Face web-page residue was captured here during export
# ("mgbam's picture / Update app.py / bd23f77 verified / raw / history
# blame / 10.3 kB"); preserved as a comment so the file parses as Python.
"""
AI Research Assistant
"""
# ------------------------------
# Core Imports & Configuration
# ------------------------------
import os
import re
import time
import chromadb
import requests
import streamlit as st
from typing import Sequence, Tuple
from typing_extensions import TypedDict, Annotated
from langchain_core.messages import HumanMessage, AIMessage
from langchain.text_splitter import RecursiveCharacterTextSplitter
from langchain_community.vectorstores import Chroma
from langchain.tools.retriever import create_retriever_tool
from langgraph.graph import END, StateGraph
from langgraph.prebuilt import ToolNode
from langgraph.graph.message import add_messages
from chromadb.config import Settings
from langchain_openai import OpenAIEmbeddings
# ------------------------------
# Type Definitions
# ------------------------------
class AgentState(TypedDict):
    """Shared LangGraph state: the running conversation message list.

    The `add_messages` reducer makes LangGraph append messages returned
    by each node instead of replacing the existing list.
    """
    messages: Annotated[Sequence[AIMessage | HumanMessage], add_messages]
# ------------------------------
# Configuration & Constants
# ------------------------------
class Config:
    """Central configuration, read once at import time."""
    # DeepSeek API key; presence is validated in the __main__ guard.
    API_KEY = os.environ.get("DEEPSEEK_API_KEY")
    # On-disk directory for the persistent Chroma database.
    CHROMA_PATH = "chroma_db"
    # Passed verbatim to RecursiveCharacterTextSplitter(**...).
    TEXT_SPLITTER_CONFIG = {
        "chunk_size": 512,
        "chunk_overlap": 128,
        "separators": ["\n\n", "\n", ". ", "! ", "? "]
    }
# ------------------------------
# Core System Components
# ------------------------------
class ResearchAssistant:
    """Retrieval-augmented research assistant.

    Wires together: OpenAI embeddings, two persistent Chroma collections
    ("research" and "development"), retriever tools, and a LangGraph
    workflow of analyze -> (optional) retrieve -> synthesize. LLM calls go
    to the DeepSeek chat-completions API via `requests`.
    """

    # Single chat-completions endpoint shared by all DeepSeek calls.
    DEEPSEEK_URL = "https://api.deepseek.com/v1/chat/completions"

    def __init__(self):
        self.embeddings = OpenAIEmbeddings(model="text-embedding-3-large")
        self.vector_stores = self._init_vector_stores()
        self.tools = self._create_tools()
        self.workflow = self._build_workflow()

    def _init_vector_stores(self) -> Tuple[Chroma, Chroma]:
        """Build the (research, development) Chroma stores from seed docs.

        Returns:
            A 2-tuple of Chroma stores sharing one persistent client.
        """
        splitter = RecursiveCharacterTextSplitter(**Config.TEXT_SPLITTER_CONFIG)
        research_docs = splitter.create_documents([
            "Research Report: New AI Model Achieves 98% Image Recognition Accuracy",
            "Transformers: The New NLP Architecture Standard",
            "Quantum Machine Learning: Emerging Trends and Applications"
        ])
        development_docs = splitter.create_documents([
            "Project A: UI Design Finalized, API Integration Phase",
            "Project B: Feature Testing and Bug Fixes",
            "Product Y: Performance Optimization Pre-Release"
        ])
        # BUG FIX: the original omitted the closing parenthesis of this
        # call, leaving the whole module a SyntaxError.
        client = chromadb.PersistentClient(
            path=Config.CHROMA_PATH,
            settings=Settings(anonymized_telemetry=False),
        )
        return (
            Chroma.from_documents(research_docs, self.embeddings,
                                  client=client, collection_name="research"),
            Chroma.from_documents(development_docs, self.embeddings,
                                  client=client, collection_name="development")
        )

    def _create_tools(self):
        """Create one retriever tool per collection for the ToolNode.

        NOTE(review): `score_threshold` inside plain `search_kwargs` is
        only honored for the similarity-score-threshold search type —
        confirm against the installed langchain version.
        """
        search_kwargs = {"k": 3, "score_threshold": 0.7}
        research_retriever = self.vector_stores[0].as_retriever(
            search_kwargs=dict(search_kwargs)
        )
        development_retriever = self.vector_stores[1].as_retriever(
            search_kwargs=dict(search_kwargs)
        )
        return [
            create_retriever_tool(
                research_retriever,
                "research_db",
                "Access technical research papers and reports"
            ),
            create_retriever_tool(
                development_retriever,
                "development_db",
                "Retrieve project development status updates"
            )
        ]

    def _build_workflow(self):
        """Compile the analyze -> retrieve? -> synthesize state graph."""
        workflow = StateGraph(AgentState)
        workflow.add_node("analyze", self.analyze_query)
        workflow.add_node("retrieve", ToolNode(self.tools))
        workflow.add_node("synthesize", self.synthesize_response)
        workflow.set_entry_point("analyze")
        # Branch on keyword heuristics: retrieval only when it looks useful.
        workflow.add_conditional_edges(
            "analyze",
            self._needs_retrieval,
            {"retrieve": "retrieve", "direct": "synthesize"}
        )
        workflow.add_edge("retrieve", "synthesize")
        workflow.add_edge("synthesize", END)
        return workflow.compile()

    def _needs_retrieval(self, state: AgentState) -> str:
        """Return "retrieve" when the latest message mentions a research/
        development keyword, else "direct" (skip the tool node)."""
        query = state["messages"][-1].content.lower()
        return "retrieve" if any(kw in query for kw in {
            "research", "study", "project", "develop", "trend"
        }) else "direct"

    def _call_deepseek(self, prompt: str, temperature: float, timeout: int) -> str:
        """Send one user-role prompt to DeepSeek and return the reply text.

        Raises:
            requests.HTTPError: on a non-2xx response (via raise_for_status).
            requests.Timeout / requests.RequestException: on network failure.
        """
        response = requests.post(
            self.DEEPSEEK_URL,
            headers={
                "Authorization": f"Bearer {Config.API_KEY}",
                "Content-Type": "application/json"
            },
            json={
                "model": "deepseek-chat",
                "messages": [{"role": "user", "content": prompt}],
                "temperature": temperature
            },
            timeout=timeout
        )
        response.raise_for_status()
        return response.json()["choices"][0]["message"]["content"]

    def analyze_query(self, state: AgentState):
        """Classify the user's query; on failure, return an error message
        as the AI turn so the graph still completes."""
        try:
            user_input = state["messages"][-1].content
            analysis = self._call_deepseek(
                f"""Analyze this query and format as:
CATEGORY: [RESEARCH|DEVELOPMENT|GENERAL]
KEY_TERMS: comma-separated list
{user_input}""",
                temperature=0.3,
                timeout=15
            )
            return {"messages": [AIMessage(content=analysis)]}
        except Exception as e:
            return {"messages": [AIMessage(
                content=f"Analysis Error: {str(e)}. Please rephrase your question."
            )]}

    def synthesize_response(self, state: AgentState):
        """Condense the accumulated messages into a cited final answer;
        errors are surfaced as an AI message rather than raised."""
        try:
            # Feed every prior turn (analysis + any retrieved docs) as context.
            context = "\n".join([msg.content for msg in state["messages"]])
            answer = self._call_deepseek(
                f"""Synthesize this information:
{context}
Include:
1. Key findings
2. Supporting evidence
3. Technical details
4. Potential applications""",
                temperature=0.5,
                timeout=20
            )
            return {"messages": [AIMessage(content=answer)]}
        except Exception as e:
            return {"messages": [AIMessage(
                content=f"Synthesis Error: {str(e)}. Please try again later."
            )]}
# ------------------------------
# Professional UI Interface
# ------------------------------
def main():
    """Render the Streamlit UI and run submitted queries through the
    assistant's LangGraph workflow."""
    st.set_page_config(
        page_title="Research Assistant Pro",
        layout="wide",
        initial_sidebar_state="expanded"
    )
    # Dark theme implementation
    st.markdown("""
    <style>
    .stApp {
        background-color: #0f1114;
        color: #ffffff;
    }
    .stTextInput input, .stTextArea textarea {
        background-color: #1e1e24 !important;
        color: #ffffff !important;
    }
    .stButton>button {
        background: #2563eb;
        transition: all 0.2s;
    }
    .stButton>button:hover {
        background: #1d4ed8;
        transform: scale(1.02);
    }
    .result-card {
        background: #1a1a1f;
        border-radius: 8px;
        padding: 1.5rem;
        margin: 1rem 0;
    }
    </style>
    """, unsafe_allow_html=True)
    # BUG FIX: title emoji was mojibake ("πŸ”" = UTF-8 🔍 decoded as cp1252).
    st.title("🔍 Research Assistant Pro")
    st.write("Advanced AI-Powered Research Analysis")
    col1, col2 = st.columns([1, 2])
    with col1:
        with st.form("query_form"):
            query = st.text_area("Research Query:", height=150,
                                 placeholder="Enter your research question...")
            submitted = st.form_submit_button("Analyze")
        if submitted and query:
            with st.spinner("Processing..."):
                try:
                    # PERF FIX: the original built a fresh ResearchAssistant
                    # (re-embedding every seed document) on each submit;
                    # cache one instance per browser session instead.
                    if "assistant" not in st.session_state:
                        st.session_state.assistant = ResearchAssistant()
                    assistant = st.session_state.assistant
                    result = assistant.workflow.invoke({"messages": [
                        HumanMessage(content=query)
                    ]})
                    with st.expander("Analysis Details", expanded=True):
                        st.markdown(f"""
                        <div class="result-card">
                        {result['messages'][-1].content}
                        </div>
                        """, unsafe_allow_html=True)
                except Exception as e:
                    st.error(f"Processing Error: {str(e)}")
    with col2:
        st.subheader("Knowledge Base")
        with st.expander("Research Documents"):
            st.info("""
            - Advanced Image Recognition Systems
            - Transformer Architecture Analysis
            - Quantum ML Research
            """)
        with st.expander("Development Updates"):
            st.info("""
            - Project A: API Integration Phase
            - Project B: Feature Testing
            - Product Y: Optimization Stage
            """)
if __name__ == "__main__":
if not Config.API_KEY:
st.error("""
πŸ”‘ Configuration Required:
Set DEEPSEEK_API_KEY environment variable
""")
st.stop()
main()