dromerosm committed on
Commit
7153d1f
·
1 Parent(s): b68285a

Update .gitignore, requirements, and README for project enhancements

Browse files
Files changed (7) hide show
  1. .gitignore +2 -0
  2. README.md +2 -2
  3. __pycache__/config.cpython-310.pyc +0 -0
  4. app.py +548 -114
  5. config.py +23 -0
  6. outputs/output.md +1 -0
  7. requirements.txt +2 -2
.gitignore ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ .env
2
+ .conda
README.md CHANGED
@@ -1,10 +1,10 @@
1
  ---
2
- title: Crewai, Groq, Llama3 and Cohere for Research
3
  emoji: 📈
4
  colorFrom: blue
5
  colorTo: blue
6
  sdk: gradio
7
- sdk_version: 4.28.3
8
  app_file: app.py
9
  pinned: false
10
  license: cc-by-nc-nd-4.0
 
1
  ---
2
+ title: Crewai Multiagent Research Tool
3
  emoji: 📈
4
  colorFrom: blue
5
  colorTo: blue
6
  sdk: gradio
7
+ sdk_version: 5.0.0
8
  app_file: app.py
9
  pinned: false
10
  license: cc-by-nc-nd-4.0
__pycache__/config.cpython-310.pyc ADDED
Binary file (458 Bytes). View file
 
app.py CHANGED
@@ -1,201 +1,635 @@
 
 
1
  import os
2
  import gradio as gr
3
- import cohere
4
  import requests
5
- from crewai import Agent, Task, Crew, Process
6
 
7
- from langchain_groq import ChatGroq
8
- from langchain_cohere import ChatCohere
9
 
10
- from langchain_community.tools import DuckDuckGoSearchRun, DuckDuckGoSearchResults
11
- from crewai_tools import tool, SeleniumScrapingTool, ScrapeWebsiteTool
12
  from duckduckgo_search import DDGS
13
-
14
  from newspaper import Article
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
15
 
16
- # Ensure essential environment variables are set
17
- cohere_api_key = os.getenv('COHERE_API_KEY')
18
- if not cohere_api_key:
19
- raise EnvironmentError("COHERE_API_KEY is not set in environment variables")
20
- groq_api_key = os.getenv("GROQ_API_KEY")
21
- if not groq_api_key:
22
- raise EnvironmentError("GROQ_API_KEY is not set in environment variables")
23
 
24
- # Initialize API clients
25
- co = cohere.Client(cohere_api_key)
26
- print("client ok")
 
 
 
 
 
 
 
 
 
 
 
 
27
 
28
  def fetch_content(url):
 
 
 
 
29
  try:
30
- article = Article(url)
31
- article.download()
32
- article.parse()
33
- return article.text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
34
  except Exception as e:
35
- print("ERROR: " + str(e))
36
- return f"Error fetching content: {e}"
37
 
38
- # Define the DuckDuckGoSearch tool
39
  @tool('DuckDuckGoSearchResults')
40
- def search_results(search_query: str) -> dict:
41
  """
42
- Performs a web search to gather and return a collection of search results.
43
- This tool automates the retrieval of web-based information related to a specified query.
44
- Args:
45
- - search_query (str): The query string that specifies the information to be searched on the web. This should be a clear and concise expression of the user's information needs.
46
- Returns:
47
- - list: A list of dictionaries, where each dictionary represents a search result. Each dictionary includes 'snippet' of the page and the 'link' with the url linking to it.
48
  """
49
- results = DDGS().text(search_query, max_results=5, timelimit='m')
50
- results_list = [{"title": result['title'], "snippet": result['body'], "link": result['href']} for result in results]
51
- return results_list
 
 
 
 
 
 
52
 
53
  @tool('WebScrapper')
54
  def web_scrapper(url: str, topic: str) -> str:
55
  """
56
- A tool designed to extract and read the content of a specified link and generate a summary on a specific topic.
57
- It is capable of handling various types of web pages by making HTTP requests and parsing the received HTML content.
58
- This tool is particularly useful for web scraping tasks, data collection, or extracting specific information from websites.
59
-
60
- Args:
61
- - url (str): The URL from which to scrape content.
62
- - topic (str): The specific topic on which to generate a summary.
63
- Returns:
64
- - summary (str): summary of the url on the topic
65
  """
66
- # Scrape content from the specified URL
67
- content = fetch_content(url)
68
-
69
- # Prepare the prompt for generating the summary
70
- prompt = f"Generate a summary of the following content on the topic ## {topic} ### \n\nCONTENT:\n\n" + content
71
-
72
- # Generate the summary using Cohere
73
- response = co.chat(
74
- model='command-r-plus',
75
- message=prompt,
76
- temperature=0.4,
77
- max_tokens=1000,
78
- chat_history=[],
79
- prompt_truncation='AUTO'
80
- )
81
-
82
- summary_response = f"""###
83
- Summary:
84
- {response.text}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
85
 
86
- URL: {url}
87
- ###
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
88
  """
89
-
90
- return summary_response
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
91
 
92
- def kickoff_crew(topic: str, model_choice: str) -> str:
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
93
  try:
94
-
95
- # Initialize the large language models based on user selection
96
- groq_llm = ChatGroq(temperature=0, groq_api_key=groq_api_key, model_name="groq/" + model_choice)
97
-
98
- # Define Agents with Groq LLM
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
99
  researcher = Agent(
100
  role='Researcher',
101
- goal='Search and Collect detailed information on topic ## {topic} ##',
102
  tools=[search_results, web_scrapper],
103
- llm=groq_llm, # Assigning the LLM here
104
  backstory=(
105
- "You are a meticulous researcher, skilled at navigating vast amounts of information to extract essential insights on any given topic. "
106
- "Your dedication to detail ensures the reliability and thoroughness of your findings. "
107
- "With a strategic approach, you carefully analyze and document data, aiming to provide accurate and trustworthy results."
108
  ),
109
  allow_delegation=False,
110
  max_iter=15,
111
- max_rpm=20,
112
- memory=True,
113
  verbose=True
114
  )
115
 
116
-
117
  editor = Agent(
118
  role='Editor',
119
- goal='Compile and refine the information into a comprehensive report on topic ## {topic} ##',
120
- llm=groq_llm, # Assigning the LLM here
121
  backstory=(
122
  "As an expert editor, you specialize in transforming raw data into clear, engaging reports. "
123
- "Your strong command of language and attention to detail ensure that each report not only conveys essential insights "
124
- "but is also easily understandable and appealing to diverse audiences. "
125
  ),
126
  allow_delegation=False,
127
  max_iter=5,
128
- max_rpm=15,
129
- memory=True,
130
  verbose=True
131
  )
132
 
133
  # Define Tasks
134
  research_task = Task(
135
  description=(
 
136
  "Use the DuckDuckGoSearchResults tool to collect initial search snippets on ## {topic} ##. "
137
- "If more detailed searches are required, generate and execute new queries related to ## {topic} ##. "
138
- "Subsequently, employ the WebScrapper tool to delve deeper into significant URLs identified from the snippets, extracting further information and insights. "
139
- "Compile these findings into a preliminary draft, documenting all relevant sources, titles, and links associated with the topic. "
140
- "Ensure high accuracy throughout the process and avoid any fabrication or misrepresentation of information."
 
141
  ),
142
  expected_output=(
143
- "A structured draft report about the topic, featuring an introduction, a detailed main body organized by different aspects of the topic, and a conclusion. "
144
- "Each section should properly cite sources, providing a thorough overview of the information gathered."
145
  ),
146
  agent=researcher
147
  )
148
 
149
-
150
  edit_task = Task(
151
  description=(
152
- "Review and refine the initial draft report from the research task. Organize the content logically to enhance information flow. "
153
- "Verify the accuracy of all data, correct discrepancies, and update information to ensure it reflects current knowledge and is well-supported by sources. "
154
- "Improve the report’s readability by enhancing language clarity, adjusting sentence structures, and maintaining a consistent tone. "
155
- "Include a section listing all sources used, formatted as bullet points following this template: "
156
- "- title: url'."
157
  ),
158
  expected_output=(
159
- "A polished, comprehensive report on topic ## {topic} ##, with a clear, professional narrative that accurately reflects the research findings. "
160
- "The report should include an introduction, an extensive discussion section, a concise conclusion, and a well-organized source list. "
161
- "Ensure the document is grammatically correct and ready for publication or presentation."
162
  ),
163
  agent=editor,
164
  context=[research_task]
165
  )
166
 
167
- # Forming the Crew
168
  crew = Crew(
169
  agents=[researcher, editor],
170
  tasks=[research_task, edit_task],
171
- process=Process.sequential,
172
  )
173
 
174
- # Kick-off the research process
175
  result = crew.kickoff(inputs={'topic': topic})
 
 
 
 
 
176
  if not isinstance(result, str):
177
  result = str(result)
 
 
 
 
178
  return result
179
  except Exception as e:
180
- return f"Error: {str(e)}"
 
181
 
182
  def main():
183
  """Set up the Gradio interface for the CrewAI Research Tool."""
 
 
 
 
 
 
 
 
 
 
184
  with gr.Blocks() as demo:
185
- gr.Markdown("## CrewAI Research Tool")
186
- topic_input = gr.Textbox(label="Enter Topic", placeholder="Type here...")
187
- model_choice = gr.Radio(choices=["mixtral-8x7b-32768", "llama-3.2-1b-preview", 'llama-3.2-3b-preview', 'llama-3.3-70b-versatile'], label="Choose Model")
188
- submit_button = gr.Button("Start Research")
189
- output = gr.Markdown(label="Result")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
190
 
191
  submit_button.click(
192
- fn=kickoff_crew,
193
- inputs=[topic_input, model_choice],
194
- outputs=output
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
195
  )
196
 
197
- # demo.launch(debug=True)
198
  demo.queue(api_open=False, max_size=3).launch()
199
 
 
200
  if __name__ == "__main__":
201
  main()
 
1
+ from config import OPENAI_MODELS, COHERE_MODELS, GROQ_MODELS, MAX_TOKENS_BASE, MAX_TOKENS_ADVANCED
2
+
3
  import os
4
  import gradio as gr
 
5
  import requests
6
+ import logging
7
 
8
+ from openai import AzureOpenAI, OpenAI
9
+ from cohere import ClientV2
10
 
11
+ from crewai import Agent, Task, Crew, Process, LLM
12
+ from crewai_tools import tool
13
  from duckduckgo_search import DDGS
 
14
  from newspaper import Article
15
+ import fitz # PyMuPDF
16
+ from io import BytesIO, StringIO
17
+ import sys
18
+
19
+ import threading
20
+ import queue
21
+ import time
22
+
23
+ # Basic logger configuration. This module-level logger is used by the tool
+ # helpers below; setup_logging() (further down) builds a stdout-bound variant.
+ logger = logging.getLogger(__name__)
+ logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
26
+
27
def setup_logging():
    """Configure and return the module logger, replacing any prior handlers.

    The logger is set to INFO level and writes timestamped records to
    standard output so they appear in the captured verbose stream.
    """
    log = logging.getLogger(__name__)
    log.setLevel(logging.INFO)

    # Drop handlers left over from earlier calls so records are not duplicated.
    while log.handlers:
        log.handlers.pop()

    # Route records to stdout with a compact "time | LEVEL | message" layout.
    stream_handler = logging.StreamHandler(sys.stdout)
    stream_handler.setFormatter(
        logging.Formatter('%(asctime)s | %(levelname)-8s | %(message)s', datefmt='%H:%M:%S')
    )
    log.addHandler(stream_handler)

    return log
43
+
44
+ # Global variables shared between the Gradio callbacks and the tools.
+ TOKENS_SUMMARIZATION = 0  # tokens consumed by WebScrapper summarization calls; reset per run
+ MODEL_CHOICE = "openai"  # provider selected in the UI; overwritten by kickoff_crew
47
+
48
def export_to_markdown(result):
    """Export the final report to ``outputs/output.md``.

    Args:
        result: Markdown text to persist (coerced to ``str`` if needed).

    Returns:
        The written file path on success, or an ``"Error exporting: ..."``
        message string on failure so the Gradio file output shows something
        meaningful instead of raising.
    """
    output_path = "outputs/output.md"
    try:
        # Ensure the target directory exists: the repository may be checked
        # out without the outputs/ folder, which made the original open() fail.
        os.makedirs(os.path.dirname(output_path), exist_ok=True)
        with open(output_path, "w", encoding="utf-8") as file:
            file.write(str(result))
        return output_path
    except Exception as e:
        logger.error("Error exporting to markdown: %s", str(e))
        return f"Error exporting: {e}"
57
 
58
def fetch_content(url):
    """
    Fetch the content from a URL, handling either PDFs or normal web articles.

    - url: The URL to fetch the content from.

    Returns the extracted plain text on success, or an error-message string on
    failure (callers treat the return value as text either way).
    """
    try:
        # HEAD request to check content type without downloading the body.
        response = requests.head(url, allow_redirects=True, timeout=10)
        content_type = response.headers.get('Content-Type', '').lower()

        if 'application/pdf' in content_type:
            # The URL points to a PDF; download and extract text page by page.
            pdf_response = requests.get(url, stream=True, timeout=10)
            pdf_response.raise_for_status()

            pdf_file = BytesIO(pdf_response.content)
            with fitz.open(stream=pdf_file, filetype="pdf") as doc:
                text = ""
                for page_num, page in enumerate(doc, start=1):
                    page_text = page.get_text()
                    if page_text:
                        text += page_text
                    else:
                        # Likely a scanned/image-only page with no text layer.
                        logger.warning(f"Unable to extract text from page {page_num} of the PDF.")
                return text.strip()
        else:
            # Not a PDF; use newspaper3k’s Article to extract text
            article = Article(url)
            article.download()
            article.parse()
            return article.text
    except requests.exceptions.RequestException as req_err:
        logger.error("Error in the HTTP request: %s", str(req_err))
        return f"Error in the HTTP request: {req_err}"
    except Exception as e:
        logger.error("Error getting the content: %s", str(e))
        return f"Error getting the content: {e}"
95
 
96
# Tools
@tool('DuckDuckGoSearchResults')
def search_results(search_query: str) -> list:
    """
    Performs a web search to gather and return a collection of search results with this structure:
    - title: The title of the search result.
    - snippet: A short snippet of the search result.
    - link: The link to the search result.
    """
    try:
        # timelimit='m' restricts hits to roughly the last month; cap at 5 results.
        results = DDGS().text(search_query, max_results=5, timelimit='m')
        results_list = [{"title": result['title'],
                         "snippet": result['body'],
                         "link": result['href']} for result in results]
        return results_list
    except Exception as e:
        # Return an empty list instead of raising so the agent loop can continue.
        logger.error("Error performing search: %s", str(e))
        return []
114
 
115
@tool('WebScrapper')
def web_scrapper(url: str, topic: str) -> str:
    """
    Extract and read the content of a specified link and generate a summary on a specific topic.

    - url: The URL to extract the content from.
    - topic: String with the topic to generate a summary on.

    Returns an ``<article_summary>`` block with the summary and source URL; on
    failure the block carries an explicit "IGNORE THIS OUTPUT" marker so the
    agent can discard it.
    """
    global TOKENS_SUMMARIZATION

    try:
        content = fetch_content(url)
        prompt = f"""
        # OBJECTIVE
        Generate an in-depth summary of the following CONTENT on the topic "{topic}"

        # INSTRUCTIONS
        - Provide in-depth insights based on the following CONTENT.
        - If the following CONTENT is not directly related to the topic "{topic}", you MUST respond with INVALID CONTENT.
        - Include insights about why the content is important for the topic, possible challenges and advances...
        - The format will be markdown.
        - Avoid making up anything. Every insight MUST be based on the content.

        # CONTENT:
        "{content}"
        """

        context_messages = [
            {
                "role": "system",
                "content": "You are an expert summarizing content for use as context. Focus on the main points."
            },
            {
                "role": "user",
                "content": str(prompt)
            }
        ]

        # Use AzureOpenAI, OpenAI or GROQ_COHERE based on model_choice
        if MODEL_CHOICE == "azure":
            client = AzureOpenAI(
                azure_endpoint=os.getenv('AZURE_API_BASE'),
                azure_deployment=os.getenv('AZURE_DEPLOYMENT_ID'),
                api_key=os.getenv('AZURE_OPENAI_KEY'),
                api_version=os.getenv('AZURE_API_VERSION')
            )
            response = client.chat.completions.create(
                model=os.getenv('AZURE_DEPLOYMENT_ID'),
                messages=context_messages,
                temperature=0.7,
                max_tokens=5000
            )

        elif MODEL_CHOICE == "openai":
            client = OpenAI(api_key=os.getenv('OPENAI_API_KEY'))
            response = client.chat.completions.create(
                model=OPENAI_MODELS['base'],
                messages=context_messages,
                temperature=0.7,
                max_tokens=5000
            )

        elif MODEL_CHOICE == "groq-cohere":
            client = ClientV2(api_key=os.getenv('COHERE_API_KEY'))
            response = client.chat(
                model=COHERE_MODELS['advanced'],
                messages=context_messages,
                max_tokens=1000
            )
        else:
            return "Error: Invalid model choice. Please select 'azure' or 'openai'."

        # BUG FIX: the OpenAI and Cohere SDKs return differently shaped
        # responses. The previous code read response.choices[0].message.content
        # unconditionally, which raises AttributeError for Cohere ClientV2
        # responses and silently turned every groq-cohere summary into the
        # error fallback below.
        if MODEL_CHOICE in ("azure", "openai"):
            summary = response.choices[0].message.content
            TOKENS_SUMMARIZATION += response.usage.total_tokens
        else:  # groq-cohere (Cohere ClientV2 chat response)
            summary = response.message.content[0].text
            TOKENS_SUMMARIZATION += (response.usage.billed_units.input_tokens
                                     + response.usage.billed_units.output_tokens)

        summary_response = f"""<article_summary>
        # SUMMARY:
        {summary}

        # URL: {url}
        </article_summary>
        """
        # include a delay of 10 second to avoid rate limiting of GROQ-Cohere
        if MODEL_CHOICE == "groq-cohere":
            time.sleep(10)

        return summary_response

    except Exception as e:
        logger.error("Error generating summary: %s", str(e))
        return f"""<article_summary>
        # SUMMARY:
        Error generating summary.
        IGNORE THIS OUTPUT.

        # URL: {url}
        </article_summary>
        """
215
+
216
+
217
def capture_verbose_output(
    agent_input,
    model_choice,
    azure_openai_key,
    azure_deployment_id,
    azure_api_base,
    azure_api_version,
    openai_api_key,
    cohere_api_key,
    groq_api_key
):
    """
    This generator captures stdout produced by the multi-agent process in real time,
    updating the Gradio interface with logs, while returning the final result once done.

    Yields (result update, verbose-log update) pairs for the two Gradio outputs.

    NOTE(review): sys.stdout is replaced process-wide while the worker thread
    runs, so concurrent sessions would interleave their logs — looks acceptable
    for a single-user demo; confirm before scaling out.
    """
    # Swap stdout for an in-memory buffer that the polling loop below reads.
    old_stdout = sys.stdout
    mystdout = StringIO()
    sys.stdout = mystdout

    # One-slot container so the worker thread can hand its result back.
    result_container = [None]

    def run_kickoff():
        # Runs the full multi-agent pipeline in a background thread.
        result_container[0] = kickoff_crew(
            topic=agent_input,
            model_choice=model_choice,
            azure_openai_key=azure_openai_key,
            azure_deployment_id=azure_deployment_id,
            azure_api_base=azure_api_base,
            azure_api_version=azure_api_version,
            openai_api_key=openai_api_key,
            cohere_api_key=cohere_api_key,
            groq_api_key=groq_api_key
        )

    kickoff_thread = threading.Thread(target=run_kickoff)
    kickoff_thread.start()

    verbose_output = ""
    result_output = ""

    # Initialize outputs
    yield gr.update(value=result_output), gr.update(value=verbose_output)

    while kickoff_thread.is_alive():
        # Read new output from mystdout; only re-yield when something changed.
        new_output = mystdout.getvalue()
        if new_output != verbose_output:
            verbose_output = new_output
            yield gr.update(value=result_output), gr.update(value=verbose_output)
        time.sleep(0.1)  # polling interval for log updates

    # Once done, restore stdout and emit the final result plus the full log.
    kickoff_thread.join()
    sys.stdout = old_stdout
    result_output = result_container[0]

    verbose_output = mystdout.getvalue()
    yield gr.update(value=result_output), gr.update(value=verbose_output)
275
+
276
+
277
def kickoff_crew(
    topic: str,
    model_choice: str,
    azure_openai_key: str,
    azure_deployment_id: str,
    azure_api_base: str,
    azure_api_version: str,
    openai_api_key: str,
    cohere_api_key: str,
    groq_api_key: str
) -> str:
    """
    Kick off the multi-agent pipeline.

    Builds the provider-specific LLM pair ("base" for the researcher, "advanced"
    for the editor), wires the two agents and their tasks, runs the crew
    sequentially, and returns the final report string with token-usage
    estimates appended. On any failure an "Error ..." string is returned
    instead of raising, so the Gradio UI always gets displayable text.
    """
    try:
        global TOKENS_SUMMARIZATION, MODEL_CHOICE

        # Reset per-run counters and publish the provider for the tools to read.
        TOKENS_SUMMARIZATION = 0
        MODEL_CHOICE = model_choice

        # Basic checks
        if not topic.strip():
            return "Error: The topic cannot be empty. Please provide a valid topic."

        # ---- Define LLMs based on the user-provided inputs ----
        # Initialize the model variables with None
        azure_llm_base = None
        azure_llm_advanced = None
        openai_llm_base = None
        openai_llm_advanced = None
        groq_llm_base = None
        groq_llm_advanced = None

        if model_choice == "azure":
            if not azure_openai_key or not azure_deployment_id or not azure_api_base or not azure_api_version:
                return "Error: Please provide all the required Azure OpenAI API details."
            else:
                # Env vars are read back by the WebScrapper tool's Azure client.
                os.environ['AZURE_API_BASE']=azure_api_base
                os.environ['AZURE_API_VERSION']=azure_api_version
                os.environ['AZURE_DEPLOYMENT_ID']=azure_deployment_id
                os.environ['AZURE_OPENAI_KEY']=azure_openai_key
                # Azure
                azure_llm_base = LLM(
                    temperature=0.3,
                    model=f"azure/{azure_deployment_id}",
                    api_key=azure_openai_key,
                    base_url=azure_api_base,
                    api_version=azure_api_version,
                    max_tokens=4000
                )
                azure_llm_advanced = LLM(
                    temperature=0.6,
                    model=f"azure/{azure_deployment_id}",
                    api_key=azure_openai_key,
                    base_url=azure_api_base,
                    api_version=azure_api_version,
                    max_tokens=10000
                )
        elif model_choice == "openai":
            if not openai_api_key:
                return "Error: Please provide the OpenAI API key."
            else:
                os.environ['OPENAI_API_KEY']=openai_api_key
                # OpenAI
                openai_llm_base = LLM(
                    model=OPENAI_MODELS['base'],
                    api_key=openai_api_key,
                    max_completion_tokens=4000
                )
                openai_llm_advanced = LLM(
                    model=OPENAI_MODELS['advanced'],
                    api_key=openai_api_key,
                    temperature=0.4,
                    max_completion_tokens=10000
                )
        elif model_choice == "groq-cohere":
            if not cohere_api_key or not groq_api_key:
                return "Error: Please provide both the Cohere and GROQ API keys."
            else:
                os.environ['COHERE_API_KEY']=cohere_api_key
                os.environ['GROQ_API_KEY']=groq_api_key
                # GROQ - placeholder examples
                groq_llm_base = LLM(
                    model=GROQ_MODELS['base'],
                    api_key=groq_api_key,
                    temperature=0.3,
                    max_tokens=1000
                )
                groq_llm_advanced = LLM(
                    model=GROQ_MODELS['advanced'],
                    api_key=groq_api_key,
                    temperature=0.6,
                    max_tokens=4000
                )


        # Dictionary grouping the LLMs per provider
        llms = {
            "azure": {
                "base": azure_llm_base,
                "advanced": azure_llm_advanced
            },
            "openai": {
                "base": openai_llm_base,
                "advanced": openai_llm_advanced
            },
            "groq-cohere": {
                "base": groq_llm_base,
                "advanced": groq_llm_advanced
            }
        }

        # Obtain the selected LLM set
        if model_choice not in llms:
            return f"Error: Invalid model choice. Please select from {list(llms.keys())}."

        selected_llm = llms[model_choice]

        # Define Agents
        researcher = Agent(
            role='Researcher',
            goal=f'Search and collect detailed information on topic ## {topic} ##',
            tools=[search_results, web_scrapper],
            llm=selected_llm["base"],
            backstory=(
                "You are a meticulous researcher, skilled at navigating vast amounts of information to extract "
                "essential insights on any given topic. Your dedication to detail ensures the reliability and "
                "thoroughness of your findings."
            ),
            allow_delegation=False,
            max_iter=15,
            # Throttle hard on the free groq-cohere tier to avoid rate limits.
            max_rpm=5 if model_choice == "groq-cohere" else 120,
            verbose=True
        )

        editor = Agent(
            role='Editor',
            goal=f'Compile and refine the information into a comprehensive report on topic ## {topic} ##',
            llm=selected_llm["advanced"],
            backstory=(
                "As an expert editor, you specialize in transforming raw data into clear, engaging reports. "
                "Your strong command of language and attention to detail ensure that each report not only conveys "
                "essential insights but is also easily understandable to diverse audiences."
            ),
            allow_delegation=False,
            max_iter=5,
            max_rpm=10 if model_choice == "groq-cohere" else 120,
            verbose=True
        )

        # Define Tasks
        research_task = Task(
            description=(
                "Be sure to translate the topic into English first. "
                "Use the DuckDuckGoSearchResults tool to collect initial search snippets on ## {topic} ##. "
                "If more detailed searches are required, generate and execute new searches related to ## {topic} ##. "
                "Subsequently, employ the WebScrapper tool to extract information from significant URLs, "
                "extracting further insights. Compile these findings into a preliminary draft, documenting all "
                "relevant sources, titles, and links associated with the topic. "
                "Ensure high accuracy throughout the process and avoid any fabrication of information."
            ),
            expected_output=(
                "A structured draft report about the topic, featuring an introduction, a detailed main body, "
                "and a conclusion. Properly cite sources. Provide a thorough overview of the info gathered."
            ),
            agent=researcher
        )

        edit_task = Task(
            description=(
                "Review and refine the initial draft report from the research task. Organize the content logically. "
                "Elaborate on each section to provide in-depth information and insights. "
                "Verify the accuracy of all data, correct discrepancies, update info to ensure currency, "
                "and maintain a consistent tone. Include a section listing all sources used, formatted as bullet points."
            ),
            expected_output=(
                "A polished, comprehensive report on topic ## {topic} ##, with a clear, professional narrative. "
                "Include an introduction, an extensive discussion, a concise conclusion, and a source list with references."
            ),
            agent=editor,
            context=[research_task]
        )

        # Form the Crew
        crew = Crew(
            agents=[researcher, editor],
            tasks=[research_task, edit_task],
            process=Process.sequential
        )

        # Kick off
        result = crew.kickoff(inputs={'topic': topic})

        # Compute token usage (CrewAI aggregator usage)
        # NOTE(review): accessed before the str() fallback below — assumes
        # crew.kickoff always returns an object with .token_usage; confirm.
        tokens = result.token_usage.total_tokens / 1_000
        tokens_summ = TOKENS_SUMMARIZATION / 1_000

        if not isinstance(result, str):
            result = str(result)

        result += f"\n\n**Estimated tokens (Agents):** {tokens:.5f} k"
        result += f"\n\n**Estimated tokens (Summarization):** {tokens_summ:.5f} k"

        return result
    except Exception as e:
        logger.error("Error in kickoff_crew: %s", str(e))
        return f"Error in kickoff_crew: {str(e)}"
485
 
486
def main():
    """Set up and launch the Gradio interface for the CrewAI Research Tool.

    Builds a two-column layout: provider selection and API-key inputs on the
    left, topic input / result / verbose log on the right. Credential fields
    are shown or hidden dynamically based on the selected provider.
    """

    description_demo = """# Automatic Insights Generation with Multi-Agents (CrewAI)
    - **Multi-agent framework**: CrewAI
    - **Multi-agents**: Two agents, Researcher and Editor, working together to extract information from the internet and compile a report on the topic of choice.
    - **Search tool**: Duck-Duck-Go-Search
    - **Web Retrieval**: Newspaper4k and PDF

    *Note: Groq is currently disabled due to rate limiting issues. Please use Azure or OpenAI for now.*
    """

    with gr.Blocks() as demo:
        gr.Markdown(description_demo)

        with gr.Row():
            with gr.Column(scale=1):

                # Radio: now includes azure / openai / groq-cohere
                model_choice = gr.Radio(
                    choices=["azure", "openai", "groq-cohere"],
                    label="Choose Model",
                    value="openai",
                    interactive=True
                )

                # ------------
                # LLM config inputs (visibility toggled by update_model_choice)
                # ------------
                # Azure
                azure_api_base_input = gr.Textbox(label="Azure API Base (url)", type="password", visible=False, interactive=True)
                azure_deployment_id_input = gr.Textbox(label="Azure Deployment ID (model)", type="password", visible=False, interactive=True)
                azure_openai_key_input = gr.Textbox(label="Azure API Key", type="password", visible=False, interactive=True)
                azure_api_version_input = gr.Textbox(label="Azure API Version", type="text", visible=False, interactive=True)

                # OpenAI (default provider, so visible at start-up)
                openai_api_key_input = gr.Textbox(label="OpenAI API Key", type="password", visible=True, interactive=True)

                # GROQ
                groq_api_key_input = gr.Textbox(label="GROQ API Key", type="password", visible=False, interactive=False)

                # Cohere
                cohere_api_key_input = gr.Textbox(label="Cohere API Key", type="password", visible=False, interactive=False)

                export_button = gr.Button("Export to Markdown", interactive=True)
                file_output = gr.File(label="Download Markdown File")
                credits = gr.Markdown(
                    label="Credits",
                    show_label=True,
                    value="This tool is powered by [CrewAI](https://crewai.com), "
                          "[OpenAI](https://openai.com), "
                          "[Azure OpenAI Services](https://azure.microsoft.com/en-us/products/ai-services/openai-service), "
                          "[Cohere](https://dashboard.cohere.com), and [GROQ](https://console.groq.com/playground).",
                )

            with gr.Column(scale=2):
                topic_input = gr.Textbox(
                    label="Enter Topic",
                    placeholder="Type here the topic of interest...",
                    interactive=True
                )
                submit_button = gr.Button("Start Research", interactive=True)
                # BUG FIX: placeholder typo "insighsts" -> "insights".
                output = gr.Markdown(
                    label="Result",
                    show_copy_button=True,
                    value="The generated insights will appear here...",
                    latex_delimiters=[
                        {"left": "\\[", "right": "\\]", "display": True},
                        {"left": "\\(", "right": "\\)", "display": False},
                    ]
                )

                verbose_output = gr.Textbox(
                    label="Verbose Output",
                    placeholder="Verbose logs will appear here...",
                    lines=10,
                    interactive=False,
                    show_copy_button=True
                )

        # ---------------
        # Dynamic toggling of LLM config boxes
        # ---------------
        def update_model_choice(model):
            """Update visibility of config inputs based on the selected LLM."""
            azure_visibility = False
            openai_visibility = False
            cohere_visibility = False
            groq_visibility = False

            if model == "azure":
                azure_visibility = True
            elif model == "openai":
                openai_visibility = True
            elif model == "groq-cohere":
                cohere_visibility = True
                groq_visibility = True

            return {
                azure_openai_key_input: gr.update(visible=azure_visibility),
                azure_deployment_id_input: gr.update(visible=azure_visibility),
                azure_api_base_input: gr.update(visible=azure_visibility),
                azure_api_version_input: gr.update(visible=azure_visibility),
                openai_api_key_input: gr.update(visible=openai_visibility),
                cohere_api_key_input: gr.update(visible=cohere_visibility),
                groq_api_key_input: gr.update(visible=groq_visibility),
            }

        model_choice.change(
            fn=update_model_choice,
            inputs=[model_choice],
            outputs=[
                azure_openai_key_input,
                azure_deployment_id_input,
                azure_api_base_input,
                azure_api_version_input,
                openai_api_key_input,
                cohere_api_key_input,
                groq_api_key_input
            ]
        )

        # Streams (result, verbose log) updates while the crew runs.
        submit_button.click(
            fn=capture_verbose_output,
            inputs=[
                topic_input,
                model_choice,
                azure_openai_key_input,
                azure_deployment_id_input,
                azure_api_base_input,
                azure_api_version_input,
                openai_api_key_input,
                cohere_api_key_input,
                groq_api_key_input
            ],
            outputs=[output, verbose_output]
        )

        export_button.click(
            fn=export_to_markdown,
            inputs=output,
            outputs=file_output
        )

    demo.queue(api_open=False, max_size=3).launch()
632
 
633
+
634
  if __name__ == "__main__":
635
  main()
config.py ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
# config.py
# Central model-name and token-limit configuration imported by app.py.

# OpenAI models
OPENAI_MODELS = {
    'base': 'gpt-4o-mini',  # OpenAI base (cheaper/faster) model
    'advanced': 'gpt-4o'  # OpenAI advanced model
}

# Cohere models
COHERE_MODELS = {
    'base': 'command-r',  # Cohere base model
    'advanced': 'command-r-plus'  # Cohere advanced model
}

# Groq models
GROQ_MODELS = {
    'base': 'groq/llama-3.2-3b-preview',  # Groq base model
    'advanced': 'groq/llama-3.3-70b-versatile'  # Groq advanced model
}

# Additional configuration
# NOTE(review): app.py imports these but currently hard-codes 4000/10000
# inline when building its LLMs — confirm which is intended to be the source
# of truth.
MAX_TOKENS_BASE = 4000
MAX_TOKENS_ADVANCED = 10000
outputs/output.md ADDED
@@ -0,0 +1 @@
 
 
1
+ The generated insights will appear here...
requirements.txt CHANGED
@@ -1,7 +1,7 @@
 
 
1
  crewai
2
  crewai[tools]
3
- langchain-groq
4
- langchain-cohere
5
  duckduckgo-search
6
  cohere
7
  lxml_html_clean
 
1
+ gradio>=5.0
2
+ pymupdf
3
  crewai
4
  crewai[tools]
 
 
5
  duckduckgo-search
6
  cohere
7
  lxml_html_clean