Commit 48237b2

Deep research example
1 parent f0e1691 commit 48237b2

13 files changed: +554 -3 lines changed

Lines changed: 193 additions & 0 deletions
@@ -0,0 +1,193 @@
# Deep Researcher Agent

![Demo](./assets/demo.png)

A multi-stage AI-powered research workflow agent that automates comprehensive web research, analysis, and report generation using Agno, Scrapegraph, and Nebius AI.

## Features

- **Multi-Stage Research Workflow**: Automated pipeline for searching, analyzing, and reporting
- **Web Scraping**: Advanced data extraction with Scrapegraph
- **AI-Powered Analysis**: Uses Nebius AI for intelligent synthesis
- **Streamlit Web UI**: Modern, interactive interface
- **MCP Server**: Model Context Protocol server for integration
- **Command-Line Support**: Run research tasks directly from the terminal

## How It Works

![Workflow](./assets/workflow.gif)

1. **Searcher**: Finds and extracts high-quality, up-to-date information from the web using Scrapegraph and Nebius AI.
2. **Analyst**: Synthesizes, interprets, and organizes the research findings, highlighting key insights and trends.
3. **Writer**: Crafts a clear, structured, and actionable report, including references and recommendations.

> **Workflow:**
>
> - Input a research topic or question
> - The agent orchestrates web search, analysis, and report writing in sequence
> - Results are presented in a user-friendly format (web or CLI)

## Prerequisites

- Python 3.10+
- [uv](https://github.com/astral-sh/uv) for dependency management
- API keys for [Nebius AI](https://dub.sh/nebius) and [Scrapegraph](https://dub.sh/scrapegraphai)

## Installation

Follow these steps to set up the **Deep Researcher Agent** on your machine:

1. **Install `uv`** (if you don’t have it):

   ```bash
   curl -LsSf https://astral.sh/uv/install.sh | sh
   ```

2. **Clone the repository:**

   ```bash
   git clone https://github.com/Arindam200/awesome-ai-apps.git
   ```

3. **Navigate to the Deep Researcher Agent directory:**

   ```bash
   cd awesome-ai-apps/advance_ai_agents/deep_researcher_agent
   ```

4. **Install all dependencies:**

   ```bash
   uv sync
   ```

## Environment Setup

Create a `.env` file in the project root with your API keys:

```env
NEBIUS_API_KEY=your_nebius_api_key_here
SGAI_API_KEY=your_scrapegraph_api_key_here
```
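
The agents read these variables with `os.getenv`, so any way of getting them into the process environment works. Below is a minimal sketch of an explicit check, assuming `python-dotenv` is installed (the project itself may load the file differently):

```python
# Minimal sketch, assuming python-dotenv is available; agents.py reads the
# variables with os.getenv, so it only matters that they end up in the
# environment before the workflow starts.
import os

from dotenv import load_dotenv

load_dotenv()  # reads .env from the current working directory

for key in ("NEBIUS_API_KEY", "SGAI_API_KEY"):
    if not os.getenv(key):
        raise RuntimeError(f"Missing required environment variable: {key}")
```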

## Usage

![usage](./assets/usage.gif)

You can use the Deep Researcher Agent in three ways. Each method below includes a demo image so you know what to expect.

### Web Interface

Run the Streamlit app:

```bash
uv run streamlit run app.py
```

Open your browser at [http://localhost:8501](http://localhost:8501)

What it looks like:

![demo](./assets/demo.png)
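
Under the hood, the UI only needs to collect a topic and hand it to the workflow. Here is a hypothetical minimal version of `app.py` (the real interface shown above is richer; `run_research` is the helper defined in `agents.py` later in this commit):

```python
# Hypothetical minimal Streamlit front end; the widget layout is
# illustrative, not the project's actual UI. run_research is the
# helper defined in agents.py.
import streamlit as st

from agents import run_research

st.title("Deep Researcher Agent")
topic = st.text_input("Research topic or question")

if st.button("Run research") and topic:
    with st.spinner("Researching, analyzing, and writing..."):
        report = run_research(topic)
    st.markdown(report)
```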

### Command Line

Run research directly from the command line:

```bash
uv run python agents.py
```

What it looks like:

![Terminal Demo](./assets/terminal-demo.png)
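
Note that the committed `agents.py` (shown in full below) defines `run_research` but no `__main__` guard, so the command above needs an entry point like this hypothetical one (the topic string is just an example):

```python
# Hypothetical entry point for `uv run python agents.py`; append to
# agents.py if it is missing. The topic string is illustrative.
if __name__ == "__main__":
    print(run_research("Impact of AI agents on software development"))
```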

### MCP Server

Add the following configuration to your `.cursor/mcp.json` or Claude Desktop's `claude_desktop_config.json` file (adjust paths and API keys as needed):

```json
{
  "mcpServers": {
    "deep_researcher_agent": {
      "command": "uv",
      "args": [
        "--directory",
        "/Your/Path/to/directory/awesome-ai-apps/advance_ai_agents/deep_researcher_agent",
        "run",
        "server.py"
      ],
      "env": {
        "NEBIUS_API_KEY": "your_nebius_api_key_here",
        "SGAI_API_KEY": "your_scrapegraph_api_key_here"
      }
    }
  }
}
```

This allows tools like Claude Desktop to manage and launch the MCP server automatically.

![Claude Desktop Demo](./assets/mcp-demo.png)
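
`server.py` itself is not included in this excerpt. Assuming it uses the FastMCP helper from the official `mcp` Python SDK, a plausible minimal shape would wrap `run_research` as a single tool:

```python
# Plausible sketch of server.py using the MCP Python SDK's FastMCP helper;
# the actual file is not shown in this excerpt, so the server name and
# tool docstring are illustrative.
from mcp.server.fastmcp import FastMCP

from agents import run_research

mcp = FastMCP("deep_researcher_agent")


@mcp.tool()
def deep_research(topic: str) -> str:
    """Run the multi-stage research workflow and return the final report."""
    return run_research(topic)


if __name__ == "__main__":
    mcp.run()  # stdio transport by default, which Claude Desktop expects
```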

## Project Structure

```
deep_researcher_agent/
├── app.py            # Streamlit web interface
├── agents.py         # Core agent workflow
├── server.py         # MCP server
├── assets/           # Static assets (images)
├── pyproject.toml    # Project configuration
└── README.md         # This file
```

---

## Development

### Code Formatting

```bash
uv run black .
uv run isort .
```

### Type Checking

```bash
uv run mypy .
```

### Testing

```bash
uv run pytest
```

---

## Contributing

Contributions are welcome! Please feel free to submit a Pull Request or open an issue.

---

## Acknowledgments

- [Agno](https://www.agno.com/) for agent orchestration
- [Scrapegraph](https://dub.sh/scrapegraphai) for web scraping
- [Nebius AI Studio](https://studio.nebius.com/) for AI model access
- [Streamlit](https://streamlit.io/) for the web interface

## Author

Developed with ❤️ by [Arindam Majumder](https://www.youtube.com/c/Arindam_1729)
Lines changed: 125 additions & 0 deletions
@@ -0,0 +1,125 @@
import os
from typing import Iterator

from agno.agent import Agent
from agno.models.nebius import Nebius

# from agno.tools.scrapegraph import ScrapeGraphTools
from agno.tools.duckduckgo import DuckDuckGoTools
from agno.utils.log import logger
from agno.workflow import RunResponse, Workflow


class DeepResearcherAgent(Workflow):
    """
    A multi-stage research workflow that:
    1. Gathers information from the web using advanced scraping tools.
    2. Analyzes and synthesizes the findings.
    3. Produces a clear, well-structured report.
    """

    # Searcher: gathers raw findings from the web. DuckDuckGo search is the
    # active tool; the commented ScrapeGraphTools import can be swapped in.
    searcher: Agent = Agent(
        tools=[DuckDuckGoTools()],
        model=Nebius(
            id="deepseek-ai/DeepSeek-V3-0324", api_key=os.getenv("NEBIUS_API_KEY")
        ),
        show_tool_calls=True,
        markdown=True,
        description=(
            "You are ResearchBot-X, an expert at finding and extracting high-quality, "
            "up-to-date information from the web. Your job is to gather comprehensive, "
            "reliable, and diverse sources on the given topic."
        ),
        instructions=(
            "1. Search for the most recent, authoritative sources (news, blogs, official docs, research papers, forums, etc.) on the topic.\n"
            "2. Extract key facts, statistics, and expert opinions.\n"
            "3. Cover multiple perspectives and highlight any disagreements or controversies.\n"
            "4. Include relevant statistics, data, and expert opinions where possible.\n"
            "5. Organize your findings in a clear, structured format (e.g., markdown table or sections by source type).\n"
            "6. If the topic is ambiguous, clarify with the user before proceeding.\n"
            "7. Be as comprehensive and verbose as possible—err on the side of including more detail.\n"
            "8. Always list the references and sources for your content. (This is mandatory.)"
        ),
    )

    # Analyst: synthesizes and interprets the research findings
    analyst: Agent = Agent(
        model=Nebius(
            id="deepseek-ai/DeepSeek-V3-0324", api_key=os.getenv("NEBIUS_API_KEY")
        ),
        markdown=True,
        description=(
            "You are AnalystBot-X, a critical thinker who synthesizes research findings "
            "into actionable insights. Your job is to analyze, compare, and interpret the "
            "information provided by the researcher."
        ),
        instructions=(
            "1. Identify key themes, trends, and contradictions in the research.\n"
            "2. Highlight the most important findings and their implications.\n"
            "3. Suggest areas for further investigation if gaps are found.\n"
            "4. Present your analysis in a structured, easy-to-read format.\n"
            "5. Extract and list ONLY the reference links or sources that were ACTUALLY found and provided by the researcher in their findings. Do NOT create, invent, or hallucinate any links.\n"
            "6. If no links were provided by the researcher, do not include a References section.\n"
            "7. Do not hallucinate or make up information. Use ONLY the links that were explicitly passed to you by the researcher.\n"
            "8. Verify that each link you include was actually present in the researcher's findings before listing it.\n"
            "9. If the researcher provided no links, simply state: No references found."
        ),
    )

    # Writer: produces the final, polished report
    writer: Agent = Agent(
        model=Nebius(
            id="deepseek-ai/DeepSeek-V3-0324", api_key=os.getenv("NEBIUS_API_KEY")
        ),
        markdown=True,
        description=(
            "You are WriterBot-X, a professional technical writer. Your job is to craft "
            "a clear, engaging, and well-structured report based on the analyst's summary."
        ),
        instructions=(
            "1. Write an engaging introduction that sets the context.\n"
            "2. Organize the main findings into logical sections with headings.\n"
            "3. Use bullet points, tables, or lists for clarity where appropriate.\n"
            "4. Conclude with a summary and actionable recommendations.\n"
            "5. Include a References & Sources section ONLY if the analyst provided actual links from their analysis.\n"
            "6. Use ONLY the reference links that were explicitly provided by the analyst in their analysis. Do NOT create, invent, or hallucinate any links.\n"
            "7. If the analyst provided links, format them as clickable markdown links in the References section.\n"
            "8. If no links were provided by the analyst, do not include a References section at all.\n"
            "9. Never add fake or made-up links; only use links that were actually found and passed through the research chain."
        ),
    )

    def run(self, topic: str) -> Iterator[RunResponse]:
        """
        Orchestrates the research, analysis, and report writing process for a given topic.
        """
        logger.info(f"Running deep researcher agent for topic: {topic}")

        # Step 1: Research (gather raw findings from the web)
        research_content = self.searcher.run(topic)
        # logger.info(f"Searcher content: {research_content.content}")

        logger.info("Analysis started")
        # Step 2: Analysis (synthesize the searcher's output)
        analysis = self.analyst.run(research_content.content)
        # logger.info(f"Analyst analysis: {analysis.content}")

        logger.info("Report Writing Started")
        # Step 3: Report writing (the writer streams the report chunk by chunk)
        report = self.writer.run(analysis.content, stream=True)
        yield from report


def run_research(query: str) -> str:
    """Run the full workflow and collect the streamed report into one string."""
    agent = DeepResearcherAgent()
    final_report_iterator = agent.run(
        topic=query,
    )

    # Consume the stream; the report is only generated as we iterate.
    full_report = ""
    for chunk in final_report_iterator:
        if chunk.content:
            full_report += chunk.content

    logger.info("Report Generated")
    return full_report
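
For programmatic use, `run_research` can be imported from another script; the topic below is just an example:

```python
# Example: run the full search -> analyze -> write pipeline from another
# module and print the final markdown report. The topic is illustrative.
from agents import run_research

report = run_research("State of open-source LLM agents")
print(report)
```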
