# multi-agent_deep-research-etheroi
#
# Sleeping
#
# File size: 25,880 Bytes

import os
import json
import logging
from datetime import datetime
# Try both import methods
try:
    import google.generativeai as genai
    GENAI_PACKAGE = "generativeai"
except ImportError:
    try:
        import google.genai as genai
        GENAI_PACKAGE = "genai"
    except ImportError:
        logging.error("Failed to import Google AI package")
        raise
import gradio as gr
from tavily import TavilyClient
from dotenv import load_dotenv
from logger_config import setup_logging
from typing import List, Dict, Any, Optional
from utils import (
    validate_response, 
    parse_research_results, 
    format_sources_section, 
    save_markdown_report, 
    convert_to_html
)
# Base server class for MCP
class MCPServer:
    """Minimal base for MCP servers.

    Holds the ``test_mode`` flag and declares the two hooks a concrete server
    has to provide; both hooks raise ``NotImplementedError`` here.
    """

    def __init__(self):
        # Off by default; subclasses / UIs may flip it.
        self.test_mode = False

    def process_request(self, request: Dict[str, Any]) -> Dict[str, Any]:
        """Handle one research request (must be overridden)."""
        message = "Subclasses must implement process_request"
        raise NotImplementedError(message)

    def create_interface(self) -> gr.Blocks:
        """Build the Gradio UI (must be overridden)."""
        message = "Subclasses must implement create_interface"
        raise NotImplementedError(message)

from agents import OrchestratorAgent, PlannerAgent, ReportAgent

# Set up logging: setup_logging() (imported from logger_config) is called once
# at import time and its result is indexed by name; everything in this module
# logs through the 'server' entry.
loggers = setup_logging()
server_logger = loggers['server']

class MultiAgentSystem:
    """Run one research query across the orchestrator, planner and report agents.

    The orchestrator creates the research plan and evaluates progress, the
    planner decides what to research next and which queries to run, Tavily
    supplies the web results, and the report agent writes the final report.
    """

    # Search budget for a single process_query() run. Kept as class attributes
    # so a subclass can tune them without touching the loop.
    MAX_SEARCHES_TOTAL = 30  # Total search limit
    MIN_RESULTS_PER_ITEM = 3  # Results needed before an item may stop early
    MAX_ATTEMPTS_PER_ITEM = 2  # Maximum attempts to research each item
    MIN_CONTENT_LENGTH = 100  # Results with shorter content are discarded
    DETAILED_CONTENT_LENGTH = 200  # Content longer than this counts as detailed

    def __init__(self, use_gemini=True, gemini_api_key=None, gemini_model=None,
                 tavily_api_key=None, openrouter_api_key=None, openrouter_model=None):
        """Store the configuration, configure Gemini if requested, build the agents.

        Args:
            use_gemini: Use Gemini when true, otherwise OpenRouter.
            gemini_api_key: Key used when ``use_gemini`` is true.
            gemini_model: Gemini model name passed to the agents.
            tavily_api_key: Key for web search; without it ``web_search`` raises.
            openrouter_api_key: Key used when ``use_gemini`` is false.
            openrouter_model: OpenRouter model id passed to the agents.

        Raises:
            Exception: Whatever an agent constructor raises (logged, then re-raised).
        """
        self.use_gemini = use_gemini
        self.gemini_api_key = gemini_api_key
        self.gemini_model = gemini_model
        self.tavily_api_key = tavily_api_key
        self.openrouter_api_key = openrouter_api_key
        self.openrouter_model = openrouter_model

        # Handle different package versions for Gemini configuration:
        # google.generativeai exposes configure(); for google.genai the key is
        # handed over through the GOOGLE_API_KEY environment variable.
        if use_gemini and gemini_api_key:
            try:
                if GENAI_PACKAGE == "generativeai":
                    genai.configure(api_key=gemini_api_key)
                else:
                    os.environ["GOOGLE_API_KEY"] = gemini_api_key
            except Exception as e:
                server_logger.warning(f"Using fallback configuration method: {str(e)}")
                os.environ["GOOGLE_API_KEY"] = gemini_api_key

        # All three agents receive the same keyword arguments.
        agent_kwargs = {
            'use_gemini': use_gemini,
            'api_key': gemini_api_key if use_gemini else openrouter_api_key,
            'openrouter_model': openrouter_model,
            'gemini_model': gemini_model
        }

        try:
            self.orchestrator = OrchestratorAgent(**agent_kwargs)
            self.planner = PlannerAgent(**agent_kwargs)
            self.report_agent = ReportAgent(**agent_kwargs)
        except Exception as e:
            server_logger.error(f"Failed to initialize agents: {str(e)}")
            raise

        # Tavily client is optional at construction time.
        if tavily_api_key:
            self.tavily_client = TavilyClient(api_key=tavily_api_key)
        else:
            self.tavily_client = None

    def web_search(self, query: str) -> List[Dict[str, str]]:
        """Perform a web search using Tavily.

        Args:
            query: Search string sent to Tavily.

        Returns:
            The ``'results'`` list of the Tavily response, or ``[]`` if the
            response has no such key.

        Raises:
            ValueError: If no Tavily client was configured.
            Exception: Any error from the Tavily call (logged, then re-raised).
        """
        if not self.tavily_client:
            raise ValueError("Tavily API key not provided")

        try:
            response = self.tavily_client.search(
                query,
                search_depth="advanced",  # Only 'basic' or 'advanced' are allowed
                max_results=5,  # Limit results to keep responses focused
                async_search=True,  # Use async search for better performance
                timeout=30  # 30 second timeout
            )
            return response.get('results', [])
        except Exception as e:
            server_logger.error(f"Web search failed: {str(e)}")
            raise  # Re-raise the exception to handle it in the calling code

    def _filter_new_results(self, results, research_item, seen_urls):
        """Return the results worth keeping for *research_item*.

        A result is kept when it has a URL that is not yet in *seen_urls*, its
        stripped content has at least ``MIN_CONTENT_LENGTH`` characters, and
        that content contains at least one whitespace-separated word of
        *research_item* (case-insensitive). URLs of kept results are added to
        *seen_urls*.
        """
        keywords = str(research_item).lower().split()
        kept = []
        for result in results:
            url = result.get('url')
            # `or ''` also covers an explicit None content value.
            content = (result.get('content') or '').strip()
            if not url or url in seen_urls or len(content) < self.MIN_CONTENT_LENGTH:
                continue
            lowered = content.lower()
            if any(keyword in lowered for keyword in keywords):
                seen_urls.add(url)
                kept.append(result)
        return kept

    def process_query(self, query: str) -> str:
        """Process a research query using the multi-agent system.

        Creates a research plan, then repeatedly evaluates progress, asks the
        planner for the unfulfilled items and searches for them until the plan
        is covered, the search budget is spent, or no item can be attempted
        any more. Finally generates the report and appends the sources section.

        Args:
            query: The user's research question.

        Returns:
            The report text followed by the formatted sources section.

        Raises:
            Exception: Any failure in an agent, the search, or report
                generation (logged with traceback, then re-raised).
        """
        try:
            # Step 1: Create a structured research plan
            server_logger.info("Creating research plan...")
            research_plan = self.orchestrator.create_research_plan(query)
            server_logger.info(f"Generated research plan: {json.dumps(research_plan, indent=2)}")

            # Step 2: Initialize research process
            all_search_results = []
            search_count = 0
            seen_urls = set()  # Track seen URLs to avoid duplicates
            research_attempts = {}  # Attempts per "type:item" key
            progress = {}

            # Step 3: Conduct research
            while search_count < self.MAX_SEARCHES_TOTAL:
                current_results = [r['content'] for r in all_search_results]
                progress = self.orchestrator.evaluate_research_progress(research_plan, current_results)

                if all(progress.values()):
                    server_logger.info("Research complete - all aspects covered with sufficient depth")
                    break

                remaining_items = self.planner.prioritize_unfulfilled_requirements(
                    research_plan,
                    progress,
                    current_results
                )
                if not remaining_items:
                    break

                attempted_any = False
                for item_type, research_item in remaining_items:
                    item_key = f"{item_type}:{research_item}"
                    if research_attempts.get(item_key, 0) >= self.MAX_ATTEMPTS_PER_ITEM:
                        server_logger.info(f"Reached maximum attempts for {item_key}")
                        continue

                    if search_count >= self.MAX_SEARCHES_TOTAL:
                        server_logger.info(f"Reached maximum total searches ({self.MAX_SEARCHES_TOTAL})")
                        break

                    server_logger.info(f"Researching {item_type}: {research_item}")
                    search_queries = self.planner.create_search_strategy(research_item, item_type)

                    # Track this research attempt
                    research_attempts[item_key] = research_attempts.get(item_key, 0) + 1
                    attempted_any = True

                    item_results = []
                    for search_query in search_queries:
                        if search_count >= self.MAX_SEARCHES_TOTAL:
                            break

                        # Ensure search query is a simple string
                        query_str = str(search_query).strip()
                        if not query_str:
                            continue

                        server_logger.info(f"Searching for: {query_str}")
                        results = self.web_search(query_str)
                        item_results.extend(
                            self._filter_new_results(results, research_item, seen_urls)
                        )
                        search_count += 1

                        # Stop early once this item has enough detailed results
                        if len(item_results) >= self.MIN_RESULTS_PER_ITEM and all(
                            len(r.get('content', '')) > self.DETAILED_CONTENT_LENGTH
                            for r in item_results
                        ):
                            break

                    all_search_results.extend(item_results)

                # If every remaining item had already used up its attempts,
                # nothing can change on the next pass (no new results, no new
                # searches); stop instead of spinning forever.
                if not attempted_any:
                    server_logger.info("No researchable items left - stopping research")
                    break

            # Step 4: Generate final report
            server_logger.info("Generating final report...")
            contexts, sources = parse_research_results(all_search_results)

            completion_stats = {
                "total_searches": search_count,
                "unique_sources": len(seen_urls),
                "research_coverage": dict(progress)
            }
            server_logger.info(f"Research stats: {json.dumps(completion_stats, indent=2)}")

            report = self.report_agent.generate_report(
                query=query,
                research_plan=research_plan,
                research_results=contexts,
                completion_stats=completion_stats
            )

            # Add sources section to the report
            report += "\n\n" + format_sources_section(sources)

            return report

        except Exception as e:
            server_logger.error(f"Error in process_query: {str(e)}", exc_info=True)
            raise

# Global UI component for progress tracking. Stays None until
# create_interface() runs, which rebinds it (via `global`) to the gr.Textbox
# listed first in the outputs of the "Begin Research" click handler.
progress_output = None

def create_interface():
    """Create the Gradio interface with API key inputs.

    Builds the Blocks layout (progress log, API selection, key/model inputs,
    query box, report preview and download files), wires the event handlers
    and rebinds the module-level ``progress_output`` to the progress Textbox.

    Returns:
        The constructed ``gr.Blocks`` interface (not yet launched).
    """
    global progress_output

    css = """
    .log-container { 
        margin: 16px 0;
    }
    .log-output {
        font-family: monospace;
        white-space: pre !important;
        height: 300px;
        overflow-y: auto;
        background-color: #1e1e1e !important;
        color: #d4d4d4 !important;
        padding: 10px;
        border-radius: 4px;
    }
    .research-progress {
        position: relative;
    }
    .minimize-btn {
        position: absolute;
        right: 10px;
        top: 10px;
    }
    """

    with gr.Blocks(title="Multi-Agent Research System", css=css) as interface:
        gr.Markdown(
            """# Multi-Agent Research System
            
            This system uses multiple AI agents to perform comprehensive research and analysis.
            Please provide your API keys to begin."""
        )

        # Progress tracking container with minimize button
        with gr.Row(elem_classes="log-container"):
            with gr.Column(elem_classes="research-progress"):
                progress_output = gr.Textbox(
                    value="Waiting to begin research...",
                    elem_classes=["log-output"],
                    show_label=False,
                    lines=10,
                    max_lines=20,
                    interactive=False
                )
                # NOTE: no event handler is attached to this button in this function.
                minimize_btn = gr.Button("🔽", elem_classes="minimize-btn")

        with gr.Row():
            api_type = gr.Radio(
                choices=["Gemini", "OpenRouter"],
                label="Choose API Type",
                value="Gemini",
                info="Select which API to use for the agents"
            )

        with gr.Row():
            with gr.Column():
                gemini_key = gr.Textbox(
                    label="Gemini API Key",
                    placeholder="Enter your Gemini API key",
                    type="password"
                )
                gemini_model = gr.Dropdown(
                    label="Gemini Model",
                    choices=[
                        "gemini-2.0-flash",
                        "gemini-2.0-flash-lite",
                        "gemini-1.5-pro",
                        "gemini-2.5-pro-preview-05-06",
                        "gemini-2.5-flash-preview-04-17"
                    ],
                    value="gemini-2.0-flash",
                    info="Choose Gemini model version"
                )
            with gr.Column():
                tavily_key = gr.Textbox(
                    label="Tavily API Key (Required)",
                    placeholder="Enter your Tavily API key",
                    type="password"
                )

        with gr.Row():
            with gr.Column():
                openrouter_key = gr.Textbox(
                    label="OpenRouter API Key",
                    placeholder="Enter your OpenRouter API key",
                    type="password",
                    visible=False
                )
                openrouter_model = gr.Textbox(
                    label="OpenRouter Model ID",
                    placeholder="e.g., anthropic/claude-3-opus:beta",
                    info="Enter any valid OpenRouter model ID",
                    value="anthropic/claude-3-opus:beta",
                    visible=False
                )

        query_input = gr.Textbox(
            label="Research Query",
            placeholder="Enter your research question...",
            lines=3,
            info="Enter a detailed research question or topic to investigate"
        )

        submit_btn = gr.Button("Begin Research", variant="primary")

        with gr.Row():
            output = gr.Markdown(label="Research Results")
            download_md = gr.File(label="Download Markdown Report", visible=False)
            download_html = gr.File(label="Download HTML Report", visible=False)

        def update_api_visibility(choice):
            """Show the inputs of the selected API and hide the other API's inputs."""
            use_gemini = choice == "Gemini"
            return {
                gemini_key: gr.update(visible=use_gemini),
                gemini_model: gr.update(visible=use_gemini),
                openrouter_key: gr.update(visible=not use_gemini),
                openrouter_model: gr.update(visible=not use_gemini)
            }

        class LogCaptureHandler(logging.Handler):
            """Logging handler that collects formatted records in ``self.logs``."""

            def __init__(self):
                super().__init__()
                self.logs = []

            def emit(self, record):
                # logging ignores emit()'s return value, so just record the line.
                self.logs.append(self.format(record))

        def _failure(progress_text, report_text):
            """Build the 4-value handler result for a failed run.

            The click handler declares four outputs (progress, report, two
            download files), so every return path must supply four values.
            """
            return (
                gr.update(value=progress_text),  # Progress output
                report_text,  # Markdown output
                gr.update(visible=False),  # Hide markdown download
                gr.update(visible=False)   # Hide HTML download
            )

        def run_research(query, api_type, gemini_key, gemini_model, tavily_key, openrouter_key, openrouter_model):
            """Validate the keys, run the research and return the four UI outputs."""
            if not tavily_key:
                server_logger.error("Missing Tavily API key")
                return _failure(
                    "Error: Missing Tavily API key",
                    "Please provide a Tavily API key for web search capability."
                )

            if api_type == "Gemini" and not gemini_key:
                server_logger.error("Missing Gemini API key")
                return _failure(
                    "Error: Missing Gemini API key",
                    "Please provide a Gemini API key when using Gemini mode."
                )

            if api_type == "OpenRouter" and not openrouter_key:
                server_logger.error("Missing OpenRouter API key")
                return _failure(
                    "Error: Missing OpenRouter API key",
                    "Please provide an OpenRouter API key when using OpenRouter mode."
                )

            # Capture server log lines for the duration of this run only.
            log_handler = LogCaptureHandler()
            log_handler.setFormatter(logging.Formatter('%(levelname)s - %(message)s'))
            server_logger.addHandler(log_handler)

            try:
                system = MultiAgentSystem(
                    use_gemini=(api_type == "Gemini"),
                    gemini_api_key=gemini_key if api_type == "Gemini" else None,
                    gemini_model=gemini_model if api_type == "Gemini" else None,
                    tavily_api_key=tavily_key,
                    openrouter_api_key=openrouter_key if api_type == "OpenRouter" else None,
                    openrouter_model=openrouter_model if api_type == "OpenRouter" else None
                )

                result = system.process_query(query)

                # Save markdown report and get file path
                md_file_path = save_markdown_report(result)
                html_file_path = convert_to_html(result)
            except Exception as e:
                server_logger.error(f"Research failed: {str(e)}", exc_info=True)
                error_msg = f"ERROR: Research failed: {str(e)}"
                return _failure(error_msg, error_msg)
            finally:
                # Always detach, otherwise a failed run leaves its handler on
                # the shared logger and handlers pile up across runs.
                server_logger.removeHandler(log_handler)

            return (
                gr.update(value="\n".join(log_handler.logs)),  # Progress output
                result,  # Markdown output
                gr.update(value=md_file_path, visible=True),  # Download markdown button
                gr.update(value=html_file_path, visible=True)  # Download HTML button
            )

        # Connect event handlers
        api_type.change(
            fn=update_api_visibility,
            inputs=[api_type],
            outputs=[gemini_key, gemini_model, openrouter_key, openrouter_model]
        )

        submit_btn.click(
            fn=run_research,
            inputs=[
                query_input, api_type, gemini_key, gemini_model,
                tavily_key, openrouter_key, openrouter_model
            ],
            outputs=[progress_output, output, download_md, download_html],
            show_progress="full"
        )

        gr.Examples(
            examples=[
                ["What are the latest advances in transformer architecture optimizations?"],
                ["Explain the mathematical foundations of diffusion models"],
                ["Compare and analyze different approaches to few-shot learning"]
            ],
            inputs=query_input
        )

    return interface

class GradioMCPServer(MCPServer):
    """MCP server that answers research requests through a MultiAgentSystem.

    Offers a programmatic entry point (``process_request``) and a Gradio UI
    (``create_interface``). When ``test_mode`` is on, a canned report is
    returned instead of calling the agents.
    """

    # Canned report used in test mode (no trailing newline).
    _TEST_MODE_REPORT = (
        "# Test Mode Response\n"
        "                \n"
        "## Overview\n"
        "This is a sample report generated in test mode without using API credits.\n"
        "\n"
        "## Key Findings\n"
        "1. Test finding one\n"
        "2. Test finding two\n"
        "\n"
        "## Test Results\n"
        "Sample analysis content..."
    )

    def __init__(self, use_gemini: bool = True,
                 gemini_api_key: Optional[str] = None,
                 gemini_model: Optional[str] = None,
                 tavily_api_key: Optional[str] = None,
                 openrouter_api_key: Optional[str] = None,
                 openrouter_model: Optional[str] = None):
        """Create the server and the MultiAgentSystem it delegates to.

        All arguments are forwarded unchanged to ``MultiAgentSystem``.
        """
        super().__init__()
        self.test_mode = False

        # Initialize the multi-agent system
        self.agent_system = MultiAgentSystem(
            use_gemini=use_gemini,
            gemini_api_key=gemini_api_key,
            gemini_model=gemini_model,
            tavily_api_key=tavily_api_key,
            openrouter_api_key=openrouter_api_key,
            openrouter_model=openrouter_model
        )

    def process_request(self, request: Dict[str, Any]) -> Dict[str, Any]:
        """Process a research request and return the markdown report.

        Args:
            request: Mapping read with ``.get``; ``'query'`` (default ``''``)
                is the research question and ``'format'`` (default
                ``'markdown'``) selects which file is written — markdown for
                ``'markdown'``, HTML for anything else.

        Returns:
            A dict with ``'response'`` (report text or ``"Error: ..."``),
            ``'file_path'`` (saved file, ``None`` on error) and ``'status'``
            (``'success'`` or ``'error'``). Exceptions are logged and reported
            through the dict rather than raised.
        """
        try:
            query = request.get('query', '')
            output_format = request.get('format', 'markdown')

            if self.test_mode:
                markdown_text = self._TEST_MODE_REPORT + "\n"
            else:
                # process_query returns the report as a single string.
                markdown_text = self.agent_system.process_query(query)

            if output_format == 'markdown':
                file_path = save_markdown_report(markdown_text)
            else:
                file_path = convert_to_html(markdown_text)

            # Return response with markdown content and file path
            return {
                "response": markdown_text,
                "file_path": file_path,
                "status": "success"
            }

        except Exception as e:
            server_logger.error(f"Error processing request: {str(e)}")
            return {
                "response": f"Error: {str(e)}",
                "file_path": None,
                "status": "error"
            }

    def create_interface(self) -> gr.Blocks:
        """Create the Gradio interface with markdown preview and file download.

        Returns:
            The constructed ``gr.Blocks`` interface (not yet launched).
        """
        with gr.Blocks(title="Research Assistant", theme=gr.themes.Soft()) as interface:
            gr.Markdown("# Research Assistant")

            with gr.Row():
                with gr.Column(scale=3):
                    query_input = gr.Textbox(
                        label="Research Query",
                        placeholder="Enter your research question...",
                        lines=3
                    )
                with gr.Column(scale=1):
                    test_mode_checkbox = gr.Checkbox(
                        label="Test Mode (No API credits used)",
                        value=False
                    )

            submit_btn = gr.Button("Begin Research", variant="primary")

            with gr.Row():
                # Preview panel
                report_output = gr.Markdown(label="Research Results")
                # Download panel
                with gr.Column():
                    gr.Markdown("### Download Options")
                    with gr.Row():
                        download_md = gr.File(label="Download Markdown", visible=False)
                        download_html = gr.File(label="Download HTML", visible=False)

            def process_query(query: str, test_mode: bool) -> tuple[str, Any, Any]:
                """Run the query (or test mode) and return preview text plus file updates."""
                try:
                    # The checkbox value is stored on the server instance.
                    self.test_mode = test_mode
                    if self.test_mode:
                        markdown_text = self._TEST_MODE_REPORT
                    else:
                        # Use multi-agent system to process query
                        markdown_text = self.agent_system.process_query(query)

                    # Generate both markdown and HTML files
                    md_path = save_markdown_report(markdown_text)
                    html_path = convert_to_html(markdown_text)

                    # Make download buttons visible and return results
                    return (
                        markdown_text,  # Preview content
                        gr.update(value=md_path, visible=True),  # Markdown download
                        gr.update(value=html_path, visible=True)  # HTML download
                    )

                except Exception as e:
                    server_logger.error(f"Error processing query: {str(e)}")
                    return (
                        f"Error: {str(e)}",  # Error message in preview
                        gr.update(visible=False),  # Hide markdown download
                        gr.update(visible=False)   # Hide HTML download
                    )

            # Connect the button to the processing function
            submit_btn.click(
                fn=process_query,
                inputs=[query_input, test_mode_checkbox],
                outputs=[report_output, download_md, download_html]
            )

            # Add example queries
            gr.Examples(
                examples=[
                    ["What are the latest advances in transformer architecture optimizations?"],
                    ["Explain the mathematical foundations of diffusion models"],
                    ["Compare and analyze different approaches to few-shot learning"]
                ],
                inputs=query_input
            )

        return interface

if __name__ == "__main__":
    # Script entry point: build the module-level interface and serve it.
    try:
        # On Windows with Python 3.8+, switch asyncio to the selector event
        # loop policy before the server starts.
        running_on_windows = os.name == 'nt'
        if running_on_windows:
            import asyncio
            import sys
            version = sys.version_info
            if version.major == 3 and version.minor >= 8:
                selector_policy = asyncio.WindowsSelectorEventLoopPolicy()
                asyncio.set_event_loop_policy(selector_policy)

        server_logger.info("Starting Gradio server")
        launch_options = {
            "server_name": "0.0.0.0",
            "share": False,
            "debug": True,
            "prevent_thread_lock": True,  # Allow for proper cleanup
            "mcp_server": True,
        }
        interface = create_interface()
        interface.launch(**launch_options)
    except Exception as e:
        # Log with traceback, then let the failure propagate.
        server_logger.error(f"Failed to start Gradio server: {e!s}", exc_info=True)
        raise