import gradio as gr

# Sample data for demonstration
perception_papers = [
    {
        "title": "CoSDH: Communication-Efficient Collaborative Perception",
        "venue": "CVPR 2025",
        "description": "Novel approach for efficient collaborative perception using supply-demand awareness.",
        "link": "https://arxiv.org/abs/2503.03430"
    },
    {
        "title": "V2X-R: Cooperative LiDAR-4D Radar Fusion",
        "venue": "CVPR 2025", 
        "description": "Cooperative fusion of LiDAR and 4D radar sensors for enhanced 3D object detection.",
        "link": "https://arxiv.org/abs/2411.08402"
    },
    {
        "title": "Where2comm: Efficient Collaborative Perception via Spatial Confidence Maps",
        "venue": "NeurIPS 2022",
        "description": "Groundbreaking work on efficient collaborative perception using spatial confidence maps.",
        "link": "https://openreview.net/forum?id=dLL4KXzKUpS"
    },
    {
        "title": "STAMP: Scalable Task-Agnostic Collaborative Perception",
        "venue": "ICLR 2025",
        "description": "Framework for scalable collaborative perception that is both task and model agnostic.",
        "link": "https://openreview.net/forum?id=8NdNniulYE"
    },
    {
        "title": "CoBEVFlow: Robust Asynchronous Collaborative 3D Detection",
        "venue": "NeurIPS 2023",
        "description": "Handles temporal asynchrony in collaborative perception using bird's eye view flow.",
        "link": "https://openreview.net/forum?id=UHIDdtxmVS"
    }
]

datasets_data = [
    ["DAIR-V2X", "2022", "Real-world", "V2I", "71K frames", "3D boxes, Infrastructure"],
    ["V2V4Real", "2023", "Real-world", "V2V", "20K frames", "Real V2V, Highway"],
    ["TUMTraf-V2X", "2024", "Real-world", "V2X", "2K sequences", "Dense labels, Urban"],
    ["OPV2V", "2022", "Simulation", "V2V", "Large-scale", "CARLA, Multi-agent"],
    ["V2X-Sim", "2021", "Simulation", "Multi", "Scalable", "Multi-agent, Collaborative"],
    ["DOLPHINS", "2024", "Simulation", "UAV", "UAV swarms", "AirSim, Multi-UAV"]
]

def create_paper_card(paper):
    return f"""
    <div style="border: 1px solid #ddd; border-radius: 10px; padding: 20px; margin: 10px 0; background: white; box-shadow: 0 2px 5px rgba(0,0,0,0.1);">
        <div style="background: #667eea; color: white; padding: 5px 10px; border-radius: 15px; display: inline-block; font-size: 0.8em; margin-bottom: 10px;">
            {paper['venue']}
        </div>
        <h3 style="color: #333; margin: 10px 0;">{paper['title']}</h3>
        <p style="color: #666; line-height: 1.5; margin-bottom: 15px;">{paper['description']}</p>
        <a href="{paper['link']}" target="_blank" style="background: #667eea; color: white; padding: 8px 15px; border-radius: 5px; text-decoration: none; font-size: 0.9em;">
            📄 Read Paper
        </a>
    </div>
    """

# Custom CSS
custom_css = """
.gradio-container {
    max-width: 1200px !important;
}
.main-header {
    text-align: center;
    background: linear-gradient(135deg, #667eea 0%, #764ba2 100%);
    color: white;
    padding: 40px 20px;
    border-radius: 15px;
    margin-bottom: 30px;
}
"""

# Create the interface
with gr.Blocks(
    title="๐Ÿค– Awesome Multi-Agent Collaborative Perception",
    theme=gr.themes.Soft(),
    css=custom_css
) as demo:
    
    # Header
    gr.HTML("""
    <div class="main-header">
        <h1 style="font-size: 2.5rem; margin-bottom: 10px;">🤖 Awesome Multi-Agent Collaborative Perception</h1>
        <p style="font-size: 1.2rem; opacity: 0.9;">Explore cutting-edge resources for Multi-Agent Collaborative Perception, Prediction, and Planning</p>
        <div style="display: flex; justify-content: center; gap: 30px; margin-top: 20px; flex-wrap: wrap;">
            <div style="background: rgba(255,255,255,0.2); padding: 10px 20px; border-radius: 25px;">
                <div style="font-size: 1.5rem; font-weight: bold;">200+</div>
                <div>Papers</div>
            </div>
            <div style="background: rgba(255,255,255,0.2); padding: 10px 20px; border-radius: 25px;">
                <div style="font-size: 1.5rem; font-weight: bold;">25+</div>
                <div>Datasets</div>
            </div>
            <div style="background: rgba(255,255,255,0.2); padding: 10px 20px; border-radius: 25px;">
                <div style="font-size: 1.5rem; font-weight: bold;">50+</div>
                <div>Code Repos</div>
            </div>
            <div style="background: rgba(255,255,255,0.2); padding: 10px 20px; border-radius: 25px;">
                <div style="font-size: 1.5rem; font-weight: bold;">2025</div>
                <div>Updated</div>
            </div>
        </div>
    </div>
    """)
    
    # Main navigation tabs
    with gr.Tabs():
        
        with gr.Tab("๐Ÿ” Perception"):
            gr.Markdown("## Multi-Agent Collaborative Perception Papers")
            gr.Markdown("*Latest research in collaborative sensing, 3D object detection, and V2X communication*")
            
            # Create paper cards
            papers_html = "".join([create_paper_card(paper) for paper in perception_papers])
            gr.HTML(papers_html)
            
            gr.Markdown("""
            ### 🔄 Key Communication Strategies (toy sketch below):
            - **Early Fusion**: Raw sensor data sharing
            - **Late Fusion**: Detection-level information exchange  
            - **Intermediate Fusion**: Feature-level collaboration
            - **Selective Communication**: Confidence-based data sharing
            """)
            
        with gr.Tab("๐Ÿ“Š Datasets"):
            gr.Markdown("## Datasets & Benchmarks")
            gr.Markdown("*Comprehensive collection of real-world and simulation datasets*")
            
            gr.Dataframe(
                value=datasets_data,
                headers=["Dataset", "Year", "Type", "Agents", "Size", "Features"],
                datatype=["str", "str", "str", "str", "str", "str"],
                interactive=False
            )
            
            gr.Markdown("""
            ### 🌟 Notable Features:
            - **DAIR-V2X**: First real-world V2I collaborative perception dataset with infrastructure sensors
            - **V2V4Real**: Real vehicle-to-vehicle communication dataset collected on highways
            - **TUMTraf-V2X**: Dense annotations for urban collaborative perception scenarios
            - **OPV2V**: Large-scale simulation benchmark built on CARLA platform
            - **V2X-Sim**: Comprehensive multi-agent simulation with customizable scenarios
            """)
            
        with gr.Tab("๐Ÿ“ Tracking"):
            gr.Markdown("## Multi-Object Tracking & State Estimation")
            gr.Markdown("*Collaborative tracking across distributed agents with uncertainty quantification*")
            
            gr.HTML("""
            <div style="display: grid; grid-template-columns: repeat(auto-fit, minmax(300px, 1fr)); gap: 20px; margin: 20px 0;">
                <div style="border: 1px solid #ddd; border-radius: 10px; padding: 20px; background: white; box-shadow: 0 2px 5px rgba(0,0,0,0.1);">
                    <h3 style="color: #4ECDC4;">MOT-CUP</h3>
                    <p>Multi-Object Tracking with Conformal Uncertainty Propagation</p>
                    <a href="https://arxiv.org/abs/2303.14346" target="_blank" style="color: #667eea;">๐Ÿ“„ Paper</a>
                </div>
                <div style="border: 1px solid #ddd; border-radius: 10px; padding: 20px; background: white; box-shadow: 0 2px 5px rgba(0,0,0,0.1);">
                    <h3 style="color: #4ECDC4;">DMSTrack</h3>
                    <p>Probabilistic 3D Multi-Object Cooperative Tracking (ICRA 2024)</p>
                    <a href="https://arxiv.org/abs/2309.14655" target="_blank" style="color: #667eea;">๐Ÿ“„ Paper</a>
                </div>
                <div style="border: 1px solid #ddd; border-radius: 10px; padding: 20px; background: white; box-shadow: 0 2px 5px rgba(0,0,0,0.1);">
                    <h3 style="color: #4ECDC4;">CoDynTrust</h3>
                    <p>Dynamic Feature Trust for Robust Asynchronous Collaborative Perception (ICRA 2025)</p>
                    <a href="https://arxiv.org/abs/2502.08169" target="_blank" style="color: #667eea;">๐Ÿ“„ Paper</a>
                </div>
            </div>
            """)
            
            gr.Markdown("""
            ### 🎯 Key Challenges:
            - **Temporal Asynchrony**: Handling different sensor timestamps and communication delays
            - **Uncertainty Quantification**: Reliable confidence estimation across multiple agents (see the fusion sketch below)
            - **Data Association**: Multi-agent correspondence and track management
            - **Scalability**: Maintaining performance with an increasing number of agents
            """)
            
        with gr.Tab("๐Ÿ”ฎ Prediction"):
            gr.Markdown("## Trajectory Forecasting & Motion Prediction")
            gr.Markdown("*Cooperative prediction for autonomous systems and multi-agent coordination*")
            
            gr.HTML("""
            <div style="display: grid; grid-template-columns: repeat(auto-fit, minmax(300px, 1fr)); gap: 20px; margin: 20px 0;">
                <div style="border: 1px solid #ddd; border-radius: 10px; padding: 20px; background: white; box-shadow: 0 2px 5px rgba(0,0,0,0.1);">
                    <h3 style="color: #45B7D1;">V2X-Graph</h3>
                    <p>Learning Cooperative Trajectory Representations (NeurIPS 2024)</p>
                    <a href="https://arxiv.org/abs/2311.00371" target="_blank" style="color: #667eea;">๐Ÿ“„ Paper</a>
                </div>
                <div style="border: 1px solid #ddd; border-radius: 10px; padding: 20px; background: white; box-shadow: 0 2px 5px rgba(0,0,0,0.1);">
                    <h3 style="color: #45B7D1;">Co-MTP</h3>
                    <p>Cooperative Multi-Temporal Prediction Framework (ICRA 2025)</p>
                    <a href="https://arxiv.org/abs/2502.16589" target="_blank" style="color: #667eea;">๐Ÿ“„ Paper</a>
                </div>
            </div>
            """)
            
            gr.HTML("""
            <div style="background: #f8f9fa; border-radius: 10px; padding: 20px; margin: 20px 0;">
                <h3>🧠 Key Approaches:</h3>
                <ul style="line-height: 1.8;">
                    <li><strong>Graph Neural Networks</strong>: Modeling agent interactions and social behaviors (see the message-passing sketch below)</li>
                    <li><strong>Transformer Architectures</strong>: Attention-based prediction with long-range dependencies</li>
                    <li><strong>Multi-Modal Fusion</strong>: Combining LiDAR, camera, and communication data</li>
                    <li><strong>Uncertainty Quantification</strong>: Reliable confidence estimation for safety-critical applications</li>
                </ul>
            </div>
            """)
            
        with gr.Tab("โš™๏ธ Methods"):
            gr.Markdown("## Methods & Techniques")
            gr.Markdown("*Core methodologies for communication, robustness, and learning in collaborative systems*")
            
            with gr.Row():
                with gr.Column():
                    gr.Markdown("""
                    ### 📡 Communication Strategies
                    - **Bandwidth Optimization**: Compression and selective sharing (see the selection sketch below)
                    - **Protocol Design**: V2V, V2I, V2X communication standards
                    - **Network Topology**: Centralized vs. distributed architectures
                    - **Quality of Service**: Latency and reliability management
                    """)
                
                with gr.Column():
                    gr.Markdown("""
                    ### 🛡️ Robustness Approaches
                    - **Byzantine Fault Tolerance**: Handling adversarial agents
                    - **Uncertainty Handling**: Robust fusion under noise
                    - **Privacy Preservation**: Secure multi-party computation
                    - **Malicious Agent Detection**: CP-Guard framework (AAAI 2025)
                    """)
            
            gr.HTML("""
            <div style="background: linear-gradient(135deg, #667eea 0%, #764ba2 100%); color: white; border-radius: 10px; padding: 20px; margin: 20px 0;">
                <h3>🧠 Learning Paradigms</h3>
                <div style="display: grid; grid-template-columns: repeat(auto-fit, minmax(250px, 1fr)); gap: 15px; margin-top: 15px;">
                    <div>• <strong>Federated Learning</strong>: Distributed model training</div>
                    <div>• <strong>Transfer Learning</strong>: Cross-domain adaptation</div>
                    <div>• <strong>Meta-Learning</strong>: Quick adaptation to new scenarios</div>
                    <div>• <strong>Heterogeneous Learning</strong>: HEAL framework (ICLR 2024)</div>
                </div>
            </div>
            """)
            
        with gr.Tab("๐Ÿ›๏ธ Conferences"):
            gr.Markdown("## Top Venues & Publication Trends")
            gr.Markdown("*Premier conferences and emerging research directions in collaborative perception*")
            
            conference_data = [
                ["CVPR 2025", "5+", "End-to-end systems, robustness"],
                ["ICLR 2025", "3+", "Learning representations, scalability"], 
                ["AAAI 2025", "4+", "AI applications, defense mechanisms"],
                ["ICRA 2025", "6+", "Robotics applications, real-world deployment"],
                ["NeurIPS 2024", "2+", "Theoretical foundations, novel architectures"]
            ]
            
            gr.Dataframe(
                value=conference_data,
                headers=["Conference", "Papers", "Focus Areas"],
                datatype=["str", "str", "str"],
                interactive=False
            )
            
            gr.Markdown("""
            ### 📊 Research Trends (2024-2025):
            - **Communication Efficiency**: 40% increase in bandwidth-aware methods
            - **Robustness & Security**: Emerging focus on adversarial robustness (15+ papers)
            - **Real-World Deployment**: Growing emphasis on practical systems and field tests
            - **Heterogeneous Systems**: Multi-modal and multi-agent diversity becoming standard
            - **End-to-End Learning**: Integration of perception, prediction, and planning
            """)
    
    # Footer
    gr.HTML("""
    <div style="text-align: center; margin-top: 40px; padding: 30px; background: #f8f9fa; border-radius: 10px;">
        <h3>๐Ÿค Contributing</h3>
        <p>We welcome contributions! Please submit papers, datasets, and code repositories via GitHub.</p>
        <div style="margin-top: 20px;">
            <a href="https://github.com/your-username/awesome-multi-agent-collaborative-perception" target="_blank" 
               style="background: #667eea; color: white; padding: 10px 20px; border-radius: 5px; text-decoration: none; margin: 5px;">
                📚 GitHub Repository
            </a>
            <a href="https://huggingface.co/spaces/your-username/awesome-multi-agent-collaborative-perception" target="_blank"
               style="background: #ff6b6b; color: white; padding: 10px 20px; border-radius: 5px; text-decoration: none; margin: 5px;">
                🤗 Hugging Face Space
            </a>
        </div>
        <p style="margin-top: 20px; color: #666;">Made with โค๏ธ for the Collaborative Perception Community</p>
    </div>
    """)

if __name__ == "__main__":
    demo.launch()