# FutureBench / process_data / config_db.py
# vinid: Leaderboard deployment 2025-07-16 18:05:41 (6441bc6)
"""
Configuration for database to HuggingFace pipeline.
Update these settings to match your setup.
"""
import os
# Database Configuration
# Note: Database connection is handled by future_bench.database.get_session()
# The script uses the same database connection as the main FutureBench app
# HuggingFace Configuration
HF_CONFIG = {
    # Read from the HF_TOKEN environment variable; None when it is unset.
    "token": os.environ.get("HF_TOKEN"),
    "data_repo": "futurebench/data",
    "results_repo": "futurebench/results",
    # Optional: for model submissions.
    "requests_repo": "futurebench/requests",
}
# Data Processing Settings
PROCESSING_CONFIG = {
    # Number of days of data to include.
    "days_history": 180,
    # Minimum number of predictions a model needs in order to be included.
    "min_predictions": 5,
    # Event types to include.
    "event_types": ["news", "polymarket", "sports"],
    # Models to leave out of the public dataset.
    "exclude_models": ["test", "debug"],
}
# Note: No schema mapping is needed because we use SQLAlchemy ORM models.
# The script uses the same models as convert_to_csv.py:
# - EventBase (events table)
# - Prediction (predictions table)