# Static text shown on the leaderboard page: the HTML title, the list of
# benchmark tasks, and the markdown introduction built from that list.

# Referenced from inside the INTRODUCTION_TEXT f-string so the join separator
# does not need a backslash within a replacement field (a syntax error in
# f-strings before Python 3.12).
NEWLINE = "\n"

# HTML heading for the page.
TITLE = """<h1 align="center" id="space-title">Roblox LLM Leaderboard</h1>"""

# One entry per benchmark. Each dict carries the keys "name", "link" and
# "description", all of which are read when INTRODUCTION_TEXT is built below.
TASK_DESCRIPTIONS = [
    {
        "name": "RobloxQA",
        "link": "https://huggingface.co/datasets/boatbomber/RobloxQA-v1.0",
        "description": "Multiple choice question answering about Roblox APIs and concepts.",
    },
    {
        "name": "RobloxQA_OpenEnded",
        "link": "https://huggingface.co/datasets/boatbomber/RobloxQA-OpenEnded-v1.0",
        "description": (
            "Question answering about Roblox APIs and concepts without multiple choices. "
            "Response correctness judged by an ensemble of reasoning LLMs by comparing the generated answer to the correct answer."
        ),
    },
]

# Markdown introduction: a one-line summary, a "Benchmarks" heading, then one
# bullet per task formatted as "- [name](link): description". The text is
# evaluated once at import time, so later changes to TASK_DESCRIPTIONS are not
# reflected here.
INTRODUCTION_TEXT = f"""
Tracking LLM capabilities regarding Roblox game development.
### Benchmarks:
{NEWLINE.join([f"- [{task['name']}]({task['link']}): {task['description']}" for task in TASK_DESCRIPTIONS])}
"""