# Text constants for the Roblox LLM Leaderboard.

# Named so the join in INTRODUCTION_TEXT needs no backslash inside an f-string
# replacement field (a syntax error before Python 3.12).
NEWLINE = "\n"

# HTML heading markup carrying the leaderboard title.
TITLE = """<h1 align="center" id="space-title">Roblox LLM Leaderboard</h1>"""

# One entry per benchmark. Every entry has the keys "name", "link" and
# "description"; INTRODUCTION_TEXT reads all three.
TASK_DESCRIPTIONS = [
    {
        "name": "RobloxQA",
        "link": "https://huggingface.co/datasets/boatbomber/RobloxQA-v1.0",
        "description": "Multiple choice question answering about Roblox APIs and concepts.",
    },
    {
        "name": "RobloxQA_OpenEnded",
        "link": "https://huggingface.co/datasets/boatbomber/RobloxQA-OpenEnded-v1.0",
        "description": (
            "Question answering about Roblox APIs and concepts without multiple choices. "
            "Response correctness judged by an ensemble of reasoning LLMs by comparing the generated answer to the correct answer."
        ),
    },
]

# Markdown introduction: a tagline, a "Benchmarks" heading, then one bullet per
# TASK_DESCRIPTIONS entry formatted as "- [name](link): description".
INTRODUCTION_TEXT = f"""
Tracking LLM capabilities regarding Roblox game development.
### Benchmarks:
{NEWLINE.join(f"- [{task['name']}]({task['link']}): {task['description']}" for task in TASK_DESCRIPTIONS)}
"""