# Display text for the Roblox LLM Leaderboard page: the page title, the list
# of benchmarks, and the Markdown introduction that is built from that list.

# HTML heading for the leaderboard.
TITLE = """<h1 align="center" id="space-title">Roblox LLM Leaderboard</h1>"""


# One entry per benchmark. Every entry has the same three string keys:
#   "name"        - label used as the Markdown link text
#   "link"        - URL the label points to
#   "description" - one-line summary shown after the link
TASK_DESCRIPTIONS = [
    {
        "name": "RobloxQA",
        "link": "https://huggingface.co/datasets/boatbomber/RobloxQA-v1.0",
        "description": "Multiple choice question answering about Roblox APIs and concepts.",
    },
    {
        "name": "RobloxQA_OpenEnded",
        "link": "https://huggingface.co/datasets/boatbomber/RobloxQA-OpenEnded-v1.0",
        "description": (
            "Question answering about Roblox APIs and concepts without multiple choices. "
            "Response correctness judged by an ensemble of reasoning LLMs by comparing the generated answer to the correct answer."
        ),
    },
]


# Markdown bullet list, one "- [name](link): description" line per benchmark.
# Built outside the f-string below because a backslash ("\n") inside an
# f-string replacement field is a SyntaxError on Python versions before 3.12.
_BENCHMARK_BULLETS = "\n".join(
    f"- [{task['name']}]({task['link']}): {task['description']}"
    for task in TASK_DESCRIPTIONS
)

# Markdown introduction: a one-line summary followed by the benchmark list.
INTRODUCTION_TEXT = f"""

Tracking LLM capabilities regarding Roblox game development.



### Benchmarks:



{_BENCHMARK_BULLETS}

"""