File size: 925 Bytes
f8efcf6 c8be55c 8fcbcdb f8efcf6 1c17c69 99931b9 1c17c69 8fcbcdb c8be55c |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 |
# HTML heading for the leaderboard: a centered <h1> with id "space-title".
TITLE = """<h1 align="center" id="space-title">Roblox LLM Leaderboard</h1>"""

# Benchmarks listed in the introduction text. Every entry provides the keys
# "name", "link" and "description"; all three are read when the bullet list
# for INTRODUCTION_TEXT is built below.
TASK_DESCRIPTIONS = [
    {
        "name": "RobloxQA",
        "link": "https://huggingface.co/datasets/boatbomber/RobloxQA-v1.0",
        "description": "Multiple choice question answering about Roblox APIs and concepts.",
    },
    {
        "name": "RobloxQA_OpenEnded",
        "link": "https://huggingface.co/datasets/boatbomber/RobloxQA-OpenEnded-v1.0",
        # Adjacent string literals are concatenated into a single description.
        "description": (
            "Question answering about Roblox APIs and concepts without multiple choices. "
            "Response correctness judged by an ensemble of reasoning LLMs by comparing the generated answer to the correct answer."
        ),
    },
]

# One Markdown bullet per benchmark, formatted as "- [name](link): description".
# This is built outside the f-string on purpose: a backslash ("\n") inside an
# f-string replacement field is a SyntaxError on Python versions before 3.12.
_BENCHMARK_LINES = "\n".join(
    f"- [{task['name']}]({task['link']}): {task['description']}"
    for task in TASK_DESCRIPTIONS
)

# Markdown introduction: a one-line summary followed by the benchmark list.
INTRODUCTION_TEXT = f"""
Tracking LLM capabilities regarding Roblox game development.
### Benchmarks:
{_BENCHMARK_LINES}
"""
|