Spaces:

opencompass
/

CompassAcademic-Leaderboard-Full-Version

Running

myhs committed on Apr 7

Commit

0ef0084

verified ·

1 Parent(s): c7c0bc8

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -34,7 +34,10 @@ head_style = """
 DATA_URL_BASE = "http://opencompass.oss-cn-shanghai.aliyuncs.com/dev-assets/hf-research/"
 MAIN_LEADERBOARD_DESCRIPTION = """## Compass Academic Leaderboard (Full Version)
---WIP--
 """
 Initial_title = 'Compass Academic Leaderboard'

 DATA_URL_BASE = "http://opencompass.oss-cn-shanghai.aliyuncs.com/dev-assets/hf-research/"
 MAIN_LEADERBOARD_DESCRIPTION = """## Compass Academic Leaderboard (Full Version)
+The CompassAcademic currently focuses on the comprehensive reasoning abilities of LLMs.
+- The datasets selected so far include General Knowledge Reasoning (MMLU-Pro/GPQA-Diamond), Logical Reasoning (BBH), Mathematical Reasoning (MATH-500, AIME), Code Completion (LiveCodeBench, HumanEval), and Instruction Following (IFEval).
+- Currently, the evaluation primarily targets chat models, with updates featuring the latest community models at irregular intervals.
+- Prompts and reproduction scripts can be found in [**OpenCompass**: A Toolkit for Evaluation of LLMs](https://github.com/open-compass/opencompass)🏆.
 """
 Initial_title = 'Compass Academic Leaderboard'