Spaces:

opll-org
/

Open-Persian-LLM-Leaderboard

Running

tohid.abedini committed on Nov 16, 2024

Commit

b9dac59

1 Parent(s): c604eb0

test

Files changed (2) hide show

app.py CHANGED Viewed

@@ -2,7 +2,7 @@ import gradio as gr
 from gradio_leaderboard import Leaderboard, SelectColumns, ColumnFilter
 from pathlib import Path
-from utils import LLM_BENCHMARKS_ABOUT_TEXT, LLM_BENCHMARKS_SUBMIT_TEXT, custom_css, jsonl_to_dataframe, add_average_column_to_df, apply_markdown_format_for_columns, submit
@@ -26,6 +26,7 @@ columns_data_type = ["markdown" for i in range(len(leaderboard_df.columns))]
 with gr.Blocks(css=custom_css) as demo:
     gr.Markdown("""
     # Persian LLM Leaderboard
     """)

 from gradio_leaderboard import Leaderboard, SelectColumns, ColumnFilter
 from pathlib import Path
+from utils import LLM_BENCHMARKS_ABOUT_TEXT, LLM_BENCHMARKS_SUBMIT_TEXT, custom_css, jsonl_to_dataframe, add_average_column_to_df, apply_markdown_format_for_columns, submit, PART_LOGO
 with gr.Blocks(css=custom_css) as demo:
+    gr.HTML(PART_LOGO)
     gr.Markdown("""
     # Persian LLM Leaderboard
     """)

utils.py CHANGED Viewed

@@ -114,7 +114,7 @@ LLM_BENCHMARKS_ABOUT_TEXT = f"""
 > The Persian LLM Evaluation Leaderboard, developed by **Part DP AI** in collaboration with **AUT (Amirkabir University of Technology) NLP Lab**, provides a comprehensive benchmarking system specifically designed for Persian LLMs. This leaderboard, based on the open-source [LM Evaluation Harness](https://github.com/EleutherAI/lm-evaluation-harness), offers a unique platform for evaluating the performance of large language models (LLMs) on tasks that demand linguistic proficiency and technical skill in Persian.
-> **Note:** This leaderboard is continuously updating its data and models, reflecting the latest developments in Persian LLMs. It is currently in version 1, serving as the initial benchmark for Persian LLM evaluation, with plans for future enhancements.
 ## 1. Key Features
@@ -172,6 +172,11 @@ LLM_BENCHMARKS_SUBMIT_TEXT = """## Submitting a Model for Evaluation
 """
 def load_jsonl(input_file):
     data = []
     with open(input_file, 'r') as f:

 > The Persian LLM Evaluation Leaderboard, developed by **Part DP AI** in collaboration with **AUT (Amirkabir University of Technology) NLP Lab**, provides a comprehensive benchmarking system specifically designed for Persian LLMs. This leaderboard, based on the open-source [LM Evaluation Harness](https://github.com/EleutherAI/lm-evaluation-harness), offers a unique platform for evaluating the performance of large language models (LLMs) on tasks that demand linguistic proficiency and technical skill in Persian.
+> **Note:** This leaderboard is continuously updating its data and models, reflecting the latest developments in Persian LLMs. It is currently in version 1.0.0, serving as the initial benchmark for Persian LLM evaluation, with plans for future enhancements.
 ## 1. Key Features
 """
+PART_LOGO = """
+<img src="https://avatars.githubusercontent.com/u/39557177?v=4" style="width:30%;display:block;margin-left:auto;margin-right:auto">
+<h1 style="font-size: 28px; margin-bottom: 2px;">Part DP AI</h1>
+"""
 def load_jsonl(input_file):
     data = []
     with open(input_file, 'r') as f: