tohid.abedini
committed on
Commit
·
a8f0c8f
1
Parent(s):
7d525f5
[Add] average to df
Browse files
app.py
CHANGED
@@ -10,7 +10,7 @@ import json
|
|
10 |
import requests
|
11 |
|
12 |
from envs import API, EVAL_REQUESTS_PATH, TOKEN, QUEUE_REPO
|
13 |
-
from utils import LLM_BENCHMARKS_ABOUT_TEXT, LLM_BENCHMARKS_SUBMIT_TEXT, custom_css, jsonl_to_dataframe
|
14 |
|
15 |
|
16 |
|
@@ -108,8 +108,8 @@ base_df = jsonl_to_dataframe(str(abs_path / "leaderboard_base.jsonl"))
|
|
108 |
all_columns = ["Average ⬆️", "Precision", "#Params (B)", "Part Multiple Choice", "ARC Easy", "ARC Challenging", "MMLU Pro", "GSM8k Persian", "Multiple Choice Persian"]
|
109 |
columns_to_average = ["Part Multiple Choice", "ARC Easy", "ARC Challenging", "MMLU Pro", "GSM8k Persian", "Multiple Choice Persian"]
|
110 |
|
111 |
-
persian_df =
|
112 |
-
base_df =
|
113 |
|
114 |
|
115 |
with gr.Blocks(css=custom_css) as demo:
|
|
|
10 |
import requests
|
11 |
|
12 |
from envs import API, EVAL_REQUESTS_PATH, TOKEN, QUEUE_REPO
|
13 |
+
from utils import LLM_BENCHMARKS_ABOUT_TEXT, LLM_BENCHMARKS_SUBMIT_TEXT, custom_css, jsonl_to_dataframe
|
14 |
|
15 |
|
16 |
|
|
|
108 |
all_columns = ["Average ⬆️", "Precision", "#Params (B)", "Part Multiple Choice", "ARC Easy", "ARC Challenging", "MMLU Pro", "GSM8k Persian", "Multiple Choice Persian"]
|
109 |
columns_to_average = ["Part Multiple Choice", "ARC Easy", "ARC Challenging", "MMLU Pro", "GSM8k Persian", "Multiple Choice Persian"]
|
110 |
|
111 |
+
persian_df["Average ⬆️"] = persian_df[columns_to_average].mean(axis=1)
|
112 |
+
base_df["Average ⬆️"] = base_df[columns_to_average].mean(axis=1)
|
113 |
|
114 |
|
115 |
with gr.Blocks(css=custom_css) as demo:
|
utils.py
CHANGED
@@ -149,16 +149,3 @@ def load_jsonl(input_file):
|
|
149 |
def jsonl_to_dataframe(input_file):
|
150 |
data = load_jsonl(input_file)
|
151 |
return pd.DataFrame(data)
|
152 |
-
|
153 |
-
|
154 |
-
def compute_averages(df, columns_to_average):
|
155 |
-
average_metrics = {col: df[col].mean() for col in columns_to_average if col in df}
|
156 |
-
average_metrics["Model"] = "Average ⬆️" # Label the row as "Average"
|
157 |
-
return average_metrics
|
158 |
-
|
159 |
-
def add_average_row_to_df(df, columns_to_average):
|
160 |
-
average_row = compute_averages(df, columns_to_average)
|
161 |
-
average_df = pd.DataFrame([average_row])
|
162 |
-
print(average_df.columns, average_df)
|
163 |
-
df = pd.concat([df, average_df], ignore_index=True)
|
164 |
-
return df
|
|
|
149 |
def jsonl_to_dataframe(input_file):
|
150 |
data = load_jsonl(input_file)
|
151 |
return pd.DataFrame(data)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|