tohid.abedini committed on
Commit
17c1bbe
·
1 Parent(s): 54fdeab

[Add] first phase of changes

Browse files
app.py CHANGED
@@ -10,6 +10,7 @@ import json
10
  import requests
11
 
12
  from envs import API, EVAL_REQUESTS_PATH, TOKEN, QUEUE_REPO
 
13
 
14
 
15
  def fill_form(model_name, model_id, contact_email, challenge, submission_id, paper_link, architecture, license):
@@ -39,7 +40,7 @@ def fill_form(model_name, model_id, contact_email, challenge, submission_id, pap
39
 
40
  def sendForm(url, data):
41
  try:
42
- requests.post(url, data = data)
43
  print("Submitted successfully!")
44
  except:
45
  print("Error!")
@@ -99,68 +100,48 @@ def submit(model_name, model_id, contact_email, challenge, submission_id, paper_
99
  abs_path = Path(__file__).parent
100
 
101
  # Any pandas-compatible data
102
- pinder_df = pd.read_json(str(abs_path / "leaderboard_pinder.json"))
103
- plinder_df = pd.read_json(str(abs_path / "leaderboard_plinder.json"))
104
 
105
- with gr.Blocks() as demo:
106
  gr.Markdown("""
107
- # MLSB 2024 Leaderboard
108
  """)
109
 
110
 
111
- with gr.Tab("🎖️ PINDER Leaderboard"):
112
- gr.Markdown("""## PINDER Leaderboard
113
- Evaluating Protein-Protein interaction prediction
114
  """)
115
  Leaderboard(
116
- value=pinder_df,
117
  select_columns=["Arch", "Model", "L_rms", "I_rms",
118
  "F_nat", "DOCKQ", "CAPRI"],
119
  search_columns=["model_name_for_query"],
120
  hide_columns=["model_name_for_query",],
121
  filter_columns=["Arch"],
122
  )
123
- with gr.Tab("🥇 PLINDER Leaderboard"):
124
- gr.Markdown("""## PLINDER Leaderboard
125
  Evaluating Protein-Ligand prediction
126
  """)
127
  Leaderboard(
128
- value=plinder_df,
129
  select_columns=["Arch", "Model", "Mean lDDT-PLI", "Mean lDDT-LP",
130
  "Median RMSD", "% lDDT-PLI >= 0.5", "% pass PoseBusters"],
131
  search_columns=["model_name_for_query"],
132
  hide_columns=["model_name_for_query",],
133
  filter_columns=["Arch"],
134
  )
 
 
 
135
  with gr.Tab("✉️ Submit"):
136
- gr.Markdown("""## Submit your model
137
- Submit your model to the leaderboard using the below form AFTER following the following steps:
138
- - Create a HuggingFace account and request to join the [MLSB organization](https://huggingface.co/MLSB)
139
- - Create a new space in the MLSB organization and add your model using the inference templates: https://huggingface.co/new-space?owner=MLSB
140
- - Fill the submission form.
141
-
142
- ## Prerequisites:
143
- To qualify for submission, each team must:
144
- - Provide an MLSB submission ID (find it on CMT) or a link to a preprint/paper describing their methodology. This publication does not have to specifically report training or evaluation on the P(L)INDER dataset. Previously published methods, such as DiffDock, only need to link their existing paper. Note that entry into this competition does not equate to an MLSB workshop paper submission.
145
- - Create a copy of the provided [inference templates](https://huggingface.co/MLSB/).
146
- - Go to the top right corner of the page of the respective inference template and click on the drop-down menu (vertical ellipsis) right next to the “Community”, then select “Duplicate this space”.
147
- - Change files in the newly create space to reflect the peculiarities of your model
148
- - Edit `requirements.txt` to capture all python dependencies.
149
- - Modify the Dockerfile as appropriate (including selecting the right base image)
150
- - Include a `inference_app.py` file. This contains a `predict` function that should be modified to reflect the specifics of inference using their model.
151
- - Include a `train.py` file to ensure that training and model selection use only the PINDER/PLINDER datasets and to clearly show any additional hyperparameters used.
152
- - Provide a LICENSE file that allows for reuse, derivative works, and distribution of the provided software and weights (e.g., MIT or Apache2 license).
153
- - Submit to the leaderboard via the [form below](https://huggingface.co/spaces/MLSB/leaderboard2024).
154
- - On submission page, add reference to the newly created space in the format username/space (e.g mlsb/alphafold3). You can create the space on your personal Huggingface account and transfer it to MLSB for the submission to get a GPU assigned.
155
-
156
- After a brief technical review by our organizers we will grant you a free GPU until MLSB so that anyone can play with the model and we will run the evaluation.
157
-
158
- If you have a questions please email: [email protected]
159
- """)
160
  model_name = gr.Textbox(label="Model name")
161
  model_id = gr.Textbox(label="username/space e.g mlsb/alphafold3")
162
  contact_email = gr.Textbox(label="Contact E-Mail")
163
- challenge = gr.Radio(choices=["PINDER", "PLINDER"],label="Challenge")
164
  gr.Markdown("Either give a submission id if you submitted to the MLSB workshop or provide a link to the preprint/paper describing the method.")
165
  with gr.Row():
166
  submission_id = gr.Textbox(label="Submission ID on CMT")
 
10
  import requests
11
 
12
  from envs import API, EVAL_REQUESTS_PATH, TOKEN, QUEUE_REPO
13
+ from utils import LLM_BENCHMARKS_ABOUT_TEXT, LLM_BENCHMARKS_SUBMIT_TEXT, custom_css
14
 
15
 
16
  def fill_form(model_name, model_id, contact_email, challenge, submission_id, paper_link, architecture, license):
 
40
 
41
  def sendForm(url, data):
42
  try:
43
+ requests.post(url, data=data)
44
  print("Submitted successfully!")
45
  except:
46
  print("Error!")
 
100
  abs_path = Path(__file__).parent
101
 
102
  # Any pandas-compatible data
103
+ persian_df = pd.read_json(str(abs_path / "leaderboard_persian.json"))
104
+ base_df = pd.read_json(str(abs_path / "leaderboard_base.json"))
105
 
106
+ with gr.Blocks(css=custom_css) as demo:
107
  gr.Markdown("""
108
+ # Part LLM Leaderboard
109
  """)
110
 
111
 
112
+ with gr.Tab("🎖️ Persian Leaderboard"):
113
+ gr.Markdown("""## Persian LLM Leaderboard
114
+ Evaluating Persian Fine-Tuned models
115
  """)
116
  Leaderboard(
117
+ value=persian_df,
118
  select_columns=["Arch", "Model", "L_rms", "I_rms",
119
  "F_nat", "DOCKQ", "CAPRI"],
120
  search_columns=["model_name_for_query"],
121
  hide_columns=["model_name_for_query",],
122
  filter_columns=["Arch"],
123
  )
124
+ with gr.Tab("🥇 Base Leaderboard"):
125
+ gr.Markdown("""## Base Leaderboard
126
  Evaluating Protein-Ligand prediction
127
  """)
128
  Leaderboard(
129
+ value=base_df,
130
  select_columns=["Arch", "Model", "Mean lDDT-PLI", "Mean lDDT-LP",
131
  "Median RMSD", "% lDDT-PLI >= 0.5", "% pass PoseBusters"],
132
  search_columns=["model_name_for_query"],
133
  hide_columns=["model_name_for_query",],
134
  filter_columns=["Arch"],
135
  )
136
+ with gr.TabItem("📝 About"):
137
+ gr.Markdown(LLM_BENCHMARKS_ABOUT_TEXT)
138
+
139
  with gr.Tab("✉️ Submit"):
140
+ gr.Markdown(LLM_BENCHMARKS_SUBMIT_TEXT)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
141
  model_name = gr.Textbox(label="Model name")
142
  model_id = gr.Textbox(label="username/space e.g mlsb/alphafold3")
143
  contact_email = gr.Textbox(label="Contact E-Mail")
144
+ challenge = gr.Radio(choices=["Persian", "Base"],label="Challenge")
145
  gr.Markdown("Either give a submission id if you submitted to the MLSB workshop or provide a link to the preprint/paper describing the method.")
146
  with gr.Row():
147
  submission_id = gr.Textbox(label="Submission ID on CMT")
envs.py CHANGED
@@ -6,12 +6,12 @@ from huggingface_hub import HfApi
6
  # ----------------------------------
7
  TOKEN = os.environ.get("HF_TOKEN") # A read/write token for your org
8
 
9
- OWNER = "MLSB" # Change to your org - don't forget to create a results and request dataset, with the correct format!
10
  # ----------------------------------
11
 
12
- REPO_ID = f"{OWNER}/leaderboard2024"
13
- QUEUE_REPO = f"{OWNER}/requests"
14
- RESULTS_REPO = f"{OWNER}/results"
15
 
16
  # If you setup a cache later, just change HF_HOME
17
  CACHE_PATH=os.getenv("HF_HOME", ".")
 
6
  # ----------------------------------
7
  TOKEN = os.environ.get("HF_TOKEN") # A read/write token for your org
8
 
9
+ OWNER = "PartAI" # Change to your org - don't forget to create a results and request dataset, with the correct format!
10
  # ----------------------------------
11
 
12
+ REPO_ID = f"{OWNER}/llm-leaderboard-2"
13
+ QUEUE_REPO = f"{OWNER}/leaderboard-requests"
14
+ RESULTS_REPO = f"{OWNER}/leaderboard-results"
15
 
16
  # If you setup a cache later, just change HF_HOME
17
  CACHE_PATH=os.getenv("HF_HOME", ".")
leaderboard_plinder.json → leaderboard_base.json RENAMED
File without changes
leaderboard_pinder.json → leaderboard_persian.json RENAMED
File without changes
utils.py ADDED
@@ -0,0 +1,135 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ custom_css = """
2
+ @import url('https://fonts.googleapis.com/css2?family=Vazirmatn&display=swap');
3
+ body, .gradio-container, .gr-button, .gr-input, .gr-slider, .gr-dropdown, .gr-markdown {
4
+ font-family: 'Vazirmatn', sans-serif !important;
5
+ }
6
+
7
+ .markdown-text {
8
+ font-size: 16px !important;
9
+ }
10
+
11
+ #models-to-add-text {
12
+ font-size: 18px !important;
13
+ }
14
+
15
+ #citation-button span {
16
+ font-size: 16px !important;
17
+ }
18
+
19
+ #citation-button textarea {
20
+ font-size: 16px !important;
21
+ }
22
+
23
+ #citation-button > label > button {
24
+ margin: 6px;
25
+ transform: scale(1.3);
26
+ }
27
+
28
+ #leaderboard-table {
29
+ margin-top: 15px
30
+ }
31
+
32
+ #leaderboard-table-lite {
33
+ margin-top: 15px
34
+ }
35
+
36
+ #search-bar-table-box > div:first-child {
37
+ background: none;
38
+ border: none;
39
+ }
40
+
41
+ #search-bar {
42
+ padding: 0px;
43
+ }
44
+
45
+ /* Limit the width of the first AutoEvalColumn so that names don't expand too much */
46
+ #leaderboard-table td:nth-child(2),
47
+ #leaderboard-table th:nth-child(2) {
48
+ max-width: 400px;
49
+ overflow: auto;
50
+ white-space: nowrap;
51
+ }
52
+
53
+ .tab-buttons button {
54
+ font-size: 20px;
55
+ }
56
+
57
+ #scale-logo {
58
+ border-style: none !important;
59
+ box-shadow: none;
60
+ display: block;
61
+ margin-left: auto;
62
+ margin-right: auto;
63
+ max-width: 600px;
64
+ }
65
+
66
+ #scale-logo .download {
67
+ display: none;
68
+ }
69
+ #filter_type{
70
+ border: 0;
71
+ padding-left: 0;
72
+ padding-top: 0;
73
+ }
74
+ #filter_type label {
75
+ display: flex;
76
+ }
77
+ #filter_type label > span{
78
+ margin-top: var(--spacing-lg);
79
+ margin-right: 0.5em;
80
+ }
81
+ #filter_type label > .wrap{
82
+ width: 103px;
83
+ }
84
+ #filter_type label > .wrap .wrap-inner{
85
+ padding: 2px;
86
+ }
87
+ #filter_type label > .wrap .wrap-inner input{
88
+ width: 1px
89
+ }
90
+ #filter-columns-type{
91
+ border:0;
92
+ padding:0.5;
93
+ }
94
+ #filter-columns-size{
95
+ border:0;
96
+ padding:0.5;
97
+ }
98
+ #box-filter > .form{
99
+ border: 0
100
+ }
101
+ """
102
+
103
+ LLM_BENCHMARKS_ABOUT_TEXT = f"""
104
+ ## How it works
105
+
106
+ ## Reproducibility
107
+ To reproduce our results, here are the commands you can run:
108
+
109
+ """
110
+
111
+
112
+ LLM_BENCHMARKS_SUBMIT_TEXT = """## Submit your model
113
+ Submit your model to the leaderboard using the below form AFTER completing the following steps:
114
+ - Create a HuggingFace account and request to join the [MLSB organization](https://huggingface.co/MLSB)
115
+ - Create a new space in the MLSB organization and add your model using the inference templates: https://huggingface.co/new-space?owner=MLSB
116
+ - Fill the submission form.
117
+
118
+ ## Prerequisites:
119
+ To qualify for submission, each team must:
120
+ - Provide an MLSB submission ID (find it on CMT) or a link to a preprint/paper describing their methodology. This publication does not have to specifically report training or evaluation on the P(L)INDER dataset. Previously published methods, such as DiffDock, only need to link their existing paper. Note that entry into this competition does not equate to an MLSB workshop paper submission.
121
+ - Create a copy of the provided [inference templates](https://huggingface.co/MLSB/).
122
+ - Go to the top right corner of the page of the respective inference template and click on the drop-down menu (vertical ellipsis) right next to the “Community”, then select “Duplicate this space”.
123
+ - Change files in the newly created space to reflect the peculiarities of your model
124
+ - Edit `requirements.txt` to capture all python dependencies.
125
+ - Modify the Dockerfile as appropriate (including selecting the right base image)
126
+ - Include an `inference_app.py` file. This contains a `predict` function that should be modified to reflect the specifics of inference using your model.
127
+ - Include a `train.py` file to ensure that training and model selection use only the Persian/Base datasets and to clearly show any additional hyperparameters used.
128
+ - Provide a LICENSE file that allows for reuse, derivative works, and distribution of the provided software and weights (e.g., MIT or Apache2 license).
129
+ - Submit to the leaderboard via the [form below](https://huggingface.co/spaces/MLSB/leaderboard2024).
130
+ - On submission page, add reference to the newly created space in the format username/space (e.g mlsb/alphafold3). You can create the space on your personal Huggingface account and transfer it to MLSB for the submission to get a GPU assigned.
131
+
132
+ After a brief technical review by our organizers we will grant you a free GPU until MLSB so that anyone can play with the model and we will run the evaluation.
133
+
134
+ If you have any questions, please email: [email protected]
135
+ """