Spaces:

opll-org
/

Open-Persian-LLM-Leaderboard

Running

tohid.abedini committed on Nov 14, 2024

Commit

e72de6c

1 Parent(s): 17c1bbe

[Add] 2nd phase of changes

Files changed (3) hide show

app.py CHANGED Viewed

@@ -108,30 +108,27 @@ with gr.Blocks(css=custom_css) as demo:
     # Part LLM Leaderboard
     """)
     with gr.Tab("🎖️ Persian Leaderboard"):
         gr.Markdown("""## Persian LLM Leaderboard
                 Evaluating Persian Fine-Tuned models
                 """)
         Leaderboard(
         value=persian_df,
-        select_columns=["Arch", "Model", "L_rms", "I_rms",
-            "F_nat", "DOCKQ", "CAPRI"],
         search_columns=["model_name_for_query"],
         hide_columns=["model_name_for_query",],
-        filter_columns=["Arch"],
     )
     with gr.Tab("🥇 Base Leaderboard"):
-        gr.Markdown("""## Base Leaderboard
-                Evaluating Protein-Ligand prediction
                 """)
         Leaderboard(
         value=base_df,
-        select_columns=["Arch", "Model", "Mean lDDT-PLI", "Mean lDDT-LP",
-                        "Median RMSD", "% lDDT-PLI >= 0.5", "% pass PoseBusters"],
         search_columns=["model_name_for_query"],
         hide_columns=["model_name_for_query",],
-        filter_columns=["Arch"],
     )
     with gr.TabItem("📝 About"):
         gr.Markdown(LLM_BENCHMARKS_ABOUT_TEXT)

     # Part LLM Leaderboard
     """)
     with gr.Tab("🎖️ Persian Leaderboard"):
         gr.Markdown("""## Persian LLM Leaderboard
                 Evaluating Persian Fine-Tuned models
                 """)
         Leaderboard(
         value=persian_df,
+        select_columns=["Model", "Precision", "#Params (B)", "Part Multiple Choice", "ARC Easy", "ARC Challenging", "MMLU Pro", "GSM8k Persian", "Multiple Choice Persian"],
         search_columns=["model_name_for_query"],
         hide_columns=["model_name_for_query",],
+        filter_columns=["Precision", "#Params (B)"],
     )
     with gr.Tab("🥇 Base Leaderboard"):
+        gr.Markdown("""## Base LLM Leaderboard
+                Evaluating Base Models
                 """)
         Leaderboard(
         value=base_df,
+        select_columns=["Model", "Precision", "#Params (B)", "Part Multiple Choice", "ARC Easy", "ARC Challenging", "MMLU Pro", "GSM8k Persian", "Multiple Choice Persian"],
         search_columns=["model_name_for_query"],
         hide_columns=["model_name_for_query",],
+        filter_columns=["Precision", "#Params (B)"],
     )
     with gr.TabItem("📝 About"):
         gr.Markdown(LLM_BENCHMARKS_ABOUT_TEXT)

leaderboard_base.json CHANGED Viewed

	@@ -1 +1,38 @@
1	- {"Arch":{"0":"GNN"},"Model":{"0":"example/example"},"Mean lDDT-PLI":{"0":0.2}, "Mean lDDT-LP":{"0":0.8}, "Median RMSD":{"0":5.78}, "% lDDT-PLI >= 0.5":{"0":20.78}, "% pass PoseBusters":{"0":58.47},"Runtime":{"0":"2 +-0.2"},"Hub License":{"0":"apache-2.0"},"#Params (B)":{"0":72.29},"Model sha":{"0":"fda5cf998a0f2d89b53b5fa490793e3e50bb8239"},"model_name_for_query":{"0":"example/example"}}

+{
+  "Arch": {
+    "0": "GNN"
+  },
+  "Model": {
+    "0": "example/example"
+  },
+  "Mean lDDT-PLI": {
+    "0": 0.2
+  },
+  "Mean lDDT-LP": {
+    "0": 0.8
+  },
+  "Median RMSD": {
+    "0": 5.78
+  },
+  "% lDDT-PLI >= 0.5": {
+    "0": 20.78
+  },
+  "% pass PoseBusters": {
+    "0": 58.47
+  },
+  "Runtime": {
+    "0": "2 +-0.2"
+  },
+  "Hub License": {
+    "0": "apache-2.0"
+  },
+  "#Params (B)": {
+    "0": 72.29
+  },
+  "Model sha": {
+    "0": "fda5cf998a0f2d89b53b5fa490793e3e50bb8239"
+  },
+  "model_name_for_query": {
+    "0": "example/example"
+  }
+}

leaderboard_persian.json CHANGED Viewed

	@@ -1 +1,38 @@
1	- {"Arch":{"0":"GNN"},"Model":{"0":"example/example"},"L_rms":{"0":81.22},"I_rms":{"0":79.78},"F_nat":{"0":91.15},"DOCKQ":{"0":77.95},"CAPRI":{"0":74.5},"Runtime":{"0":"2 +-0.2"},"Hub License":{"0":"apache-2.0"},"#Params (B)":{"0":72.29},"Model sha":{"0":"fda5cf998a0f2d89b53b5fa490793e3e50bb8239"},"model_name_for_query":{"0":"example/example"}}

+{
+  "Arch": {
+    "0": "GNN"
+  },
+  "Model": {
+    "0": "example/example"
+  },
+  "L_rms": {
+    "0": 81.22
+  },
+  "I_rms": {
+    "0": 79.78
+  },
+  "F_nat": {
+    "0": 91.15
+  },
+  "DOCKQ": {
+    "0": 77.95
+  },
+  "CAPRI": {
+    "0": 74.5
+  },
+  "Runtime": {
+    "0": "2 +-0.2"
+  },
+  "Hub License": {
+    "0": "apache-2.0"
+  },
+  "#Params (B)": {
+    "0": 72.29
+  },
+  "Model sha": {
+    "0": "fda5cf998a0f2d89b53b5fa490793e3e50bb8239"
+  },
+  "model_name_for_query": {
+    "0": "example/example"
+  }
+}