open_pt_llm_leaderboard

Restarting on CPU Upgrade

eduagarcia committed on Apr 21

Commit

f49e1e5

•

2 Parent(s): a3b0a0f 77a5f61

Merge branch 'main' of https://huggingface.co/spaces/eduagarcia/open_pt_llm_leaderboard

Files changed (3) hide show

app.py CHANGED Viewed

@@ -62,7 +62,8 @@ from src.tools.plots import (
 def restart_space():
     print("Running Restart")
     try:
-        API.restart_space(repo_id=REPO_ID, token=H4_TOKEN)
     except:
         print("Restart failed")

 def restart_space():
     print("Running Restart")
     try:
+        #API.restart_space(repo_id=REPO_ID, token=H4_TOKEN)
+        pass
     except:
         print("Restart failed")

proprietary_models_results.json CHANGED Viewed

@@ -103,5 +103,26 @@
         },
         "result_metrics_average": 0.6993914868794414,
         "result_metrics_npm": 0.551208000273598
     }
 ]

         },
         "result_metrics_average": 0.6993914868794414,
         "result_metrics_npm": 0.551208000273598
+    },
+    {
+        "model": "gemini-1.5-pro-preview-0409",
+        "name": "Gemini 1.5 Pro Preview (0409)",
+        "link": "https://cloud.google.com/vertex-ai",
+        "date": "2024-04-15",
+        "status": "full",
+        "main_language": "English",
+        "result_metrics": {
+            "enem_challenge": 0.8509447165850245,
+            "bluex": 0.7719054242002782,
+            "oab_exams": 0.6888382687927107,
+            "assin2_sts": 0.8159702278408203,
+            "assin2_rte": 0.9328989988467518,
+            "faquad_nli": 0.7290756302521009,
+            "hatebr_offensive": 0.8697698647467024,
+            "portuguese_hate_speech": 0.7539414414414414,
+            "tweetsentbr": 0.772785080895884
+        },
+        "result_metrics_average": 0.7984588504001905,
+        "result_metrics_npm": 0.6908188311933006
     }
 ]

src/display/about.py CHANGED Viewed

@@ -24,6 +24,11 @@ The leaderboard's backend runs on a [fork](https://github.com/eduagarcia/lm-eval
 {SUPPORT_DESCRIPTION}
 """
 task_count = 0
 TASKS_LIST= ""
 for task in Tasks:
@@ -104,7 +109,17 @@ To get more information about quantization, see:
 ## Useful links
 - [Community resources](https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard/discussions/174)
-- [Collection of best models](https://huggingface.co/collections/{PATH_TO_COLLECTION})
 """
 REMOTE_CODE_EXAPLANATION = f"- *Yes.*"

 {SUPPORT_DESCRIPTION}
 """
+CITATION_TEXT = ""
+if 'citation' in TASK_CONFIG['readme']:
+      CITATION_TEXT += TASK_CONFIG['readme']['citation']
 task_count = 0
 TASKS_LIST= ""
 for task in Tasks:
 ## Useful links
 - [Community resources](https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard/discussions/174)
+- [Collection of best models](https://huggingface.co/collections/{PATH_TO_COLLECTION})
+"""
+if CITATION_TEXT:
+    ABOUT_DESCRIPTION_CONTEXT += f"""
+    ## Citation
+    ```bibtex
+    {CITATION_TEXT}
+    ```
 """
 REMOTE_CODE_EXAPLANATION = f"- *Yes.*"