Spaces:

T145
/

open-llm-leaderboard-results-to-modelcard

Running

T145 committed 21 days ago

Commit

190123d

1 Parent(s): 5ef372e

Use official test keys

Files changed (1) hide show

functions.py CHANGED Viewed

@@ -21,12 +21,14 @@ The purpose of this PR is to add evaluation results from the Open LLM Leaderboar
 Please report any issues here: https://huggingface.co/spaces/T145/open-llm-leaderboard-results-to-modelcard/discussions"""
 KEY_IFEVAL = "IFEval"
 KEY_BBH = "BBH"
 KEY_MATH = "MATH Lvl 5"
 KEY_GPQA = "GPQA"
-KEY_MUSR = "MuSR"
-KEY_MMLU = "MMLU-Pro"
 def normalize_within_range(value, lower_bound=0, higher_bound=1):
     return (np.clip(value - lower_bound, 0, None)) / (higher_bound - lower_bound) * 100

 Please report any issues here: https://huggingface.co/spaces/T145/open-llm-leaderboard-results-to-modelcard/discussions"""
+# Keys are named after the backend keys
+# https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard/blob/main/backend/README.md#leaderboard
 KEY_IFEVAL = "IFEval"
 KEY_BBH = "BBH"
 KEY_MATH = "MATH Lvl 5"
 KEY_GPQA = "GPQA"
+KEY_MUSR = "MUSR"
+KEY_MMLU = "MMLU-PRO"
 def normalize_within_range(value, lower_bound=0, higher_bound=1):
     return (np.clip(value - lower_bound, 0, None)) / (higher_bound - lower_bound) * 100