Spaces: Running on CPU Upgrade
Update src/display_models/read_results.py
Browse files
src/display_models/read_results.py
CHANGED
@@ -11,7 +11,7 @@ from src.display_models.utils import AutoEvalColumn, make_clickable_model
|
|
11 |
|
12 |
# 현우 - ko_commongen_v2 : acc_norm인지 체크 필요함
|
13 |
METRICS = ["acc_norm", "acc_norm", "acc", "mc2", "acc_norm"]
|
14 |
-
BENCHMARKS = ["ko_arc_challenge", "ko_hellaswag", "ko_mmlu", "ko_truthfulqa_mc", "
|
15 |
BENCH_TO_NAME = {
|
16 |
"ko_arc_challenge": AutoEvalColumn.arc.name,
|
17 |
"ko_hellaswag": AutoEvalColumn.hellaswag.name,
|
|
|
11 |
|
12 |
# 현우 - ko_commongen_v2 : acc_norm인지 체크 필요함
|
13 |
METRICS = ["acc_norm", "acc_norm", "acc", "mc2", "acc_norm"]
|
14 |
+
BENCHMARKS = ["ko_arc_challenge", "ko_hellaswag", "ko_mmlu", "ko_truthfulqa_mc", "ko_commongen_v2"] #, "ethicalverification"]
|
15 |
BENCH_TO_NAME = {
|
16 |
"ko_arc_challenge": AutoEvalColumn.arc.name,
|
17 |
"ko_hellaswag": AutoEvalColumn.hellaswag.name,
|