Spaces:
Sleeping
Sleeping
bofenghuang
committed on
Commit
•
c775ae1
1
Parent(s):
ddff2a6
Update common.py
Browse files
common.py
CHANGED
@@ -623,13 +623,13 @@ def resolve_single_judgment_dict(
|
|
623 |
"""Return the correct single answer grading judge."""
|
624 |
if multi_turn:
|
625 |
if question["category"] in NEED_REF_CATS:
|
626 |
-
return model_judgments_math[("gpt-
|
627 |
-
return model_judgments_normal[("gpt-
|
628 |
|
629 |
if question["category"] in NEED_REF_CATS:
|
630 |
-
return model_judgments_math[("gpt-
|
631 |
else:
|
632 |
-
return model_judgments_normal[("gpt-
|
633 |
|
634 |
|
635 |
def get_pairwise_judge_explanation(gamekey, judgment_dict):
|
|
|
623 |
"""Return the correct single answer grading judge."""
|
624 |
if multi_turn:
|
625 |
if question["category"] in NEED_REF_CATS:
|
626 |
+
return model_judgments_math[("gpt-4o-2024-05-13", "single-math-v1-multi-turn")]
|
627 |
+
return model_judgments_normal[("gpt-4o-2024-05-13", "single-v1-multi-turn")]
|
628 |
|
629 |
if question["category"] in NEED_REF_CATS:
|
630 |
+
return model_judgments_math[("gpt-4o-2024-05-13", "single-math-v1")]
|
631 |
else:
|
632 |
+
return model_judgments_normal[("gpt-4o-2024-05-13", "single-v1")]
|
633 |
|
634 |
|
635 |
def get_pairwise_judge_explanation(gamekey, judgment_dict):
|