bofenghuang committed on
Commit
c775ae1
1 Parent(s): ddff2a6

Update common.py

Browse files
Files changed (1) hide show
  1. common.py +4 -4
common.py CHANGED
@@ -623,13 +623,13 @@ def resolve_single_judgment_dict(
623
  """Return the correct single answer grading judge."""
624
  if multi_turn:
625
  if question["category"] in NEED_REF_CATS:
626
- return model_judgments_math[("gpt-4", "single-math-v1-multi-turn")]
627
- return model_judgments_normal[("gpt-4", "single-v1-multi-turn")]
628
 
629
  if question["category"] in NEED_REF_CATS:
630
- return model_judgments_math[("gpt-4", "single-math-v1")]
631
  else:
632
- return model_judgments_normal[("gpt-4", "single-v1")]
633
 
634
 
635
  def get_pairwise_judge_explanation(gamekey, judgment_dict):
 
623
  """Return the correct single answer grading judge."""
624
  if multi_turn:
625
  if question["category"] in NEED_REF_CATS:
626
+ return model_judgments_math[("gpt-4o-2024-05-13", "single-math-v1-multi-turn")]
627
+ return model_judgments_normal[("gpt-4o-2024-05-13", "single-v1-multi-turn")]
628
 
629
  if question["category"] in NEED_REF_CATS:
630
+ return model_judgments_math[("gpt-4o-2024-05-13", "single-math-v1")]
631
  else:
632
+ return model_judgments_normal[("gpt-4o-2024-05-13", "single-v1")]
633
 
634
 
635
  def get_pairwise_judge_explanation(gamekey, judgment_dict):