Spaces:

bofenghuang
/

mt-bench-french-browser

Running

bofenghuang committed on Nov 12, 2024

Commit

c775ae1

verified ·

1 Parent(s): ddff2a6

Update common.py

Files changed (1) hide show

common.py CHANGED Viewed

@@ -623,13 +623,13 @@ def resolve_single_judgment_dict(
     """Return the correct single answer grading judge."""
     if multi_turn:
         if question["category"] in NEED_REF_CATS:
-            return model_judgments_math[("gpt-4", "single-math-v1-multi-turn")]
-        return model_judgments_normal[("gpt-4", "single-v1-multi-turn")]
     if question["category"] in NEED_REF_CATS:
-        return model_judgments_math[("gpt-4", "single-math-v1")]
     else:
-        return model_judgments_normal[("gpt-4", "single-v1")]
 def get_pairwise_judge_explanation(gamekey, judgment_dict):

     """Return the correct single answer grading judge."""
     if multi_turn:
         if question["category"] in NEED_REF_CATS:
+            return model_judgments_math[("gpt-4o-2024-05-13", "single-math-v1-multi-turn")]
+        return model_judgments_normal[("gpt-4o-2024-05-13", "single-v1-multi-turn")]
     if question["category"] in NEED_REF_CATS:
+        return model_judgments_math[("gpt-4o-2024-05-13", "single-math-v1")]
     else:
+        return model_judgments_normal[("gpt-4o-2024-05-13", "single-v1")]
 def get_pairwise_judge_explanation(gamekey, judgment_dict):