Update common.py
Browse files
common.py
CHANGED
|
@@ -623,13 +623,13 @@ def resolve_single_judgment_dict(
|
|
| 623 |
"""Return the correct single answer grading judge."""
|
| 624 |
if multi_turn:
|
| 625 |
if question["category"] in NEED_REF_CATS:
|
| 626 |
-
return model_judgments_math[("gpt-
|
| 627 |
-
return model_judgments_normal[("gpt-
|
| 628 |
|
| 629 |
if question["category"] in NEED_REF_CATS:
|
| 630 |
-
return model_judgments_math[("gpt-
|
| 631 |
else:
|
| 632 |
-
return model_judgments_normal[("gpt-
|
| 633 |
|
| 634 |
|
| 635 |
def get_pairwise_judge_explanation(gamekey, judgment_dict):
|
|
|
|
| 623 |
"""Return the correct single answer grading judge."""
|
| 624 |
if multi_turn:
|
| 625 |
if question["category"] in NEED_REF_CATS:
|
| 626 |
+
return model_judgments_math[("gpt-4o-2024-05-13", "single-math-v1-multi-turn")]
|
| 627 |
+
return model_judgments_normal[("gpt-4o-2024-05-13", "single-v1-multi-turn")]
|
| 628 |
|
| 629 |
if question["category"] in NEED_REF_CATS:
|
| 630 |
+
return model_judgments_math[("gpt-4o-2024-05-13", "single-math-v1")]
|
| 631 |
else:
|
| 632 |
+
return model_judgments_normal[("gpt-4o-2024-05-13", "single-v1")]
|
| 633 |
|
| 634 |
|
| 635 |
def get_pairwise_judge_explanation(gamekey, judgment_dict):
|