diff --git a/fastchat/llm_judge/gen_judgment.py b/fastchat/llm_judge/gen_judgment.py
index d2d7617c6..23d371883 100644
--- a/fastchat/llm_judge/gen_judgment.py
+++ b/fastchat/llm_judge/gen_judgment.py
@@ -154,15 +154,6 @@ def make_judge_single(judge_model, judge_prompts):
     judges = {}
     judges["default"] = Judge(judge_model, judge_prompts["single-v1"])
     judges["math"] = Judge(judge_model, judge_prompts["single-math-v1"], ref_based=True)
-    judges["default-mt"] = Judge(
-        judge_model, judge_prompts["single-v1-multi-turn"], multi_turn=True
-    )
-    judges["math-mt"] = Judge(
-        judge_model,
-        judge_prompts["single-math-v1-multi-turn"],
-        ref_based=True,
-        multi_turn=True,
-    )
     return judges
 
 