We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent f357065 commit 088dea6 (Copy full SHA for 088dea6)
eval_protocol/quickstart/llm_judge.py
@@ -64,6 +64,8 @@ def aime2025_dataset_adapter(rows: List[Dict[str, Any]]) -> List[EvaluationRow]:
64
],
65
rollout_processor=SingleTurnRolloutProcessor(),
66
# preprocess_fn=split_multi_turn_rows,
67
+ num_runs=1,
68
+ max_dataset_rows=1,
69
max_concurrent_rollouts=64,
70
mode="pointwise",
71
)
0 commit comments