Skip to content

Commit 66278e4

Browse files
committed
test
1 parent d998db4 commit 66278e4

File tree

1 file changed

+4
-4
lines changed

1 file changed

+4
-4
lines changed

eval_protocol/benchmarks/test_aime25.py

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -87,17 +87,17 @@ def aime2025_dataset_adapter(rows: List[Dict[str, Any]]) -> List[EvaluationRow]:
 87  87       completion_params=[
 88  88           {
 89  89               "max_tokens": 131000,
 90      -            "extra_body": {"reasoning_effort": "low"},
 91      -            "model": "fireworks_ai/accounts/fireworks/models/gpt-oss-120b",
 92      -            "request_timeout": 1200, # 20 minutes Fireworks timeout
     90  +            # "extra_body": {"reasoning_effort": "low"},
     91  +            "model": "fireworks_ai/accounts/pyroworks/deployedModels/glm-4p6-qpwrimne",
     92  +            "request_timeout": 30,
 93  93           }
 94  94       ],
 95  95       rollout_processor=SingleTurnRolloutProcessor(),
 96  96       aggregation_method="mean",
 97  97       passed_threshold=0.8,
 98  98       num_runs=1,
 99  99       max_dataset_rows=1,
100      -    max_concurrent_rollouts=4,
    100  +    max_concurrent_rollouts=1,
101 101       mode="pointwise",
102 102   )
103 103   def test_aime25_pointwise(row: EvaluationRow) -> EvaluationRow:

0 commit comments

Comments (0)