Skip to content

Commit d5f3b81

Browse files
committed
how about 2 and 4
1 parent a26cf02 commit d5f3b81

File tree

2 files changed

+10
-5
lines changed

2 files changed

+10
-5
lines changed

eval_protocol/benchmarks/test_aime25.py

Lines changed: 5 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -93,6 +93,11 @@ def aime2025_dataset_adapter(rows: List[Dict[str, Any]]) -> List[EvaluationRow]:
 93 |  93 |   "extra_body": {"reasoning_effort": "low"},
 94 |  94 |   "model": "fireworks_ai/accounts/fireworks/models/gpt-oss-20b",
 95 |  95 |   },
    |  96 | + {
    |  97 | + "max_tokens": 131000,
    |  98 | + "extra_body": {"reasoning_effort": "medium"},
    |  99 | + "model": "fireworks_ai/accounts/fireworks/models/gpt-oss-20b",
    | 100 | + },
 96 | 101 |   ],
 97 | 102 |   rollout_processor=SingleTurnRolloutProcessor(),
 98 | 103 |   aggregation_method="mean",

eval_protocol/quickstart/llm_judge.py

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -49,11 +49,11 @@
 49 |  49 |   "extra_body": {"reasoning_effort": "low"},
 50 |  50 |   "model": "fireworks_ai/accounts/fireworks/models/gpt-oss-20b",
 51 |  51 |   },
 52 |     | - {
 53 |     | - "max_tokens": 131000,
 54 |     | - "extra_body": {"reasoning_effort": "low"},
 55 |     | - "model": "fireworks_ai/accounts/fireworks/models/gpt-oss-120b",
 56 |     | - },
    |  52 | + # {
    |  53 | + # "max_tokens": 131000,
    |  54 | + # "extra_body": {"reasoning_effort": "low"},
    |  55 | + # "model": "fireworks_ai/accounts/fireworks/models/gpt-oss-120b",
    |  56 | + # },
 57 |  57 |   ],
 58 |  58 |   rollout_processor=SingleTurnRolloutProcessor(),
 59 |  59 |   # preprocess_fn=split_multi_turn_rows,

0 commit comments

Comments
 (0)