Skip to content

Commit 684131d

Browse files
committed
update
1 parent 25dff74 commit 684131d

1 file changed

Lines changed: 2 additions & 2 deletions

File tree

eval_protocol/benchmarks/test_aime25.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -90,8 +90,8 @@ def aime2025_dataset_adapter(rows: List[Dict[str, Any]]) -> List[EvaluationRow]:
90 | 90 |   rollout_processor=SingleTurnRolloutProcessor(),
91 | 91 |   aggregation_method="mean",
92 | 92 |   passed_threshold=0.8,
93 |    | - num_runs=8,
94 |    | - max_concurrent_rollouts=4,
   | 93 | + num_runs=2,
   | 94 | + max_concurrent_rollouts=16,
95 | 95 |   mode="pointwise",
96 | 96 |   )
97 | 97 |   def test_aime25_pointwise(row: EvaluationRow) -> EvaluationRow:

0 commit comments

Comments (0)