We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 6324f38, commit 25dff74 (Copy full SHA for 25dff74)
1 file changed
eval_protocol/benchmarks/test_aime25.py
@@ -91,7 +91,6 @@ def aime2025_dataset_adapter(rows: List[Dict[str, Any]]) -> List[EvaluationRow]:
91
aggregation_method="mean",
92
passed_threshold=0.8,
93
num_runs=8,
94
- max_dataset_rows=2,
95
max_concurrent_rollouts=4,
96
mode="pointwise",
97
)
0 commit comments