Skip to content

Commit 43cabb7

Browse files
committed
[Create PR]:
- Remove --use_lmeval_batching arg
1 parent 6c3cb22 commit 43cabb7

1 file changed

Lines changed: 5 additions & 16 deletions

File tree

examples/mmlu_benchmark/mmlu_benchmark.py

Lines changed: 5 additions & 16 deletions
Original file line number | Diff line number | Diff line change
@@ -161,11 +161,6 @@ def parse_args():
161161
default=None,
162162
help="Pad predictions to this size with -inf (default: no padding, disco-public uses 31)",
163163
)
164-
parser.add_argument(
165-
"--use_lmeval_batching",
166-
action="store_true",
167-
help="Use lm-evaluation-harness batching for exact numerical match. This batches ALL requests together before computing logprobs.",
168-
)
169164

170165
return parser.parse_args()
171166

@@ -564,7 +559,7 @@ def _resolve_data_path(data_path: str) -> str:
564559

565560

566561
def _apply_eval_config_from_repo(repo_path: Path, args: "argparse.Namespace") -> None:
567-
"""Load eval_config from repo; forbid passing --pca/--pad_to_size/--use_lmeval_batching, then set args from eval_config."""
562+
"""Load eval_config from repo; forbid passing --pca/--pad_to_size, then set args from eval_config."""
568563
config_path = repo_path / DISCO_CONFIG_FILENAME
569564
if not config_path.exists():
570565
return
@@ -579,8 +574,6 @@ def _apply_eval_config_from_repo(repo_path: Path, args: "argparse.Namespace") ->
579574
errors.append(f"do not pass --pca (model uses pca={eval_config['pca']})")
580575
if "pad_to_size" in eval_config and args.pad_to_size is not None:
581576
errors.append(f"do not pass --pad_to_size (model uses pad_to_size={eval_config['pad_to_size']})")
582-
if "use_lmeval_batching" in eval_config and args.use_lmeval_batching:
583-
errors.append("do not pass --use_lmeval_batching (model uses use_lmeval_batching=True)")
584577
if errors:
585578
raise ValueError("When using a DISCO model from the Hub, " + "; ".join(errors) + ". Omit these flags to use the model's eval_config.")
586579
# Require data_path to match model config (use_full_prompt is always True)
@@ -592,8 +585,6 @@ def _apply_eval_config_from_repo(repo_path: Path, args: "argparse.Namespace") ->
592585
args.pca = eval_config["pca"]
593586
if "pad_to_size" in eval_config:
594587
args.pad_to_size = eval_config["pad_to_size"]
595-
if "use_lmeval_batching" in eval_config:
596-
args.use_lmeval_batching = eval_config["use_lmeval_batching"]
597588

598589

599590
def _resolve_hf_disco_repo(
@@ -700,12 +691,10 @@ def main():
700691
num_workers=args.num_workers,
701692
)
702693

703-
# Optionally precompute logprobs using lm-eval batching for exact match
704-
if args.use_lmeval_batching:
705-
print("\nPrecomputing logprobs using lm-eval batching ...")
706-
# Get task list for precomputation
707-
task_list = list(tasks._anchor_tasks if hasattr(tasks, "_anchor_tasks") else tasks._tasks)
708-
benchmark.precompute_all_logprobs_lmeval(task_list)
694+
# Precompute logprobs using lm-eval batching for exact numerical match
695+
print("\nPrecomputing logprobs using lm-eval batching ...")
696+
task_list = list(tasks._anchor_tasks if hasattr(tasks, "_anchor_tasks") else tasks._tasks)
697+
benchmark.precompute_all_logprobs_lmeval(task_list)
709698

710699
# Run evaluation
711700
print("\nRunning evaluation...")

0 commit comments

Comments (0)