Skip to content

Commit 1d889b8

Browse files
committed
Clean up comments, amend lighteval
1 parent 34e3b2a commit 1d889b8

3 files changed

Lines changed: 3 additions & 6 deletions

File tree

benchmarks/benchmark_lib.sh

Lines changed: 2 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -160,7 +160,6 @@ run_benchmark_serving() {
160160

161161
_install_lm_eval_deps() {
162162
python3 -m pip install -q --no-cache-dir "lm-eval[api]" || true
163-
# Temporary: workaround issue by using main
164163
python3 -m pip install -q --no-cache-dir --no-deps \
165164
"git+https://github.com/EleutherAI/lm-evaluation-harness.git@b315ef3b05176acc9732bb7fdec116abe1ecc476" || true
166165
}
@@ -356,7 +355,7 @@ META
356355
# ------------------------------
357356

358357
_install_lighteval_deps() {
359-
python3 -m pip install -q --no-cache-dir "lighteval[api]" "litellm" || true
358+
python3 -m pip install -q --no-cache-dir "lighteval==0.13.0" "litellm==1.80.7" || true
360359
}
361360

362361
# Patch lighteval's LiteLLMClient to handle reasoning content and Python name mangling
@@ -615,7 +614,7 @@ run_lighteval_eval() {
615614
local base_url="http://0.0.0.0:${port}/v1"
616615
export OPENAI_API_KEY="${OPENAI_API_KEY:-EMPTY}"
617616

618-
local MODEL_ARGS="model_name=${lite_model},base_url=${base_url},api_key=${OPENAI_API_KEY},generation_parameters={temperature:0.0,top_p=1,max_new_tokens:2048},concurrent_requests=${concurrent_requests}"
617+
local MODEL_ARGS="model_name=${lite_model},base_url=${base_url},api_key=${OPENAI_API_KEY},generation_parameters={temperature:0.0,top_p:1,max_new_tokens:2048},concurrent_requests=${concurrent_requests}"
619618
local TASK_SPEC="${task}|${num_fewshot}"
620619

621620
# Respect absolute paths (e.g., /tmp/eval_out); otherwise write under /workspace

benchmarks/gptoss_fp4_h200_slurm.sh

Lines changed: 0 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -39,8 +39,6 @@ export TORCH_CUDA_ARCH_LIST="9.0"
3939
PORT=$(( 8888 + $PORT_OFFSET ))
4040
MODEL_NAME=${MODEL##*/}
4141

42-
export TORCH_CUDA_ARCH_LIST="9.0"
43-
4442
PYTHONNOUSERSITE=1 vllm serve $MODEL --host 0.0.0.0 --port $PORT \
4543
--config config.yaml \
4644
--gpu-memory-utilization 0.9 \

utils/evals/custom_gsm8k.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -13,7 +13,7 @@
1313
evaluation_splits=["test"],
1414
few_shots_split=None,
1515
few_shots_select="random_sampling_from_train",
16-
generation_size=768, # raised this from 256
16+
generation_size=1024, # raised this from 256
1717
metrics=[Metrics.expr_gold_metric],
1818
stop_sequence=None, # avoid early stop on "Question:"
1919
version=0,

0 commit comments

Comments
 (0)