Skip to content

Commit 1ed958f

Browse files
committed
Update project names in benchmark YAML files to 'benchmarking'; modify the process-killing function to exclude additional substrings.
1 parent 0ab6d6b commit 1ed958f

12 files changed

Lines changed: 15 additions & 13 deletions

File tree

ajet/utils/cleaner.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -20,7 +20,7 @@ def kill_ray_processes():
2020

2121
def fast_kill_by_keyword_bash(
2222
keyword: str,
23-
exclude_substrings=["alpha_auto_research", "vscode", "benchmark", "jupyter", "supervisord", "download_model", "opencode", "opencodex"],
23+
exclude_substrings=["alpha", "vscode", "benchmark", "jupyter", "supervisord", "download_model", "opencode", "opencodex", "pai-nohang"],
2424
grace_seconds: float = 1.0,
2525
):
2626
"""Use bash pipelines to kill processes matching keyword quickly.

scripts/deploy_model.py

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -15,14 +15,14 @@
1515
parser = argparse.ArgumentParser(description="deploy Hugging Face model")
1616
parser.add_argument(
1717
"--target",
18-
# default="/mnt/data_cpfs/model_cache/modelscope/hub/Qwen/Qwen/Qwen3-235B-A22B-Instruct-2507/",
19-
default="/mnt/data_cpfs/model_cache/modelscope/hub/Qwen/Qwen/Qwen2___5-14B-Instruct",
18+
default="/mnt/data_cpfs/model_cache/modelscope/hub/Qwen/Qwen/Qwen3-235B-A22B-Instruct-2507/",
19+
# default="/mnt/data_cpfs/model_cache/modelscope/hub/Qwen/Qwen/Qwen2___5-14B-Instruct",
2020
type=str,
2121
help="Model path",
2222
)
2323
parser.add_argument(
2424
"--alias",
25-
default="Qwen/Qwen2.5-14B-Instruct",
25+
default="Qwen/Qwen3-235B-A22B-Instruct-2507",
2626
type=str,
2727
help="Model alias",
2828
)

tests/bench/README.md

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -19,6 +19,8 @@ python -m pytest -s tests/bench/benchmark_countdown/execute_benchmark_countdown.
1919
python -m pytest -s tests/bench/benchmark_learn2ask/execute_benchmark_learn2ask.py
2020
python -m pytest -s tests/bench/benchmark_frozenlake/execute_benchmark_frozenlake.py
2121

22+
23+
别忘了 Benchmark API Key (don't forget to set the benchmark API key)
2224
VERL_PYTHON="./.venv/bin/python" python -m pytest -s tests/bench/benchmark_math/execute_benchmark_math.py::TestBenchmarkMath::test_01_begin_verl
2325
VERL_PYTHON="./.venv/bin/python" python -m pytest -s tests/bench/benchmark_appworld/execute_benchmark_appworld.py::TestBenchmarkAppworld::test_01_begin_verl
2426
VERL_PYTHON="./.venv/bin/python" python -m pytest -s tests/bench/benchmark_countdown/execute_benchmark_countdown.py::TestBenchmarkCountdown::test_01_begin_verl

tests/bench/benchmark_appworld/benchmark_appworld.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
# ------------------ 主要配置 ------------------
22
ajet:
3-
project_name: example_appworld
3+
project_name: benchmarking
44
experiment_name: "read_yaml_name"
55
task_judge:
66
# ✨✨✨✨ 编写并选择评价函数

tests/bench/benchmark_appworld/benchmark_appworld_2nodes.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
# ------------------ 主要配置 ------------------
22
ajet:
3-
project_name: example_appworld
3+
project_name: benchmarking
44
experiment_name: "read_yaml_name"
55
task_judge:
66
# ✨✨✨✨ 编写并选择评价函数

tests/bench/benchmark_appworld/benchmark_appworld_oai_sdk.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
# ------------------ 主要配置 ------------------
22
ajet:
3-
project_name: example_appworld
3+
project_name: benchmarking
44
task_judge:
55
# ✨✨✨✨ 编写并选择评价函数
66
judge_protocol: ajet.task_judge.env_service_as_judge->EnvServiceJudge

tests/bench/benchmark_appworldlora/benchmark_appworldlora.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
# ------------------ 主要配置 ------------------
22
ajet:
3-
project_name: example_appworld_lora
3+
project_name: benchmarking
44
experiment_name: "read_yaml_name"
55
task_judge:
66
# ✨✨✨✨ 编写并选择评价函数

tests/bench/benchmark_countdownlora/benchmark_countdownlora.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
# ------------------ main configuration ------------------
22
ajet:
3-
project_name: benchmarking_lora
3+
project_name: benchmarking
44

55
model:
66
# ✨✨✨✨ which model should be trained

tests/bench/benchmark_frozenlakelora/benchmark_frozenlakelora.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
# ------------------ main config ------------------
22
ajet:
3-
project_name: benchmarking_lora
3+
project_name: benchmarking
44

55
task_reader:
66
type: random_dummy # ✨✨✨✨ `env_service` or `dataset_file` or `huggingface_dat_repo` or `random_dummy`

tests/bench/benchmark_learn2ask/benchmark_learn2ask.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
# ------------------ 主要配置 ------------------
22
ajet:
3-
project_name: example_learn2ask_enhancedreward
3+
project_name: benchmarking
44
task_reader:
55
type: jsonl_dataset_file
66
jsonl_dataset_file:

0 commit comments

Comments
 (0)