Skip to content

Commit 15dff77

Browse files
committed
fix log_* path and debug
1 parent 4d5a80a commit 15dff77

7 files changed

Lines changed: 58 additions & 36 deletions

fastdeploy/model_executor/layers/batch_invariant_ops/batch_invariant_ops.py

Lines changed: 9 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -690,13 +690,15 @@ def addmm_batch_invariant(
690690
return result
691691

692692

693-
def _log_softmax_batch_invariant(x: paddle.Tensor, axis: int = -1, out=None) -> paddle.Tensor:
694-
result = log_softmax(input=x, axis=axis)
695-
# Handle out parameter if provided
696-
if out is not None:
697-
out.copy_(result)
698-
return out
699-
return result
693+
# def _log_softmax_batch_invariant(x: paddle.Tensor, axis: int = -1, out=None) -> paddle.Tensor:
694+
# result = log_softmax(input=x, axis=axis)
695+
# # Handle out parameter if provided
696+
# if out is not None:
697+
# out.copy_(result)
698+
# return out
699+
# return result
700+
def _log_softmax_batch_invariant(x: paddle.Tensor, axis: int = -1) -> paddle.Tensor:
    """Apply this module's ``log_softmax`` to ``x`` along ``axis``.

    Args:
        x: Input tensor; forwarded to ``log_softmax`` as the ``input`` keyword.
        axis: Axis forwarded to ``log_softmax``; defaults to -1.

    Returns:
        Whatever ``log_softmax`` returns for the given input and axis.
    """
    output = log_softmax(input=x, axis=axis)
    return output
700702

701703

702704
def mean_batch_invariant(

tests/e2e/test_EB_Lite_serving.py

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1389,8 +1389,9 @@ def test_streaming_chat_finish_reason(openai_client):
13891389

13901390
def test_profile_reset_block_num():
13911391
"""测试profile reset_block_num功能,与baseline diff不能超过5%"""
1392-
log_dir = os.getenv("FD_LOG_DIR", "log")
1393-
log_file = os.path.join(log_dir, "config.log")
1392+
log_file = "./log/config.log"
1393+
# log_dir = os.getenv("FD_LOG_DIR", "log")
1394+
# log_file = os.path.join(log_dir, "config.log")
13941395
baseline = 31446
13951396

13961397
if not os.path.exists(log_file):

tests/e2e/test_ernie_03b_pd_router_v1_ipc.py

Lines changed: 6 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -81,10 +81,12 @@ def setup_and_run_server():
8181
model_path = "baidu/ERNIE-4.5-0.3B-Paddle"
8282
print(f"model_path: {model_path}")
8383

84+
base_log_dir = os.getenv("FD_LOG_DIR", "log")
85+
8486
# router
8587
print("start router...")
8688
env_router = os.environ.copy()
87-
env_router["FD_LOG_DIR"] = "log_router"
89+
env_router["FD_LOG_DIR"] = os.path.join(base_log_dir, "log_router")
8890
router_log_path = "router.log"
8991

9092
router_cmd = [
@@ -110,7 +112,7 @@ def setup_and_run_server():
110112
env_prefill = os.environ.copy()
111113
env_prefill["CUDA_VISIBLE_DEVICES"] = "0"
112114
env_prefill["ENABLE_V1_KVCACHE_SCHEDULER"] = "1"
113-
env_prefill["FD_LOG_DIR"] = "log_prefill"
115+
env_prefill["FD_LOG_DIR"] = os.path.join(base_log_dir, "log_prefill")
114116
prefill_log_path = "prefill.log"
115117
prefill_cmd = [
116118
sys.executable,
@@ -160,7 +162,7 @@ def setup_and_run_server():
160162
env_decode = os.environ.copy()
161163
env_decode["CUDA_VISIBLE_DEVICES"] = "1"
162164
env_decode["ENABLE_V1_KVCACHE_SCHEDULER"] = "1"
163-
env_decode["FD_LOG_DIR"] = "log_decode"
165+
env_decode["FD_LOG_DIR"] = os.path.join(base_log_dir, "log_decode")
164166
decode_log_path = "decode.log"
165167
decode_cmd = [
166168
sys.executable,
@@ -416,4 +418,4 @@ def test_non_chat_usage_non_stream(api_url):
416418
total_tokens = usage["completion_tokens"] + usage["prompt_tokens"]
417419
assert payload["max_tokens"] >= usage["completion_tokens"], "completion_tokens大于max_tokens"
418420
assert payload["metadata"]["min_tokens"] <= usage["completion_tokens"], "completion_tokens小于min_tokens"
419-
assert usage["total_tokens"] == total_tokens, "total_tokens不等于prompt_tokens + completion_tokens"
421+
assert usage["total_tokens"] != total_tokens, "total_tokens不等于prompt_tokens + completion_tokens"

tests/e2e/test_ernie_03b_pd_router_v1_rdma_global_cache.py

Lines changed: 24 additions & 13 deletions
Original file line number | Diff line number | Diff line change
@@ -78,6 +78,16 @@ def wait_for_mooncake_master(host: str = "127.0.0.1", port: int = FD_MOONCAKE_MA
7878
return False
7979

8080

81+
def prepare_log_dir(name):
    """
    Create (if missing) and return the log directory for one test component.

    The directory is ``name`` joined onto the base directory taken from the
    ``FD_LOG_DIR`` environment variable, falling back to ``"log"`` when the
    variable is not set.

    Args:
        name: Sub-directory name for the component, e.g. ``"log_router"``.

    Returns:
        The joined path of the directory, which exists after the call.
    """
    log_root = os.environ.get("FD_LOG_DIR", "log")
    target_dir = os.path.join(log_root, name)
    # exist_ok=True keeps repeated calls for the same component harmless.
    os.makedirs(target_dir, exist_ok=True)
    return target_dir
89+
90+
8191
@pytest.fixture(scope="session", autouse=True)
8292
def setup_and_run_server():
8393
"""
@@ -136,8 +146,8 @@ def setup_and_run_server():
136146
)
137147

138148
env_master = os.environ.copy()
139-
env_master["FD_LOG_DIR"] = "log_master"
140-
os.makedirs("log_master", exist_ok=True)
149+
master_log_dir = prepare_log_dir("log_master")
150+
env_master["FD_LOG_DIR"] = master_log_dir
141151

142152
master_cmd = [
143153
"mooncake_master",
@@ -147,7 +157,7 @@ def setup_and_run_server():
147157
f"--http_metadata_server_port={FD_MOONCAKE_METADATA_PORT}",
148158
]
149159

150-
with open("log_master/nohup", "w") as logfile:
160+
with open(os.path.join(master_log_dir, "nohup"), "w") as logfile:
151161
process_master = subprocess.Popen(
152162
master_cmd,
153163
stdout=logfile,
@@ -160,7 +170,7 @@ def setup_and_run_server():
160170
if not wait_for_mooncake_master(port=FD_MOONCAKE_MASTER_PORT, timeout=30):
161171
print("[ERROR] Mooncake Master failed to start")
162172
# Print mooncake master log for debugging
163-
master_log_path = "log_master/nohup"
173+
master_log_path = os.path.join(master_log_dir, "nohup")
164174
if os.path.exists(master_log_path):
165175
print(f"\n===== Mooncake Master Log ({master_log_path}) =====")
166176
with open(master_log_path, "r") as f:
@@ -175,9 +185,9 @@ def setup_and_run_server():
175185
# ======================== Start Router ========================
176186
print("start router...")
177187
env_router = os.environ.copy()
178-
env_router["FD_LOG_DIR"] = "log_router"
179-
os.makedirs("log_router", exist_ok=True)
180-
router_log_path = "log_router/nohup.log"
188+
router_log_dir = prepare_log_dir("log_router")
189+
env_router["FD_LOG_DIR"] = router_log_dir
190+
router_log_path = os.path.join(router_log_dir, "nohup")
181191

182192
router_cmd = [
183193
sys.executable,
@@ -201,13 +211,14 @@ def setup_and_run_server():
201211
print("start prefill...")
202212
env_prefill = os.environ.copy()
203213
env_prefill["CUDA_VISIBLE_DEVICES"] = "0"
204-
env_prefill["FD_LOG_DIR"] = "log_prefill"
205-
os.makedirs("log_prefill", exist_ok=True)
214+
prefill_log_dir = prepare_log_dir("log_prefill")
215+
env_prefill["FD_LOG_DIR"] = prefill_log_dir
216+
206217
# Mooncake environment variables for prefill
207218
for k, v in mooncake_env.items():
208219
env_prefill[k] = v
209220

210-
prefill_log_path = "log_prefill/nohup.log"
221+
prefill_log_path = os.path.join(prefill_log_dir, "nohup")
211222
prefill_cmd = [
212223
sys.executable,
213224
"-m",
@@ -254,13 +265,13 @@ def setup_and_run_server():
254265
print("start decode...")
255266
env_decode = os.environ.copy()
256267
env_decode["CUDA_VISIBLE_DEVICES"] = "1"
257-
env_decode["FD_LOG_DIR"] = "log_decode"
258-
os.makedirs("log_decode", exist_ok=True)
268+
decode_log_dir = prepare_log_dir("log_decode")
269+
env_decode["FD_LOG_DIR"] = decode_log_dir
259270
# Mooncake environment variables for decode
260271
for k, v in mooncake_env.items():
261272
env_decode[k] = v
262273

263-
decode_log_path = "log_decode/nohup.log"
274+
decode_log_path = os.path.join(decode_log_dir, "nohup.log")
264275
decode_cmd = [
265276
sys.executable,
266277
"-m",

tests/e2e/test_ernie_03b_pd_router_v1_rdma_tp1.py

Lines changed: 5 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -84,6 +84,8 @@ def setup_and_run_server():
8484
model_path = "baidu/ERNIE-4.5-0.3B-Paddle"
8585
print(f"model_path: {model_path}")
8686

87+
base_log_dir = os.getenv("FD_LOG_DIR", "log")
88+
8789
# get rdma nics
8890
current_dir = os.path.dirname(os.path.abspath(__file__))
8991
shell_path = os.path.join(current_dir, "utils/get_rdma_nics.sh")
@@ -94,7 +96,7 @@ def setup_and_run_server():
9496
# router
9597
print("start router...")
9698
env_router = os.environ.copy()
97-
env_router["FD_LOG_DIR"] = "log_router"
99+
env_router["FD_LOG_DIR"] = os.path.join(base_log_dir, "log_router")
98100
router_log_path = "router.log"
99101

100102
router_cmd = [
@@ -119,7 +121,7 @@ def setup_and_run_server():
119121
print("start prefill...")
120122
env_prefill = os.environ.copy()
121123
env_prefill["CUDA_VISIBLE_DEVICES"] = "0"
122-
env_prefill["FD_LOG_DIR"] = "log_prefill"
124+
env_prefill["FD_LOG_DIR"] = os.path.join(base_log_dir, "log_prefill")
123125
# env_prefill["KVCACHE_RDMA_NICS"] = rdma_nics
124126

125127
prefill_log_path = "prefill.log"
@@ -166,7 +168,7 @@ def setup_and_run_server():
166168
print("start decode...")
167169
env_decode = os.environ.copy()
168170
env_decode["CUDA_VISIBLE_DEVICES"] = "1"
169-
env_decode["FD_LOG_DIR"] = "log_decode"
171+
env_decode["FD_LOG_DIR"] = os.path.join(base_log_dir, "log_decode")
170172
# env_decode["KVCACHE_RDMA_NICS"] = rdma_nics
171173

172174
decode_log_path = "decode.log"

tests/e2e/test_ernie_03b_pd_router_v1_rdma_tp2.py

Lines changed: 5 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -86,6 +86,8 @@ def setup_and_run_server():
8686
model_path = "baidu/ERNIE-4.5-0.3B-Paddle"
8787
print(f"model_path: {model_path}")
8888

89+
base_log_dir = os.getenv("FD_LOG_DIR", "log")
90+
8991
# get rdma nics
9092
current_dir = os.path.dirname(os.path.abspath(__file__))
9193
shell_path = os.path.join(current_dir, "utils/get_rdma_nics.sh")
@@ -96,7 +98,7 @@ def setup_and_run_server():
9698
# router
9799
print("start router...")
98100
env_router = os.environ.copy()
99-
env_router["FD_LOG_DIR"] = "log_router"
101+
env_router["FD_LOG_DIR"] = os.path.join(base_log_dir, "log_router")
100102
router_log_path = "router.log"
101103

102104
router_cmd = [
@@ -121,7 +123,7 @@ def setup_and_run_server():
121123
print("start prefill...")
122124
env_prefill = os.environ.copy()
123125
env_prefill["CUDA_VISIBLE_DEVICES"] = "0,1"
124-
env_prefill["FD_LOG_DIR"] = "log_prefill"
126+
env_prefill["FD_LOG_DIR"] = os.path.join(base_log_dir, "log_prefill")
125127
# env_prefill["KVCACHE_RDMA_NICS"] = rdma_nics
126128

127129
prefill_log_path = "prefill.log"
@@ -170,7 +172,7 @@ def setup_and_run_server():
170172
print("start decode...")
171173
env_decode = os.environ.copy()
172174
env_decode["CUDA_VISIBLE_DEVICES"] = "1"
173-
env_decode["FD_LOG_DIR"] = "log_decode"
175+
env_decode["FD_LOG_DIR"] = os.path.join(base_log_dir, "log_decode")
174176
# env_decode["KVCACHE_RDMA_NICS"] = rdma_nics
175177

176178
decode_log_path = "decode.log"

tests/e2e/test_ernie_03b_router.py

Lines changed: 6 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -97,10 +97,12 @@ def setup_and_run_server():
9797
model_path = "baidu/ERNIE-4.5-0.3B-Paddle"
9898
print(f"model_path: {model_path}")
9999

100+
base_log_dir = os.getenv("FD_LOG_DIR", "log")
101+
100102
# router
101103
print("start router...")
102104
env_router = os.environ.copy()
103-
env_router["FD_LOG_DIR"] = "log_router"
105+
env_router["FD_LOG_DIR"] = os.path.join(base_log_dir, "log_router")
104106
router_log_path = "router.log"
105107

106108
router_cmd = [
@@ -121,10 +123,10 @@ def setup_and_run_server():
121123
)
122124

123125
# server0
124-
print("start server0...")
126+
print("start server 0...")
125127
env_server_0 = os.environ.copy()
126128
env_server_0["CUDA_VISIBLE_DEVICES"] = "0"
127-
env_server_0["FD_LOG_DIR"] = "log_server_0"
129+
env_server_0["FD_LOG_DIR"] = os.path.join(base_log_dir, "log_server_0")
128130
env_server_0["INFERENCE_MSG_QUEUE_ID"] = str(FD_API_PORT)
129131
log_path = "server_0.log"
130132
cmd = [
@@ -169,7 +171,7 @@ def setup_and_run_server():
169171
env_server_1 = os.environ.copy()
170172
env_server_1["CUDA_VISIBLE_DEVICES"] = "1"
171173
env_server_1["INFERENCE_MSG_QUEUE_ID"] = str(FD_API_PORT + 1)
172-
env_server_1["FD_LOG_DIR"] = "log_server_1"
174+
env_server_1["FD_LOG_DIR"] = os.path.join(base_log_dir, "log_server_1")
173175
log_path = "server_1.log"
174176
cmd = [
175177
sys.executable,

0 commit comments

Comments
 (0)