Skip to content

Commit 3e1380c

Browse files
author
Weichao Luo
committed
fix lint.
1 parent 643bca5 commit 3e1380c

7 files changed

Lines changed: 17 additions & 23 deletions

File tree

lightllm/server/router/model_infer/mode_backend/base_backend.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -524,7 +524,7 @@ def _post_handle(
524524
eos_ids=self.eos_id,
525525
extra_post_req_handle_func=extra_post_req_handle_func,
526526
is_master_in_dp=self.is_master_in_dp,
527-
call_post_handle_for_chunk=call_post_handle_for_chunk
527+
call_post_handle_for_chunk=call_post_handle_for_chunk,
528528
)
529529

530530
g_infer_context.req_manager.req_sampling_params_manager.update_reqs_token_counter(

lightllm/server/router/model_infer/mode_backend/chunked_prefill/impl.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -138,7 +138,7 @@ def prefill_normal(
138138
next_token_logprobs=next_token_logprobs_cpu,
139139
run_reqs_update_packs=update_packs,
140140
extra_post_req_handle_func=self.extra_post_req_handle_func,
141-
call_post_handle_for_chunk=self.call_post_handle_for_chunk
141+
call_post_handle_for_chunk=self.call_post_handle_for_chunk,
142142
)
143143
# 第四阶段
144144
event_pack.notify_pre_post_handle()
@@ -185,7 +185,7 @@ def decode_normal(
185185
next_token_ids=next_token_ids_cpu,
186186
next_token_logprobs=next_token_logprobs_cpu,
187187
run_reqs_update_packs=update_packs,
188-
extra_post_req_handle_func=self.extra_post_req_handle_func
188+
extra_post_req_handle_func=self.extra_post_req_handle_func,
189189
)
190190

191191
# 第四阶段
@@ -351,7 +351,7 @@ def decode_mtp(
351351
next_token_ids=next_token_ids_cpu[select_mask],
352352
next_token_logprobs=next_token_logprobs_cpu[select_mask],
353353
run_reqs_update_packs=update_packs,
354-
extra_post_req_handle_func=self.extra_post_req_handle_func
354+
extra_post_req_handle_func=self.extra_post_req_handle_func,
355355
)
356356
if len(need_free_mem_indexes) > 0:
357357
g_infer_state_lock.acquire()

lightllm/server/router/model_infer/mode_backend/dp_backend/impl.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -160,7 +160,7 @@ def prefill_normal(
160160
next_token_logprobs=next_token_logprobs_cpu,
161161
run_reqs_update_packs=update_packs,
162162
extra_post_req_handle_func=self.extra_post_req_handle_func,
163-
call_post_handle_for_chunk=self.call_post_handle_for_chunk
163+
call_post_handle_for_chunk=self.call_post_handle_for_chunk,
164164
)
165165
# 第四阶段
166166
event_pack.notify_pre_post_handle()
@@ -291,7 +291,7 @@ def prefill_overlap(self, event_pack: OverlapEventPack, prefill_reqs: List[Infer
291291
next_token_logprobs=next_token_logprobs_cpu,
292292
run_reqs_update_packs=update_packs,
293293
extra_post_req_handle_func=self.extra_post_req_handle_func,
294-
call_post_handle_for_chunk=self.call_post_handle_for_chunk
294+
call_post_handle_for_chunk=self.call_post_handle_for_chunk,
295295
)
296296
# 第四阶段
297297
event_pack.notify_pre_post_handle()
@@ -664,7 +664,7 @@ def prefill_overlap_mtp(self, event_pack: OverlapEventPack, prefill_reqs: List[I
664664
next_token_logprobs=next_token_logprobs_cpu,
665665
run_reqs_update_packs=update_packs,
666666
extra_post_req_handle_func=self.extra_post_req_handle_func,
667-
call_post_handle_for_chunk=self.call_post_handle_for_chunk
667+
call_post_handle_for_chunk=self.call_post_handle_for_chunk,
668668
)
669669
event_pack.notify_pre_post_handle()
670670
else:

lightllm/server/router/model_infer/mode_backend/pd_nixl/impl_for_pd_base.py

Lines changed: 7 additions & 10 deletions
Original file line number | Diff line number | Diff line change
@@ -190,7 +190,6 @@ def _handle_chunked_transfer(self, req: InferReq, next_token_id: int = None, nex
190190
transfer_state.next_token_logprob = next_token_logprob
191191

192192
async def _transfer_kv_to_remote_paged_batch(self, transfer_reqs: List[KVMoveRequest]):
193-
start = time.time()
194193
requests_by_agents = dict()
195194
transfer_pages = self.page_scheduer.borrow(len(transfer_reqs))
196195
# first copy the kv to transfer pages & build notification
@@ -216,7 +215,9 @@ async def _transfer_kv_to_remote_paged_batch(self, transfer_reqs: List[KVMoveReq
216215
receive_page = transfer_state.free_page_ids.pop(0)
217216
requests_by_agents[decode_id][0].append(page_index)
218217
requests_by_agents[decode_id][1].append(receive_page)
219-
is_last = transfer_state.is_finished and start_kv_len + trans_kv_len == transfer_state.current_kv_len
218+
is_last = (
219+
transfer_state.is_finished and start_kv_len + trans_kv_len == transfer_state.current_kv_len
220+
)
220221

221222
requests_by_agents[decode_id][2].append(
222223
RemotePrefillStatus(
@@ -241,8 +242,6 @@ async def _transfer_kv_to_remote_paged_batch(self, transfer_reqs: List[KVMoveReq
241242
# transfer
242243
self.nixl_agent.write_blocks_paged(decode_id, transfer_pages, receive_pages, notifications)
243244

244-
# logger.info(f"transfer kv to remote paged batch: {len(transfer_reqs)} " f"took: {time.time() - start} seconds")
245-
246245
async def _handle_transfer_loop(self):
247246
while True:
248247
free_transfer_pages = self.page_scheduer.current_size()
@@ -424,8 +423,7 @@ def _post_remote_prefill(self, req: InferReq, success: bool = True):
424423
assert group_req_id in self.request_to_first_token, f"{group_req_id} not in request_to_first_token dict"
425424
token_id, token_logprob = self.request_to_first_token.pop(group_req_id)
426425

427-
428-
#(TODO) figure out how to update req_to_next_token_ids
426+
# (TODO) figure out how to update req_to_next_token_ids
429427
# req.cur_output_len += 1
430428

431429
# pack = InferReqUpdatePack(req, req.cur_output_len)
@@ -439,9 +437,7 @@ def _post_remote_prefill(self, req: InferReq, success: bool = True):
439437
# )
440438
return token_id
441439

442-
def _decode_filter_reqs(
443-
self, prefill_reqs: List[InferReq], decode_reqs: List[InferReq]
444-
):
440+
def _decode_filter_reqs(self, prefill_reqs: List[InferReq], decode_reqs: List[InferReq]):
445441
new_prefill_reqs: List[InferReq] = []
446442
remote_prefill_reqs: List[InferReq] = []
447443
failed_prefill_reqs: List[InferReq] = []
@@ -534,5 +530,6 @@ def _prefill_abort_remote(self, req_objs: List[InferReq]):
534530
class PDNIXLBackendBaseChunked(PDNIXLBackendBase, ChunkedPrefillBackend):
535531
pass
536532

533+
537534
class PDNIXLBackendBaseDPChunked(PDNIXLBackendBase, DPChunkedPrefillBackend):
538-
pass
535+
pass

lightllm/server/router/model_infer/mode_backend/pd_nixl/impl_for_pd_decode.py

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -73,15 +73,16 @@ def _pre_handle_finished_reqs(self, finished_reqs: List[InferReq]):
7373

7474
finished_reqs = new_finished_reqs
7575

76-
7776
def _get_classed_reqs(
7877
self,
7978
req_ids: List[int] = None,
8079
no_decode: bool = False,
8180
strict_prefill: bool = False,
8281
recover_paused: bool = False,
8382
):
84-
prefill_reqs, decode_reqs = super(type(self), self)._get_classed_reqs(req_ids, no_decode, strict_prefill, recover_paused)
83+
prefill_reqs, decode_reqs = super(type(self), self)._get_classed_reqs(
84+
req_ids, no_decode, strict_prefill, recover_paused
85+
)
8586
prefill_reqs, decode_reqs, failed_reqs, _ = self._decode_filter_reqs(prefill_reqs, decode_reqs)
8687

8788
if failed_reqs:

lightllm/server/router/model_infer/mode_backend/pd_nixl/impl_for_pd_decode_dp.py

Lines changed: 0 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,6 @@
11
from types import MethodType
22
import torch.multiprocessing as mp
33
from lightllm.utils.log_utils import init_logger
4-
from lightllm.utils.envs_utils import get_env_start_args
54

65
from .impl_for_pd_base import PDNIXLBackendBaseDPChunked
76
from .impl_for_pd_decode import PDNIXLBackendForDecodeNode
@@ -20,4 +19,3 @@ def __init__(self, prefill_task_queue: mp.Queue, prefill_done_queue: mp.Queue, n
2019
self._trigger_remote_prefill = MethodType(PDNIXLBackendForDecodeNode._trigger_remote_prefill, self)
2120
self._pre_handle_finished_reqs = MethodType(PDNIXLBackendForDecodeNode._pre_handle_finished_reqs, self)
2221
self._get_classed_reqs = MethodType(PDNIXLBackendForDecodeNode._get_classed_reqs, self)
23-

lightllm/server/router/model_infer/mode_backend/pd_nixl/impl_for_pd_prefill_dp.py

Lines changed: 0 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -2,8 +2,6 @@
22
import torch.multiprocessing as mp
33
from lightllm.server.router.model_infer.infer_batch import g_infer_context
44
from lightllm.utils.log_utils import init_logger
5-
from lightllm.utils.envs_utils import get_env_start_args
6-
# from lightllm.server.router.model_infer.mode_backend.dp_backend.impl import DPChunkedPrefillBackend
75

86
from .impl_for_pd_base import PDNIXLBackendBaseDPChunked
97
from .impl_for_pd_prefill import PDNIXLBackendForPrefillNode

0 commit comments

Comments
 (0)