Skip to content

Commit 3569d53

Browse files
committed
fix
1 parent 68954b0 commit 3569d53

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

lightllm/server/router/model_infer/mode_backend/base_backend.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1007,7 +1007,7 @@ def _flush_routing_to_kv_buffer(self, mem_indexes: torch.Tensor, microbatch_inde
1007 1007
if not mem_indexes.is_cuda:
1008 1008
mem_indexes = mem_indexes.cuda(non_blocking=True)
1009 1009
num_tokens = mem_indexes.shape[0]
1010-
_routing_mgr.g_routing_capture_manager.flush_to_kv_buffer(mem_indexes, num_tokens, microbatch_index)
1010+
_routing_mgr.g_routing_capture_manager.flush_to_routing_buffer(mem_indexes, num_tokens, microbatch_index)
1011 1011

1012 1012
def _dp_all_gather_prefill_and_decode_req_num(
1013 1013
self, prefill_reqs: List[InferReq], decode_reqs: List[InferReq]

0 commit comments

Comments
 (0)