Skip to content

Commit 507e464

Browse files
committed
Reset buffer size of R3
1 parent 8c4f5a6 commit 507e464

1 file changed

Lines changed: 2 additions & 3 deletions

File tree

fastdeploy/worker/input_batch.py

Lines changed: 2 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -189,9 +189,8 @@ def init_share_inputs(self):
189  189    self.cu_seqlens_k = paddle.full([max_num_seqs + 1], 0, dtype="int32")
190  190
191  191    # Initialize addressing buffers
192       - _max_batched_tokens = self.scheduler_config.max_num_batched_tokens
193       - self.position_ids_buffer = paddle.zeros([_max_batched_tokens], dtype=paddle.int32)
194       - self.slot_mapping_buffer = paddle.zeros([_max_batched_tokens], dtype=paddle.int64)
     192  + self.position_ids_buffer = paddle.zeros([self.max_chunk_tokens], dtype=paddle.int32)
     193  + self.slot_mapping_buffer = paddle.zeros([self.max_chunk_tokens], dtype=paddle.int64)
195  194
196  195    # Declare AttentionBackend buffers
197  196    self.decoder_batch_ids = None

0 commit comments

Comments
 (0)