File tree Expand file tree Collapse file tree
custom_ops/gpu_ops/append_attn
Columns: original file line number | diff line number | diff line change
@@ -485,26 +485,8 @@ __global__ void multi_query_append_attention_warp1_4_kernel(
485485 const int *block_table_now = block_table + batch_id * max_block_num_per_seq;
486486
487487 const uint32_t q_len = seq_lens[batch_id];
488- if (q_len <= 0 ) {
489- return ;
490- }
488+ const uint32_t kv_len = seq_lens_kv[batch_id] + q_len;
491489
492- uint32_t kv_len = seq_lens_kv[batch_id];
493- if (ENABLE_PREFILL) {
494- kv_len += q_len;
495- if (kv_len <= 0 ) {
496- return ;
497- }
498- } else {
499- if (kv_len <= 0 ) {
500- return ;
501- }
502- kv_len += q_len;
503- }
504- const int seq_len_enc = seq_lens_encoder[batch_id];
505- if (seq_len_enc > 0 ) {
506- return ;
507- }
508490 const uint32_t num_chunks_this_seq = div_up (kv_len, chunk_size);
509491 if (chunk_idx >= num_chunks_this_seq) {
510492 return ;
You can’t perform that action at this time.
0 commit comments