Skip to content

Commit fd44bb7

Browse files
zhoutianzi666 and “liuruian” authored
cpmmot (#7105)
Co-authored-by: “liuruian” <liuruian@baidu.com>
1 parent 5c5dc66 commit fd44bb7

1 file changed

Lines changed: 1 addition & 19 deletions

File tree

custom_ops/gpu_ops/append_attn/multiquery_attention_c16_impl.cuh

Lines changed: 1 addition & 19 deletions
Original file line number | Diff line number | Diff line change
@@ -485,26 +485,8 @@ __global__ void multi_query_append_attention_warp1_4_kernel(
485485
const int *block_table_now = block_table + batch_id * max_block_num_per_seq;
486486

487487
const uint32_t q_len = seq_lens[batch_id];
488-
if (q_len <= 0) {
489-
return;
490-
}
488+
const uint32_t kv_len = seq_lens_kv[batch_id] + q_len;
491489

492-
uint32_t kv_len = seq_lens_kv[batch_id];
493-
if (ENABLE_PREFILL) {
494-
kv_len += q_len;
495-
if (kv_len <= 0) {
496-
return;
497-
}
498-
} else {
499-
if (kv_len <= 0) {
500-
return;
501-
}
502-
kv_len += q_len;
503-
}
504-
const int seq_len_enc = seq_lens_encoder[batch_id];
505-
if (seq_len_enc > 0) {
506-
return;
507-
}
508490
const uint32_t num_chunks_this_seq = div_up(kv_len, chunk_size);
509491
if (chunk_idx >= num_chunks_this_seq) {
510492
return;

0 commit comments

Comments
 (0)