Skip to content

Commit 1ea59e9

Browse files
committed
fix condition
Signed-off-by: Ceng23333 <441651826@qq.com>
1 parent 12244c2 commit 1ea59e9

1 file changed

Lines changed: 1 addition & 7 deletions

File tree

src/infinicore/ops/multi_head_attention_varlen/mha_varlen_flashattn.cc

Lines changed: 1 addition & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -152,11 +152,7 @@ void run(void *planned_meta) {
152 152
153 153   #if defined(ENABLE_METAX_API)
154 154   run_flashattn_varlen_metax(p);
155     - return;
156     - #endif
157     -
158     - // Original InfiniCore path (NVIDIA + xmake flash-attn-nvidia). MetaX is handled above.
159     - #if defined(ENABLE_NVIDIA_API)
    155 + #else
160 156   c10::cuda::CUDAStreamGuard guard(infinicore::adaptor::get_cuda_stream());
161 157
162 158   auto q = infinicore::adaptor::to_aten_tensor(p->q);
@@ -195,8 +191,6 @@ void run(void *planned_meta) {
195 191   0.0,
196 192   false,
197 193   std::nullopt);
198     - #else
199     - throw std::runtime_error("FlashAttention varlen: no supported GPU backend in this build");
200 194   #endif
201 195
202 196   #else

0 commit comments

Comments
 (0)