1 parent 8fdd559 commit 87928a4
src/liger_kernel/ops/backends/_ascend/ops/multi_token_attention.py
@@ -1,10 +1,3 @@
-"""
-Fused causal masking + softmax/sparsemax Triton kernels for NPU.
-
-This implementation fuses causal masking with softmax and sparsemax forward and backward
-operations in single kernels to reduce memory traffic and improve performance.
-"""
-
 import torch
 import torch.nn.functional as F
 import triton
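
The removed docstring describes fusing causal masking with softmax into a single kernel to cut memory traffic. For reference, here is a minimal sketch of the unfused computation such a kernel replaces, written in plain PyTorch; the function name and tensor shapes are illustrative assumptions, not taken from the actual module:

```python
import torch
import torch.nn.functional as F

def causal_masked_softmax(scores: torch.Tensor) -> torch.Tensor:
    """Apply a causal (lower-triangular) mask, then softmax over the last dim.

    scores: (..., seq_len, seq_len) attention logits. Hypothetical reference
    implementation; a fused kernel computes the same result in one pass.
    """
    seq_len = scores.size(-1)
    # Positions above the diagonal attend to "future" tokens; mask them out
    # with -inf so softmax assigns them zero probability.
    mask = torch.triu(
        torch.ones(seq_len, seq_len, dtype=torch.bool, device=scores.device),
        diagonal=1,
    )
    masked = scores.masked_fill(mask, float("-inf"))
    return F.softmax(masked, dim=-1)

# Example: a 1-head, 4-token score matrix.
probs = causal_masked_softmax(torch.randn(1, 4, 4))
```

Materializing `masked` and `probs` as separate tensors is exactly the extra memory traffic the fused Triton kernel avoids.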