1 parent 1a0ed36 commit 7c9ff55
1 file changed
src/liger_kernel/ops/backends/_ascend/ops/multi_token_attention.py
```diff
@@ -1,10 +1,3 @@
-"""
-Fused causal masking + softmax/sparsemax Triton kernels for NPU.
-
-This implementation fuses causal masking with softmax and sparsemax forward and backward
-operations in single kernels to reduce memory traffic and improve performance.
-"""
-
 import torch
 import torch.nn.functional as F
 import triton
```
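For context, the removed docstring described Triton kernels that fuse causal masking with softmax and sparsemax to cut memory traffic. The sketch below is a minimal, unfused NumPy reference for the forward semantics only; it is not the deleted NPU kernels, and the function names `causal_softmax` and `sparsemax` are illustrative assumptions, not identifiers from this repository.

```python
import numpy as np

def causal_softmax(scores):
    # scores: (seq_len, seq_len) attention logits.
    # Mask out future positions (strict upper triangle), then softmax per row.
    n = scores.shape[-1]
    future = np.triu(np.ones((n, n), dtype=bool), k=1)
    masked = np.where(future, -np.inf, scores)
    shifted = masked - masked.max(axis=-1, keepdims=True)  # numerical stability
    e = np.exp(shifted)  # exp(-inf) -> 0, so masked entries vanish
    return e / e.sum(axis=-1, keepdims=True)

def sparsemax(z):
    # 1-D sparsemax (Euclidean projection onto the probability simplex):
    # produces exact zeros where softmax would give small positive mass.
    z_sorted = np.sort(z)[::-1]
    k = np.arange(1, z.size + 1)
    cssv = np.cumsum(z_sorted)
    support = 1 + k * z_sorted > cssv      # which sorted entries stay positive
    k_max = k[support][-1]
    tau = (cssv[support][-1] - 1) / k_max  # threshold subtracted from all logits
    return np.maximum(z - tau, 0.0)
```

A fused kernel computes the same result while applying the mask and the normalization in a single pass over the tile, avoiding a separate materialized mask tensor.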