Skip to content

Commit d0c0f51

Browse files
committed
Fix skip softmax defaults
1 parent 52e662d commit d0c0f51

1 file changed

Lines changed: 2 additions & 2 deletions

File tree

  • modelopt/torch/sparsity/attention_sparsity

modelopt/torch/sparsity/attention_sparsity/config.py

Lines changed: 2 additions & 2 deletions
| Original file line number | Diff line number | Diff line change |
| --- | --- | --- |
|  |  | `@@ -399,9 +399,9 @@ class FlashSkipSoftmaxConfig(SparseAttentionConfig):` |
| 399 | 399 | `SKIP_SOFTMAX_CALIB = {` |
| 400 | 400 | `"sparse_cfg": {` |
| 401 | 401 | `"calibration": {` |
| 402 |  | `- "target_sparse_ratio": {"prefill": 0.9, "decode": 0.9},` |
|  | 402 | `+ "target_sparse_ratio": {"prefill": 0.5, "decode": 0.5},` |
| 403 | 403 | `"samples": 64,` |
| 404 |  | `- "max_seqlen": 65536,` |
|  | 404 | `+ "max_seqlen": 16384,` |
| 405 | 405 | `"chunk_size": 4096,` |
| 406 | 406 | `},` |
| 407 | 407 | `"*attn*": {` |

0 commit comments

Comments
 (0)