Skip to content

Commit 644ec6e

Browse files
committed
Minor fix
1 parent cd50af2 commit 644ec6e

1 file changed

Lines changed: 1 addition & 1 deletion

File tree

examples/models/gemma4_31b/export.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -162,7 +162,7 @@ def _export_cuda(model: Gemma4_31B, config: Gemma4_31BConfig, output_dir: str) -
162162

163163
# Prefill (T>=2): shim does dequant+cuBLAS (optimal for large M).
164164
max_prefill = min(config.max_seq_len - 1, config.sliding_window * 2)
165-
seq_dim = Dim("seq_len", min=2, max=max_prefill)
165+
seq_dim = Dim("seq_len", min=5, max=max_prefill)
166166
print(f"Exporting prefill (T in [2, {max_prefill}])...")
167167
with torch.no_grad():
168168
prefill_ep = export(

0 commit comments

Comments
 (0)