We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 00deb30 commit 09a501a — Copy full SHA for 09a501a
1 file changed
bionemo-recipes/recipes/codonfm_native_te/slurm/1b.sh
@@ -121,6 +121,11 @@ echo "Job ID: ${SLURM_JOB_ID}"
121
echo "Nodes: ${SLURM_JOB_NUM_NODES}"
122
echo "========================================="
123
124
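+# cuDNN fused-attention sub-backend 1 runs out of memory (OOM) on Blackwell (sm_103) with THD-format inputs plus padding (TE 2.12 / cuDNN 9.19); when sequence packing is enabled, disable fused attention to force flash-attn varlen.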
125
+if [ "${USE_SEQUENCE_PACKING}" = "True" ]; then
126
+ export NVTE_FUSED_ATTN=0
127
+fi
128
+
129
# Pick training script based on distributed strategy.
130
case "${DIST_STRATEGY}" in
131
fsdp)
0 commit comments