Skip to content

Commit 1fa7260

Browse files
committed
Update default fp32 residual
Signed-off-by: John St. John <jstjohn@nvidia.com>
1 parent 5411e09 commit 1fa7260

2 files changed

Lines changed: 1 addition & 4 deletions

File tree

bionemo-recipes/recipes/evo2_megatron/src/bionemo/evo2/models/evo2_provider.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -306,7 +306,7 @@ class HyenaModelProvider(TransformerConfig, ModelProviderMixin[MCoreHyenaModel])
306306
apply_rope_fusion: bool = True
307307
make_vocab_size_divisible_by: int = 128
308308
gated_linear_unit: bool = True
309-
fp32_residual_connection: bool = True
309+
fp32_residual_connection: bool = False
310310
normalization: str = "RMSNorm"
311311
add_bias_linear: bool = False
312312
hidden_dropout: float = 0.0

bionemo-recipes/recipes/evo2_megatron/src/bionemo/evo2/run/predict.py

Lines changed: 0 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -1046,9 +1046,6 @@ def predict(
10461046
# Set the model to use fewer layers and skip post-processing (output heads).
10471047
model_provider.num_layers = target_num_layers
10481048
model_provider.post_process = False
1049-
if hasattr(model_provider, "fp32_residual_connection"):
1050-
model_provider.fp32_residual_connection = False
1051-
10521049
# Also truncate the hybrid_override_pattern if it exists, since it must match num_layers
10531050
if hasattr(model_provider, "hybrid_override_pattern") and model_provider.hybrid_override_pattern is not None:
10541051
original_pattern = model_provider.hybrid_override_pattern

0 commit comments

Comments
 (0)