We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent c003616, commit 99178ef. Copy full SHA for 99178ef.
1 file changed
main_training_mamba.py
@@ -114,7 +114,8 @@ def main(**kwargs):
114
params_without_decay = []
115
for name, param in model.named_parameters():
116
print(f'{name=}')
117
- if 'A_log' in name or 'D' in name or 'dt_bias' in name:
+ suff = name.split('.')[-1]
118
+ if 'A_log' in suff or 'D' in suff or 'dt_bias' in suff:
119
params_without_decay.append(param)
120
else:
121
params_with_decay.append(param)
0 commit comments