We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent feea682 · commit 1f1d127 · Copy full SHA for 1f1d127
2 files changed
scripts/benchmarks/scenarios-moe.yaml
@@ -76,7 +76,7 @@ scenarios:
76
learning_rate: 5e-5
77
torch_dtype: bfloat16
78
gradient_accumulation_steps: null
79
- per_device_train_batch_size: 2
+ per_device_train_batch_size: 8
80
logging_steps: 1
81
packing: False
82
adam_epsilon: 1e-8
tox.ini
@@ -34,6 +34,9 @@ commands =
34
# some models need this for tokenizers
35
pip install protobuf
36
37
+ # for mamba-based models
38
+ pip install --no-build-isolation mamba_ssm[causal-conv1d]>=2.0.0
39
+
40
# install the plugins for test
41
# NOTE: when there are more plugins install here
42
python -m fms_acceleration.cli install -e {toxinidir}/plugins/accelerated-peft
0 commit comments