We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent e24b768 commit ef2a995 · Copy full SHA for ef2a995
1 file changed
scripts/benchmarks/scenarios-moe.yaml
@@ -76,7 +76,7 @@ scenarios:
76
learning_rate: 5e-5
77
torch_dtype: bfloat16
78
gradient_accumulation_steps: null
79
- per_device_train_batch_size: 2
+ per_device_train_batch_size: 4
80
logging_steps: 1
81
packing: False
82
adam_epsilon: 1e-8
0 commit comments