We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 3b4692d · commit e24b768 · Copy full SHA for e24b768
1 file changed
scripts/benchmarks/scenarios-moe.yaml
@@ -76,7 +76,7 @@ scenarios:
76
learning_rate: 5e-5
77
torch_dtype: bfloat16
78
gradient_accumulation_steps: null
79
- per_device_train_batch_size: 4
+ per_device_train_batch_size: 2
80
logging_steps: 1
81
packing: False
82
adam_epsilon: 1e-8
0 commit comments