We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
2 parents 9fcf589 + ab7a7ce commit 61c225f Copy full SHA for 61c225f
1 file changed
src/maxtext/configs/post_train/rl.yml
@@ -23,8 +23,7 @@ sampler_devices_fraction: 0.5
23
chips_per_vm: 4 # depends on hardware, for v5p this is 4
24
num_trainer_slices: -1
25
num_samplers_slices: -1
26
-# Only specify rollout_data_parallelism when you would like to use more than one model
27
-# replicas in rollout. If not specified, rollout_tensor_parallelism will be auto-determined.
+# If rollout_data_parallelism is not specified, it will be auto-determined.
28
rollout_data_parallelism: -1
29
rollout_tensor_parallelism: 1
30
rollout_expert_parallelism: 1
0 commit comments