We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 7ca0434, commit 59120b6 (Copy full SHA for 59120b6)
1 file changed
xtuner/v1/ray/rollout/lmdeploy.py
@@ -349,6 +349,11 @@ def _transform_rollout_config_to_server_configs(self) -> Namespace:
349
{
350
"LMDEPLOY_DP_MASTER_ADDR": dist_addr,
351
"LMDEPLOY_DP_MASTER_PORT": dist_port,
352
+ # DEEPEP_MAX_TOKENS_PER_RANK is required by DLBlas's DeepEP
353
+ # token dispatcher used in lmdeploy EP mode. Without it,
354
+ # lmdeploy will fail during warmup.
355
+ # Ref: https://github.com/DeepLink-org/DLBlas/blob/aae23445/dlblas/layers/moe/token_dispatcher.py#L81
356
+ # Ref: https://github.com/InternLM/lmdeploy/blob/81627e3d/lmdeploy/utils.py#L375
357
"DEEPEP_MAX_TOKENS_PER_RANK": str(max_batch_size),
358
}
359
)
0 commit comments