Skip to content

Commit 5a1b634

Browse files
committed
adapt both fla-attn and fused_moe
Signed-off-by: Ceng23333 <441651826@qq.com>
1 parent 5bf2e94 commit 5a1b634

1 file changed

Lines changed: 2 additions & 0 deletions

File tree

pyproject.toml

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -13,6 +13,8 @@ requires-python = ">=3.8"

 [project.optional-dependencies]
 # Same interpreter as InfiniCore built with ``--aten=y`` (see vllm_kernel_reuse_evaluation.md).
 vllm = ["vllm==0.19.0"]
+# MiniCPM5 fused stub + jiuge: vLLM fused MoE + helper deps (flash-attn install separately; see InfiniLM/examples/FLASH_ATTN_AND_VLLM_FUSED_MOE.md).
+vllm-fused-moe = ["vllm==0.19.0", "janus>=1.0.0", "xxhash>=3.0.0"]

 classifiers = [
     "Programming Language :: Python :: 3",

0 commit comments

Comments (0)