@@ -167,6 +167,7 @@ class EngineArgs:
167167 'auto': Use native FastDeploy implementation when available, fallback to PaddleFormers.
168168 'fastdeploy': Use only native FastDeploy implementations.
169169 'paddleformers': Use PaddleFormers backend with FastDeploy optimizations.
170+ 'paddlefleet': Use PaddleFleet backend with FastDeploy optimizations.
170171 """
171172 override_pooler_config : Optional [Union [dict , PoolerConfig ]] = None
172173 """
@@ -678,7 +679,7 @@ def __post_init__(self):
678679 "kvcache_storage_backend is only supported when ENABLE_V1_KVCACHE_SCHEDULER=1"
679680 )
680681
681- valid_model_impls = ["auto" , "fastdeploy" , "paddleformers" ]
682+ valid_model_impls = ["auto" , "fastdeploy" , "paddleformers" , "paddlefleet" ]
682683 if self .model_impl not in valid_model_impls :
683684 raise NotImplementedError (
684685 f"not support model_impl: '{ self .model_impl } '. " f"Must be one of: { ', ' .join (valid_model_impls )} "
@@ -1063,13 +1064,14 @@ def add_cli_args(parser: FlexibleArgumentParser) -> FlexibleArgumentParser:
10631064 model_group .add_argument (
10641065 "--model-impl" ,
10651066 type = str ,
1066- choices = ["auto" , "fastdeploy" , "paddleformers" ],
1067+ choices = ["auto" , "fastdeploy" , "paddleformers" , "paddlefleet" ],
10671068 default = EngineArgs .model_impl ,
10681069 help = (
10691070 "Model implementation backend. "
10701071 "'auto': Use native FastDeploy when available, fallback to PaddleFormers. "
10711072 "'fastdeploy': Use only native FastDeploy implementations. "
10721073 "'paddleformers': Use PaddleFormers backend with FastDeploy optimizations."
1074+ " 'paddlefleet': Use PaddleFleet backend with FastDeploy optimizations."
10731075 ),
10741076 )
10751077
0 commit comments