1414# limitations under the License.
1515"""
1616
17- import importlib
18-
1917import paddle
2018import triton
2119from paddleformers .utils .log import logger
2220
21+ from fastdeploy .model_executor .layers .utils import get_sm_version
2322from fastdeploy .model_executor .ops .triton_ops import _per_token_group_quant_fp8
23+ from fastdeploy .model_executor .utils import try_import
2424from fastdeploy .platforms import current_platform
2525
2626if current_platform .is_cuda ():
2727 from fastdeploy .model_executor .ops .gpu import per_token_group_fp8_quant
2828
2929
30- from ..utils import get_sm_version
31-
32-
def try_import(modules, name=None, fail_msg=None):
    """Import the first usable candidate module, or an attribute from it.

    Candidates are tried in the order given. A candidate is skipped when
    importing it raises ``ImportError``, or when ``name`` is given and the
    imported module has no such attribute.

    Args:
        modules: A dotted module path, or a list/tuple of dotted module paths.
        name: Optional attribute name to fetch from the imported module.
        fail_msg: Optional message logged as a warning when no candidate
            could be used.

    Returns:
        The imported module when ``name`` is None, the attribute ``name`` of
        the first candidate that provides it otherwise, or None when no
        candidate could be used.

    Raises:
        TypeError: If a candidate reached during the search is not a string.
    """
    # Imported locally so the helper does not rely on a module-level import.
    import importlib

    if not isinstance(modules, (list, tuple)):
        modules = [modules]

    for module_path in modules:
        # Explicit check instead of `assert`, which is stripped under `-O`.
        if not isinstance(module_path, str):
            raise TypeError(f"module path must be a str, got {module_path!r}")

        try:
            module = importlib.import_module(module_path)
        except ImportError:
            # Optional dependency is unavailable; fall through to the next one.
            continue

        if name is None:
            return module
        if hasattr(module, name):
            return getattr(module, name)

    if fail_msg is not None:
        logger.warning(fail_msg)
    return None
56-
# Optional dependency handle for the "paddlefleet.ops" module.
# NOTE(review): presumably None when the package cannot be imported, and no
# fail_msg is passed so nothing would be logged here — confirm against
# try_import's definition.
5730paddlefleet_ops = try_import (["paddlefleet.ops" ])
5831
5932
@@ -72,7 +45,7 @@ def load_deep_gemm():
7245 try :
7346 import logging
7447
75- import paddlefleet . ops .deep_gemm as deep_gemm
48+ import paddlefleet_ops .deep_gemm as deep_gemm
7649
7750 logging .getLogger ().handlers .clear ()
7851 logger .info ("Detected sm100, use PaddleFleet DeepGEMM" )
0 commit comments