3030
3131from monai .apps .utils import get_logger
3232from monai .config import PathLike
33+ from monai .utils .deprecate_utils import deprecated
3334from monai .utils .misc import ensure_tuple , save_obj , set_determinism
34- from monai .utils .module import look_up_option , optional_import
35+ from monai .utils .module import look_up_option , optional_import , pytorch_after
3536from monai .utils .type_conversion import convert_to_dst_type , convert_to_tensor
3637
3738onnx , _ = optional_import ("onnx" )
5758 "save_state" ,
5859 "convert_to_onnx" ,
5960 "convert_to_torchscript" ,
61+ "convert_to_export" ,
6062 "convert_to_trt" ,
6163 "meshgrid_ij" ,
6264 "meshgrid_xy" ,
@@ -793,6 +795,16 @@ def convert_to_onnx(
793795 return onnx_model
794796
795797
798+ def _recursive_to (x , device ):
799+ """Recursively move tensors (and nested tuples/lists of tensors) to *device*."""
800+ if isinstance (x , torch .Tensor ):
801+ return x .to (device )
802+ if isinstance (x , (tuple , list )):
803+ return type (x )(_recursive_to (i , device ) for i in x )
804+ return x
805+
806+
807+ @deprecated (since = "1.5" , removed = "1.7" , msg_suffix = "Use convert_to_export() instead." )
796808def convert_to_torchscript (
797809 model : nn .Module ,
798810 filename_or_obj : Any | None = None ,
@@ -863,6 +875,82 @@ def convert_to_torchscript(
863875 return script_module
864876
865877
def convert_to_export(
    model: nn.Module,
    filename_or_obj: Any | None = None,
    extra_files: dict | None = None,
    verify: bool = False,
    inputs: Sequence[Any] | None = None,
    dynamic_shapes: dict | tuple | None = None,
    device: str | torch.device | None = None,
    rtol: float = 1e-4,
    atol: float = 0.0,
    **kwargs,
) -> torch.export.ExportedProgram:
    """
    Export ``model`` via :func:`torch.export.export`, optionally persist the result
    to a ``.pt2`` file, and optionally check the exported program against the
    original model on sample inputs.

    Args:
        model: source PyTorch model to export.
        filename_or_obj: if not None, a file path string where the exported program is saved.
        extra_files: mapping of filename to contents stored alongside the saved archive.
        verify: if True, run both the original model and the exported program on
            ``inputs`` and compare their outputs. When ``filename_or_obj`` is set,
            verification still uses the in-memory export (see inline note below).
        inputs: required sequence of test tensors mapped to positional arguments of ``model()``.
        dynamic_shapes: dynamic shape specification forwarded to :func:`torch.export.export`;
            see the PyTorch documentation for the accepted formats.
        device: device used for verification; defaults to CUDA when available, else CPU.
        rtol: relative tolerance for output comparison.
        atol: absolute tolerance for output comparison.
        kwargs: extra keyword arguments forwarded to :func:`torch.export.export`.

    Returns:
        The :class:`torch.export.ExportedProgram` produced from ``model``.

    Raises:
        ValueError: if ``inputs`` is None.
    """
    if inputs is None:
        raise ValueError("Input data is required for torch.export.export.")

    model.eval()
    with torch.no_grad():
        exported_program = torch.export.export(model, args=tuple(inputs), dynamic_shapes=dynamic_shapes, **kwargs)

    if filename_or_obj is not None:
        files_to_save: dict[str, Any] = {}
        if extra_files is not None:
            for key, value in extra_files.items():
                # torch.export.save requires str values; decode bytes from legacy callers
                files_to_save[key] = value.decode() if isinstance(value, bytes) else value
        torch.export.save(exported_program, filename_or_obj, extra_files=files_to_save or None)

    if verify:
        target = device if device is not None else torch.device("cuda" if torch.cuda.is_available() else "cpu")

        args_on_device = tuple(_recursive_to(item, target) for item in inputs)

        # Verification always runs against the in-memory export rather than a
        # reloaded file: torch.export.load has no map_location, so reloading can
        # hit device-placement issues.
        exported_module = exported_program.module()
        exported_module.to(target)
        model.to(target)

        with torch.no_grad():
            set_determinism(seed=0)
            expected = ensure_tuple(model(*args_on_device))
            set_determinism(seed=0)
            actual = ensure_tuple(exported_module(*args_on_device))
            set_determinism(seed=None)

        for expected_item, actual_item in zip(expected, actual):
            if isinstance(expected_item, torch.Tensor) or isinstance(actual_item, torch.Tensor):
                torch.testing.assert_close(expected_item, actual_item, rtol=rtol, atol=atol)  # type: ignore

    return exported_program
952+
953+
866954def _onnx_trt_compile (
867955 onnx_model ,
868956 min_shape : Sequence [int ],
@@ -1012,9 +1100,9 @@ def convert_to_trt(
10121100 convert_precision = torch .float32 if precision == "fp32" else torch .half
10131101 inputs = [torch .rand (ensure_tuple (input_shape )).to (target_device )]
10141102
1015- # convert the torch model to a TorchScript model on target device
10161103 model = model .eval ().to (target_device )
10171104 min_input_shape , opt_input_shape , max_input_shape = get_profile_shapes (input_shape , dynamic_batchsize )
1105+ _use_dynamo = pytorch_after (2 , 9 )
10181106
10191107 if use_onnx :
10201108 # set the batch dim as dynamic
@@ -1035,40 +1123,55 @@ def convert_to_trt(
10351123 output_names = onnx_output_names ,
10361124 )
10371125 else :
1038- ir_model = convert_to_torchscript (model , device = target_device , inputs = inputs , use_trace = use_trace )
1039- ir_model .eval ()
1040- # convert the model through the Torch-TensorRT way
1041- ir_model .to (target_device )
1126+ # Torch-TensorRT compilation path
10421127 with torch .no_grad ():
10431128 with torch .cuda .device (device = device ):
10441129 input_placeholder = [
10451130 torch_tensorrt .Input (
10461131 min_shape = min_input_shape , opt_shape = opt_input_shape , max_shape = max_input_shape
10471132 )
10481133 ]
1049- trt_model = torch_tensorrt .compile (
1050- ir_model ,
1051- inputs = input_placeholder ,
1052- enabled_precisions = convert_precision ,
1053- device = torch_tensorrt .Device (f"cuda:{ device } " ),
1054- ir = "torchscript" ,
1055- ** kwargs ,
1056- )
1134+ # Use dynamo IR (torch.export-based) which is the default in newer torch-tensorrt
1135+ if _use_dynamo :
1136+ trt_model = torch_tensorrt .compile (
1137+ model ,
1138+ inputs = input_placeholder ,
1139+ enabled_precisions = convert_precision ,
1140+ device = torch_tensorrt .Device (f"cuda:{ device } " ),
1141+ ir = "dynamo" ,
1142+ ** kwargs ,
1143+ )
1144+ else :
1145+ ir_model = convert_to_torchscript (
1146+ model , device = target_device , inputs = inputs , use_trace = use_trace
1147+ )
1148+ trt_model = torch_tensorrt .compile (
1149+ ir_model ,
1150+ inputs = input_placeholder ,
1151+ enabled_precisions = convert_precision ,
1152+ device = torch_tensorrt .Device (f"cuda:{ device } " ),
1153+ ir = "torchscript" ,
1154+ ** kwargs ,
1155+ )
10571156
10581157 # verify the outputs between the TensorRT model and PyTorch model
10591158 if verify :
10601159 if inputs is None :
10611160 raise ValueError ("Missing input data for verification." )
10621161
1063- trt_model = torch .jit .load (filename_or_obj ) if filename_or_obj is not None else trt_model
1162+ if filename_or_obj is not None :
1163+ if _use_dynamo :
1164+ trt_model = torch .export .load (filename_or_obj ).module ()
1165+ else :
1166+ trt_model = torch .jit .load (filename_or_obj )
10641167
10651168 with torch .no_grad ():
10661169 set_determinism (seed = 0 )
10671170 torch_out = ensure_tuple (model (* inputs ))
10681171 set_determinism (seed = 0 )
10691172 trt_out = ensure_tuple (trt_model (* inputs ))
10701173 set_determinism (seed = None )
1071- # compare TorchScript and PyTorch results
1174+ # compare TensorRT and PyTorch results
10721175 for r1 , r2 in zip (torch_out , trt_out ):
10731176 if isinstance (r1 , torch .Tensor ) or isinstance (r2 , torch .Tensor ):
10741177 torch .testing .assert_close (r1 , r2 , rtol = rtol , atol = atol ) # type: ignore
0 commit comments