diff --git a/deepmd/backend/jax.py b/deepmd/backend/jax.py
index 9c0055b4f2..2b20d5aa79 100644
--- a/deepmd/backend/jax.py
+++ b/deepmd/backend/jax.py
@@ -62,7 +62,11 @@ def entry_point_hook(self) -> Callable[["Namespace"], None]:
         Callable[[Namespace], None]
             The entry point hook of the backend.
         """
-        raise NotImplementedError
+        from deepmd.jax.entrypoints.main import (
+            main,
+        )
+
+        return main
 
     @property
     def deep_eval(self) -> type["DeepEvalBackend"]:
diff --git a/deepmd/jax/entrypoints/__init__.py b/deepmd/jax/entrypoints/__init__.py
new file mode 100644
index 0000000000..6ceb116d85
--- /dev/null
+++ b/deepmd/jax/entrypoints/__init__.py
@@ -0,0 +1 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
diff --git a/deepmd/jax/entrypoints/freeze.py b/deepmd/jax/entrypoints/freeze.py
new file mode 100644
index 0000000000..fbc126ffc7
--- /dev/null
+++ b/deepmd/jax/entrypoints/freeze.py
@@ -0,0 +1,49 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+"""Freeze utilities for the JAX backend."""
+
+from pathlib import (
+    Path,
+)
+
+from deepmd.backend.suffix import (
+    format_model_suffix,
+)
+from deepmd.jax.utils.serialization import (
+    deserialize_to_file,
+    serialize_from_file,
+)
+
+
+def freeze(
+    *,
+    checkpoint_folder: str,
+    output: str,
+    **kwargs: object,
+) -> None:
+    """Freeze a JAX checkpoint into a serialized model file.
+
+    Parameters
+    ----------
+    checkpoint_folder : str
+        Location of either the checkpoint directory or a folder containing the
+        stable ``checkpoint`` pointer.
+    output : str
+        Output model filename or prefix. The JAX model suffix is added when the
+        filename has no supported backend suffix.
+    **kwargs
+        Other CLI arguments accepted for backend entry-point compatibility.
+    """
+    del kwargs
+
+    checkpoint_path = Path(checkpoint_folder)
+    if (checkpoint_path / "checkpoint").is_file():
+        checkpoint_pointer = (checkpoint_path / "checkpoint").read_text().strip()
+        checkpoint_folder = str(checkpoint_path / checkpoint_pointer)
+
+    output = format_model_suffix(
+        output,
+        preferred_backend="jax",
+        strict_prefer=True,
+    )
+    data = serialize_from_file(checkpoint_folder)
+    deserialize_to_file(output, data)
diff --git a/deepmd/jax/entrypoints/main.py b/deepmd/jax/entrypoints/main.py
new file mode 100644
index 0000000000..a365b1dea8
--- /dev/null
+++ b/deepmd/jax/entrypoints/main.py
@@ -0,0 +1,57 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+"""DeePMD-Kit entry point module."""
+
+import argparse
+from pathlib import (
+    Path,
+)
+
+from deepmd.jax.entrypoints.freeze import (
+    freeze,
+)
+from deepmd.jax.entrypoints.train import (
+    train,
+)
+from deepmd.loggers.loggers import (
+    set_log_handles,
+)
+from deepmd.main import (
+    parse_args,
+)
+
+__all__ = ["main"]
+
+
+def main(args: list[str] | argparse.Namespace | None = None) -> None:
+    """DeePMD-Kit entry point.
+
+    Parameters
+    ----------
+    args : list[str] or argparse.Namespace, optional
+        list of command line arguments, used to avoid calling from the subprocess,
+        as it is quite slow to import tensorflow; if Namespace is given, it will
+        be used directly
+
+    Raises
+    ------
+    RuntimeError
+        if no command was input
+    """
+    if not isinstance(args, argparse.Namespace):
+        args = parse_args(args=args)
+
+    dict_args = vars(args)
+    set_log_handles(
+        args.log_level,
+        Path(args.log_path) if args.log_path else None,
+        mpi_log=None,
+    )
+
+    if args.command == "train":
+        train(**dict_args)
+    elif args.command == "freeze":
+        freeze(**dict_args)
+    elif args.command is None:
+        pass
+    else:
+        raise RuntimeError(f"unknown command {args.command}")
diff --git a/deepmd/jax/entrypoints/train.py b/deepmd/jax/entrypoints/train.py
new file mode 100644
index 0000000000..89f4e8a16c
--- /dev/null
+++ b/deepmd/jax/entrypoints/train.py
@@ -0,0 +1,203 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+"""DeePMD training entrypoint script.
+
+Can handle local training.
+"""
+
+import json
+import logging
+import time
+from typing import (
+    Any,
+)
+
+from deepmd.common import (
+    j_loader,
+)
+from deepmd.jax.env import (
+    jax,
+    jax_export,
+)
+from deepmd.jax.train.trainer import (
+    DPTrainer,
+)
+from deepmd.utils import random as dp_random
+from deepmd.utils.argcheck import (
+    normalize,
+)
+from deepmd.utils.compat import (
+    update_deepmd_input,
+)
+from deepmd.utils.data_system import (
+    get_data,
+)
+from deepmd.utils.summary import SummaryPrinter as BaseSummaryPrinter
+
+__all__ = ["train"]
+
+log = logging.getLogger(__name__)
+
+
+class SummaryPrinter(BaseSummaryPrinter):
+    """Summary printer for JAX."""
+
+    def is_built_with_cuda(self) -> bool:
+        """Check if the backend is built with CUDA."""
+        return jax_export.default_export_platform() == "cuda"
+
+    def is_built_with_rocm(self) -> bool:
+        """Check if the backend is built with ROCm."""
+        return jax_export.default_export_platform() == "rocm"
+
+    def get_compute_device(self) -> str:
+        """Get Compute device."""
+        return jax.default_backend()
+
+    def get_ngpus(self) -> int:
+        """Get the number of GPUs."""
+        return jax.device_count()
+
+    def get_backend_info(self) -> dict:
+        """Get backend information."""
+        return {
+            "Backend": "JAX",
+            "JAX ver": jax.__version__,
+        }
+
+    def get_device_name(self) -> str:
+        """Get the name of the device."""
+        devices = jax.devices()
+        if devices:
+            return devices[0].device_kind
+        else:
+            return "Unknown"
+
+
+def train(
+    *,
+    INPUT: str,
+    init_model: str | None,
+    restart: str | None,
+    output: str,
+    init_frz_model: str | None,
+    mpi_log: str,
+    log_level: int,
+    log_path: str | None,
+    skip_neighbor_stat: bool = False,
+    finetune: str | None = None,
+    use_pretrain_script: bool = False,
+    **kwargs: Any,
+) -> None:
+    """Run DeePMD model training.
+
+    Parameters
+    ----------
+    INPUT : str
+        json/yaml control file
+    init_model : Optional[str]
+        path prefix of checkpoint files or None
+    restart : Optional[str]
+        path prefix of checkpoint files or None
+    output : str
+        path for dump file with arguments
+    init_frz_model : str | None
+        path to frozen model, or None if no frozen model is used
+    mpi_log : str
+        mpi logging mode
+    log_level : int
+        logging level defined by int 0-3
+    log_path : Optional[str]
+        logging file path or None if logs are to be output only to stdout
+    skip_neighbor_stat : bool, default=False
+        skip checking neighbor statistics
+    finetune : Optional[str]
+        path to pretrained model or None
+    use_pretrain_script : bool
+        Whether to use model script in pretrained model when doing init-model or init-frz-model.
+        Note that this option is true and unchangeable for fine-tuning.
+    **kwargs
+        additional arguments
+
+    Raises
+    ------
+    RuntimeError
+        if the training command fails.
+    """
+    # load json database
+    jdata = j_loader(INPUT)
+
+    if init_frz_model:
+        raise NotImplementedError("JAX training does not support init_frz_model yet")
+    if finetune:
+        raise NotImplementedError("JAX training does not support finetune yet")
+    if use_pretrain_script:
+        raise NotImplementedError(
+            "JAX training does not support use_pretrain_script yet"
+        )
+
+    jdata = update_deepmd_input(jdata, warning=True, dump="input_v2_compat.json")
+
+    jdata = normalize(jdata)
+    if not skip_neighbor_stat:
+        jdata = update_sel(jdata)
+
+    with open(output, "w") as fp:
+        json.dump(jdata, fp, indent=4)
+    SummaryPrinter()()
+
+    # make necessary checks
+    assert "training" in jdata
+
+    # init the model
+
+    model = DPTrainer(
+        jdata,
+        init_model=init_model,
+        restart=restart,
+    )
+    rcut = model.model.get_rcut()
+    type_map = model.model.get_type_map()
+    if len(type_map) == 0:
+        ipt_type_map = None
+    else:
+        ipt_type_map = type_map
+
+    # init random seed of data systems
+    seed = jdata["training"].get("seed", None)
+    if seed is not None:
+        seed += jax.process_index()
+        seed = seed % (2**32)
+    dp_random.seed(seed)
+
+    # init data
+    train_data = get_data(jdata["training"]["training_data"], rcut, ipt_type_map, None)
+    train_data.add_data_requirements(model.data_requirements)
+    train_data.print_summary("training")
+    if jdata["training"].get("validation_data", None) is not None:
+        valid_data = get_data(
+            jdata["training"]["validation_data"],
+            rcut,
+            train_data.type_map,
+            None,
+        )
+        valid_data.add_data_requirements(model.data_requirements)
+        valid_data.print_summary("validation")
+    else:
+        valid_data = None
+
+    # train the model with the provided systems in a cyclic way
+    start_time = time.time()
+    model.train(train_data, valid_data)
+    end_time = time.time()
+    log.info("finished training")
+    log.info(f"wall time: {(end_time - start_time):.3f} s")
+
+
+def update_sel(jdata: dict) -> dict:
+    """Update descriptor selections from neighbor statistics when available."""
+    log.info(
+        "Skip neighbor statistics update for JAX training; "
+        "BaseModel.update_sel currently needs more memory than expected."
+    )
+    # TODO: Restore BaseModel.update_sel once the JAX data path avoids OOM.
+    return jdata.copy()
diff --git a/deepmd/jax/train/__init__.py b/deepmd/jax/train/__init__.py
new file mode 100644
index 0000000000..6ceb116d85
--- /dev/null
+++ b/deepmd/jax/train/__init__.py
@@ -0,0 +1 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
diff --git a/deepmd/jax/train/trainer.py b/deepmd/jax/train/trainer.py
new file mode 100644
index 0000000000..180249eaef
--- /dev/null
+++ b/deepmd/jax/train/trainer.py
@@ -0,0 +1,581 @@
+#!/usr/bin/env python3
+# SPDX-License-Identifier: LGPL-3.0-or-later
+"""Local training utilities for the JAX backend."""
+
+import logging
+import os
+import platform
+import shutil
+import time
+from pathlib import (
+    Path,
+)
+from typing import (
+    TextIO,
+)
+
+import numpy as np
+import optax
+import orbax.checkpoint as ocp
+from packaging.version import (
+    Version,
+)
+
+from deepmd.dpmodel.loss.ener import (
+    EnergyLoss,
+)
+from deepmd.dpmodel.model.transform_output import (
+    communicate_extended_output,
+)
+from deepmd.dpmodel.utils.learning_rate import (
+    LearningRateExp,
+)
+from deepmd.dpmodel.utils.nlist import (
+    build_neighbor_list,
+    extend_coord_with_ghosts,
+)
+from deepmd.dpmodel.utils.region import (
+    normalize_coord,
+)
+from deepmd.jax.env import (
+    flax_version,
+    jnp,
+    nnx,
+)
+from deepmd.jax.model.base_model import (
+    BaseModel,
+)
+from deepmd.jax.model.model import (
+    get_model,
+)
+from deepmd.jax.utils.serialization import (
+    serialize_from_file,
+)
+from deepmd.loggers.training import (
+    format_training_message,
+    format_training_message_per_task,
+)
+from deepmd.utils.data import (
+    DataRequirementItem,
+)
+from deepmd.utils.data_system import (
+    DeepmdDataSystem,
+)
+from deepmd.utils.model_stat import (
+    make_stat_input,
+)
+
+log = logging.getLogger(__name__)
+
+
+class DPTrainer:
+    """Train JAX DeePMD models on local devices."""
+
+    def __init__(
+        self,
+        jdata: dict,
+        init_model: str | None = None,
+        restart: str | None = None,
+    ) -> None:
+        """Initialize the trainer from input data and optional checkpoints."""
+        self.init_model = init_model
+        self.restart = restart
+        self.model_def_script = jdata["model"]
+        self.start_step = 0
+        if self.init_model is not None:
+            model_dict = serialize_from_file(self.init_model)
+            self.model = BaseModel.deserialize(model_dict["model"])
+        elif self.restart is not None:
+            model_dict = serialize_from_file(self.restart)
+            self.model = BaseModel.deserialize(model_dict["model"])
+            self.start_step = model_dict.get("model_def_script", {}).get(
+                "current_step",
+                model_dict.get("@variables", {}).get("current_step", 0),
+            )
+        else:
+            # from scratch
+            self.model = get_model(jdata["model"])
+        self.training_param = jdata["training"]
+        self.num_steps = self.training_param["numb_steps"]
+
+        def get_lr_and_coef(lr_param: dict) -> LearningRateExp:
+            lr_type = lr_param.get("type", "exp")
+            if lr_type == "exp":
+                lr = LearningRateExp(
+                    **lr_param,
+                    num_steps=self.num_steps,
+                )
+            else:
+                raise RuntimeError("unknown learning_rate type " + lr_type)
+            return lr
+
+        learning_rate_param = jdata["learning_rate"]
+        self.lr = get_lr_and_coef(learning_rate_param)
+        loss_param = jdata.get("loss", {})
+        loss_param["starter_learning_rate"] = learning_rate_param["start_lr"]
+
+        loss_type = loss_param.get("type", "ener")
+        if loss_type == "ener":
+            self.loss = EnergyLoss.get_loss(loss_param)
+        else:
+            raise RuntimeError("unknown loss type " + loss_type)
+
+        # training
+        tr_data = jdata["training"]
+        self.disp_file = tr_data.get("disp_file", "lcurve.out")
+        self.disp_freq = tr_data.get("disp_freq", 1000)
+        self.save_freq = tr_data.get("save_freq", 1000)
+        self.save_ckpt = tr_data.get("save_ckpt", "model.ckpt")
+        self.max_ckpt_keep = tr_data.get("max_ckpt_keep", 5)
+        self.display_in_training = tr_data.get("disp_training", True)
+        self.timing_in_training = tr_data.get("time_training", True)
+        self.profiling = tr_data.get("profiling", False)
+        self.profiling_file = tr_data.get("profiling_file", "timeline.json")
+        self.enable_profiler = tr_data.get("enable_profiler", False)
+        self.tensorboard = tr_data.get("tensorboard", False)
+        self.tensorboard_log_dir = tr_data.get("tensorboard_log_dir", "log")
+        self.tensorboard_freq = tr_data.get("tensorboard_freq", 1)
+        self.mixed_prec = tr_data.get("mixed_precision", None)
+        self.change_bias_after_training = tr_data.get(
+            "change_bias_after_training", False
+        )
+        self.numb_fparam = self.model.get_dim_fparam()
+
+        if tr_data.get("validation_data", None) is not None:
+            self.valid_numb_batch = max(
+                tr_data["validation_data"].get("numb_btch", 1),
+                1,
+            )
+        else:
+            self.valid_numb_batch = 1
+
+        # if init the graph with the frozen model
+        self.frz_model = None
+        self.ckpt_meta = None
+        self.model_type = None
+
+    @property
+    def data_requirements(self) -> list[DataRequirementItem]:
+        """Labels required by the configured loss."""
+        return self.loss.label_requirement
+
+    def train(
+        self, train_data: DeepmdDataSystem, valid_data: DeepmdDataSystem | None = None
+    ) -> None:
+        """Run the training loop with optional validation data."""
+        model = self.model
+        tx = optax.adam(
+            learning_rate=lambda step: self.lr.value(self.start_step + step),
+        )
+        optimizer = nnx.Optimizer(model, tx, wrt=nnx.Param)
+
+        # data stat
+        if self.init_model is None and self.restart is None:
+            data_stat_nbatch = self.model_def_script.get("data_stat_nbatch", 10)
+            stat_data = make_stat_input(train_data, data_stat_nbatch)
+            stat_data_jax = [
+                {
+                    kk: jnp.asarray(vv) if isinstance(vv, np.ndarray) else vv
+                    for kk, vv in single_data.items()
+                }
+                for single_data in stat_data
+            ]
+            model.atomic_model.compute_or_load_stat(lambda: stat_data_jax)
+
+        def loss_fn(
+            model: BaseModel,
+            lr: float,
+            label_dict: dict[str, jnp.ndarray],
+            extended_coord: jnp.ndarray,
+            extended_atype: jnp.ndarray,
+            nlist: jnp.ndarray,
+            mapping: jnp.ndarray | None,
+            fp: jnp.ndarray | None,
+            ap: jnp.ndarray | None,
+        ) -> jnp.ndarray:
+            model_dict_lower = model.call_common_lower(
+                extended_coord,
+                extended_atype,
+                nlist,
+                mapping,
+                fp,
+                ap,
+            )
+            model_dict = communicate_extended_output(
+                model_dict_lower,
+                model.model_output_def(),
+                mapping,
+                do_atomic_virial=False,
+            )
+            model_dict["atom_energy"] = model_dict["energy"]
+            model_dict["energy"] = model_dict["energy_redu"]
+            model_dict["force"] = model_dict["energy_derv_r"].squeeze(-2)
+            model_dict["virial"] = model_dict["energy_derv_c_redu"].squeeze(-2)
+            loss, more_loss = self.loss(
+                learning_rate=lr,
+                natoms=label_dict["type"].shape[1],
+                model_dict=model_dict,
+                label_dict=label_dict,
+            )
+            return loss
+
+        @nnx.jit
+        def loss_fn_more_loss(
+            model: BaseModel,
+            lr: float,
+            label_dict: dict[str, jnp.ndarray],
+            extended_coord: jnp.ndarray,
+            extended_atype: jnp.ndarray,
+            nlist: jnp.ndarray,
+            mapping: jnp.ndarray | None,
+            fp: jnp.ndarray | None,
+            ap: jnp.ndarray | None,
+        ) -> dict[str, jnp.ndarray]:
+            model_dict_lower = model.call_common_lower(
+                extended_coord,
+                extended_atype,
+                nlist,
+                mapping,
+                fp,
+                ap,
+            )
+            model_dict = communicate_extended_output(
+                model_dict_lower,
+                model.model_output_def(),
+                mapping,
+                do_atomic_virial=False,
+            )
+            model_dict["atom_energy"] = model_dict["energy"]
+            model_dict["energy"] = model_dict["energy_redu"]
+            model_dict["force"] = model_dict["energy_derv_r"].squeeze(-2)
+            model_dict["virial"] = model_dict["energy_derv_c_redu"].squeeze(-2)
+            loss, more_loss = self.loss(
+                learning_rate=lr,
+                natoms=label_dict["type"].shape[1],
+                model_dict=model_dict,
+                label_dict=label_dict,
+            )
+            return more_loss
+
+        @nnx.jit
+        def train_step(
+            model: BaseModel,
+            optimizer: nnx.Optimizer,
+            lr: float,
+            label_dict: dict[str, jnp.ndarray],
+            extended_coord: jnp.ndarray,
+            extended_atype: jnp.ndarray,
+            nlist: jnp.ndarray,
+            mapping: jnp.ndarray | None,
+            fp: jnp.ndarray | None,
+            ap: jnp.ndarray | None,
+        ) -> None:
+            grads = nnx.grad(loss_fn)(
+                model,
+                lr,
+                label_dict,
+                extended_coord,
+                extended_atype,
+                nlist,
+                mapping,
+                fp,
+                ap,
+            )
+            if Version(flax_version) >= Version("0.11.0"):
+                optimizer.update(model, grads)
+            else:
+                optimizer.update(grads)
+
+        start_time = time.time()
+        disp_path = Path(self.disp_file)
+        disp_mode = "a" if self.start_step > 0 and disp_path.exists() else "w"
+        with open(disp_path, disp_mode) as disp_file_fp:
+            for step in range(self.start_step, self.num_steps):
+                batch_data = train_data.get_batch()
+                # numpy to jax
+                jax_data = convert_numpy_data_to_jax_data(batch_data)
+                extended_coord, extended_atype, nlist, mapping, fp, ap = prepare_input(
+                    rcut=model.get_rcut(),
+                    sel=model.get_sel(),
+                    coord=jax_data["coord"],
+                    atype=jax_data["type"],
+                    box=jax_data["box"] if jax_data["find_box"] else None,
+                    fparam=jax_data.get("fparam", None),
+                    aparam=jax_data.get("aparam", None),
+                )
+                train_step(
+                    model,
+                    optimizer,
+                    self.lr.value(step),
+                    jax_data,
+                    extended_coord,
+                    extended_atype,
+                    nlist,
+                    mapping,
+                    fp,
+                    ap,
+                )
+                if self.display_in_training and (
+                    step == 0 or (step + 1) % self.disp_freq == 0
+                ):
+                    wall_time = time.time() - start_time
+                    log.info(
+                        format_training_message(
+                            batch=step + 1,
+                            wall_time=wall_time,
+                        )
+                    )
+                    more_loss = loss_fn_more_loss(
+                        model,
+                        self.lr.value(step),
+                        jax_data,
+                        extended_coord,
+                        extended_atype,
+                        nlist,
+                        mapping,
+                        fp,
+                        ap,
+                    )
+                    if valid_data is not None:
+                        valid_more_loss_list = []
+                        for _ in range(self.valid_numb_batch):
+                            valid_batch_data = valid_data.get_batch()
+                            jax_valid_data = convert_numpy_data_to_jax_data(
+                                valid_batch_data
+                            )
+                            extended_coord, extended_atype, nlist, mapping, fp, ap = (
+                                prepare_input(
+                                    rcut=model.get_rcut(),
+                                    sel=model.get_sel(),
+                                    coord=jax_valid_data["coord"],
+                                    atype=jax_valid_data["type"],
+                                    box=jax_valid_data["box"]
+                                    if jax_valid_data["find_box"]
+                                    else None,
+                                    fparam=jax_valid_data.get("fparam", None),
+                                    aparam=jax_valid_data.get("aparam", None),
+                                )
+                            )
+                            valid_more_loss_list.append(
+                                loss_fn_more_loss(
+                                    model,
+                                    self.lr.value(step),
+                                    jax_valid_data,
+                                    extended_coord,
+                                    extended_atype,
+                                    nlist,
+                                    mapping,
+                                    fp,
+                                    ap,
+                                )
+                            )
+                        valid_more_loss = {
+                            key: sum(loss[key] for loss in valid_more_loss_list)
+                            / len(valid_more_loss_list)
+                            for key in valid_more_loss_list[0]
+                        }
+                    else:
+                        valid_more_loss = None
+                    if disp_file_fp.tell() == 0:
+                        self.print_header(
+                            disp_file_fp,
+                            train_results=more_loss,
+                            valid_results=valid_more_loss,
+                        )
+                    self.print_on_training(
+                        disp_file_fp,
+                        train_results=more_loss,
+                        valid_results=valid_more_loss,
+                        cur_batch=step + 1,
+                        cur_lr=self.lr.value(step),
+                    )
+                    start_time = time.time()
+                if (step + 1) % self.save_freq == 0:
+                    self._save_checkpoint(model, step + 1)
+        if self.num_steps > self.start_step and self.num_steps % self.save_freq != 0:
+            self._save_checkpoint(model, self.num_steps)
+
+    def _save_checkpoint(self, model: BaseModel, step: int) -> None:
+        """Save a JAX checkpoint and update the stable checkpoint pointer."""
+        _, state = nnx.split(model)
+        ckpt_path = Path(f"{self.save_ckpt}-{step}.jax")
+        if ckpt_path.is_dir():
+            # remove old checkpoint if it exists
+            shutil.rmtree(ckpt_path)
+        model_def_script_cpy = self.model_def_script.copy()
+        model_def_script_cpy["current_step"] = step
+        with ocp.Checkpointer(
+            ocp.CompositeCheckpointHandler("state", "model_def_script")
+        ) as checkpointer:
+            checkpointer.save(
+                ckpt_path.absolute(),
+                ocp.args.Composite(
+                    state=ocp.args.StandardSave(state.to_pure_dict()),
+                    model_def_script=ocp.args.JsonSave(model_def_script_cpy),
+                ),
+            )
+        log.info(f"Trained model has been saved to: {ckpt_path!s}")
+        _link_checkpoint(ckpt_path, Path(f"{self.save_ckpt}.jax"))
+        self._cleanup_old_checkpoints()
+        with open("checkpoint", "w") as fp:
+            fp.write(f"{self.save_ckpt}.jax")
+
+    def _cleanup_old_checkpoints(self) -> None:
+        """Remove old checkpoint directories beyond the retention limit."""
+        if self.max_ckpt_keep <= 0:
+            return
+        ckpt_parent = Path(self.save_ckpt).parent
+        ckpt_prefix = Path(self.save_ckpt).name
+        checkpoints = []
+        for path in ckpt_parent.glob(f"{ckpt_prefix}-*.jax"):
+            if not path.is_dir() or path.is_symlink():
+                continue
+            step_text = path.name.removeprefix(f"{ckpt_prefix}-").removesuffix(".jax")
+            if step_text.isdigit():
+                checkpoints.append((int(step_text), path))
+        for _, path in sorted(checkpoints)[: -self.max_ckpt_keep]:
+            shutil.rmtree(path)
+
+    @staticmethod
+    def print_on_training(
+        fp: TextIO,
+        train_results: dict[str, float],
+        valid_results: dict[str, float] | None,
+        cur_batch: int,
+        cur_lr: float,
+    ) -> None:
+        """Append one training/validation loss row to the learning-curve file."""
+        print_str = ""
+        print_str += f"{cur_batch:7d}"
+        if valid_results is not None:
+            prop_fmt = "   %11.2e %11.2e"
+            for k in valid_results.keys():
+                # assert k in train_results.keys()
+                print_str += prop_fmt % (valid_results[k], train_results[k])
+        else:
+            prop_fmt = "   %11.2e"
+            for k in train_results.keys():
+                print_str += prop_fmt % (train_results[k])
+        print_str += f"   {cur_lr:8.1e}\n"
+        log.info(
+            format_training_message_per_task(
+                batch=cur_batch,
+                task_name="trn",
+                rmse=train_results,
+                learning_rate=cur_lr,
+            )
+        )
+        if valid_results is not None:
+            log.info(
+                format_training_message_per_task(
+                    batch=cur_batch,
+                    task_name="val",
+                    rmse=valid_results,
+                    learning_rate=None,
+                )
+            )
+        fp.write(print_str)
+        fp.flush()
+
+    @staticmethod
+    def print_header(
+        fp: TextIO,
+        train_results: dict[str, float],
+        valid_results: dict[str, float] | None,
+    ) -> None:
+        """Write the learning-curve header for the configured loss terms."""
+        print_str = ""
+        print_str += "# {:5s}".format("step")
+        if valid_results is not None:
+            prop_fmt = "   %11s %11s"
+            for k in train_results.keys():
+                print_str += prop_fmt % (k + "_val", k + "_trn")
+        else:
+            prop_fmt = "   %11s"
+            for k in train_results.keys():
+                print_str += prop_fmt % (k + "_trn")
+        print_str += "   {:8s}\n".format("lr")
+        print_str += "# If there is no available reference data, rmse_*_{val,trn} will print nan\n"
+        fp.write(print_str)
+        fp.flush()
+
+
+def _link_checkpoint(source: Path, target: Path) -> None:
+    """Point the stable checkpoint path to the latest checkpoint directory."""
+    if target.exists() or target.is_symlink():
+        if target.is_dir() and not target.is_symlink():
+            shutil.rmtree(target)
+        else:
+            target.unlink()
+    if platform.system() != "Windows":
+        os.symlink(os.path.relpath(source, target.parent), target)
+    else:
+        shutil.copytree(source, target)
+
+
+def prepare_input(
+    *,  # enforce keyword-only arguments
+    rcut: float,
+    sel: list[int],
+    coord: np.ndarray,
+    atype: np.ndarray,
+    box: np.ndarray | None = None,
+    fparam: np.ndarray | None = None,
+    aparam: np.ndarray | None = None,
+) -> tuple[
+    np.ndarray,
+    np.ndarray,
+    np.ndarray,
+    np.ndarray,
+    np.ndarray | None,
+    np.ndarray | None,
+]:
+    """Build extended coordinates and neighbor lists for a training batch."""
+    nframes, nloc = atype.shape[:2]
+    cc, bb, fp, ap = coord, box, fparam, aparam
+    del coord, box, fparam, aparam
+    if bb is not None:
+        coord_normalized = normalize_coord(
+            cc.reshape(nframes, nloc, 3),
+            bb.reshape(nframes, 3, 3),
+        )
+    else:
+        coord_normalized = cc.reshape(nframes, nloc, 3).copy()
+    extended_coord, extended_atype, mapping = extend_coord_with_ghosts(
+        coord_normalized, atype, bb, rcut
+    )
+    nlist = build_neighbor_list(
+        extended_coord,
+        extended_atype,
+        nloc,
+        rcut,
+        sel,
+        # types will be distinguished in the lower interface,
+        # so it doesn't need to be distinguished here
+        distinguish_types=False,
+    )
+    extended_coord = extended_coord.reshape(nframes, -1, 3)
+    return extended_coord, extended_atype, nlist, mapping, fp, ap
+
+
+def convert_numpy_data_to_jax_data(
+    numpy_data: dict[str, np.ndarray | np.floating],
+) -> dict[str, jnp.ndarray | bool]:
+    """Convert NumPy data to JAX data.
+
+    Parameters
+    ----------
+    numpy_data : dict[str, np.ndarray | np.floating]
+        NumPy data
+
+    Returns
+    -------
+    jax_data
+        JAX data
+    """
+    # numpy to jax
+    jax_data = {
+        kk: jnp.asarray(vv) if not kk.startswith("find_") else bool(vv.item())
+        for kk, vv in numpy_data.items()
+    }
+    return jax_data
diff --git a/source/tests/jax/test_training.py b/source/tests/jax/test_training.py
new file mode 100644
index 0000000000..5d44e03e51
--- /dev/null
+++ b/source/tests/jax/test_training.py
@@ -0,0 +1,171 @@
+# SPDX-License-Identifier: LGPL-3.0-or-later
+"""End-to-end tests for the local JAX training entrypoint."""
+
+import argparse
+import json
+import os
+import re
+import shutil
+import subprocess
+import sys
+import tempfile
+import textwrap
+import unittest
+from pathlib import (
+    Path,
+)
+from unittest.mock import (
+    patch,
+)
+
+from deepmd.jax.entrypoints.freeze import (
+    freeze,
+)
+from deepmd.jax.entrypoints.main import (
+    main,
+)
+from deepmd.utils.compat import (
+    convert_optimizer_v31_to_v32,
+)
+
+MODEL_SE_E2_A = {
+    "type_map": ["O", "H", "B"],
+    "descriptor": {
+        "type": "se_e2_a",
+        "sel": [6, 12, 1],
+        "rcut_smth": 0.50,
+        "rcut": 4.00,
+        "neuron": [2, 4, 8],
+        "resnet_dt": False,
+        "axis_neuron": 2,
+        "type_one_side": True,
+        "seed": 1,
+    },
+    "fitting_net": {
+        "neuron": [4, 4, 4],
+        "resnet_dt": True,
+        "seed": 1,
+    },
+    "data_stat_nbatch": 1,
+}
+
+
+TRAINING_SCRIPT = """
+from pathlib import Path
+from unittest.mock import patch
+
+from deepmd.main import main
+
+with patch("deepmd.jax.entrypoints.train.SummaryPrinter.__call__"):
+    main(["--jax", "train", "input.json", "--log-level", "2"])
+
+for path in ["out.json", "lcurve.out", "checkpoint", "model-1.jax"]:
+    if not Path(path).exists():
+        raise FileNotFoundError(path)
+"""
+
+
+_LCURVE_STEP_RE = re.compile(r"^\s*(\d+)\b")
+
+
+def _lcurve_steps(path: Path) -> set[int]:
+    """Return integer step numbers written in an lcurve.out file."""
+    steps: set[int] = set()
+    for line in path.read_text().splitlines():
+        match = _LCURVE_STEP_RE.match(line)
+        if match:
+            steps.add(int(match.group(1)))
+    return steps
+
+
+class TestJAXTraining(unittest.TestCase):
+    """Regression tests for complete JAX training runs."""
+
+    def setUp(self) -> None:
+        """Create a temporary work directory with a one-step training input."""
+        self.work_dir = Path(tempfile.mkdtemp())
+        self.cwd = Path.cwd()
+        os.chdir(self.work_dir)
+
+        source_dir = Path(__file__).resolve().parents[1] / "pt" / "water"
+        shutil.copytree(source_dir, self.work_dir / "water")
+        data_file = [str(self.work_dir / "water" / "data" / "single")]
+
+        with (self.work_dir / "water" / "se_atten.json").open() as f:
+            self.config = json.load(f)
+        self.config = convert_optimizer_v31_to_v32(self.config, warning=False)
+        self.config["model"] = MODEL_SE_E2_A
+        self.config["model"]["data_stat_nbatch"] = 1
+        self.config["training"]["training_data"]["systems"] = data_file
+        self.config["training"]["validation_data"]["systems"] = data_file
+        self.config["training"]["numb_steps"] = 1
+        self.config["training"]["disp_freq"] = 1
+        self.config["training"]["save_freq"] = 1
+        self.config["training"]["save_ckpt"] = "model"
+
+        self.input_file = self.work_dir / "input.json"
+        with self.input_file.open("w") as f:
+            json.dump(self.config, f)
+
+    def tearDown(self) -> None:
+        """Remove temporary training outputs."""
+        os.chdir(self.cwd)
+        shutil.rmtree(self.work_dir)
+
+    def test_train_entrypoint_runs_one_step_from_scratch(self) -> None:
+        """Run local JAX training in a child process and check artifacts."""
+        if os.environ.get("GITHUB_ACTIONS") == "true" and os.environ.get(
+            "CUDA_VISIBLE_DEVICES"
+        ):
+            # TODO: Re-enable this in GitHub CUDA CI once the hosted/self-hosted
+            # runner JAX/PJRT abort is understood. The same test passes on a
+            # local GPU, but the GitHub Actions CUDA job can terminate with
+            # CUDA_ERROR_LAUNCH_FAILED while PJRT releases device buffers.
+            self.skipTest(
+                "JAX training is temporarily skipped on GitHub Actions CUDA runners"
+            )
+
+        proc = subprocess.run(
+            [sys.executable, "-c", textwrap.dedent(TRAINING_SCRIPT)],
+            cwd=self.work_dir,
+            text=True,
+            capture_output=True,
+            timeout=60,
+            check=False,
+        )
+
+        self.assertEqual(proc.returncode, 0, proc.stdout + proc.stderr)
+        self.assertIn(1, _lcurve_steps(self.work_dir / "lcurve.out"))
+
+    @patch("deepmd.jax.entrypoints.freeze.deserialize_to_file")
+    @patch("deepmd.jax.entrypoints.freeze.serialize_from_file")
+    def test_freeze_entrypoint_uses_checkpoint_pointer(
+        self, serialize_from_file, deserialize_to_file
+    ) -> None:
+        """Freeze resolves the stable checkpoint pointer without Hessian options."""
+        checkpoint_dir = self.work_dir / "ckpt"
+        checkpoint_dir.mkdir()
+        (checkpoint_dir / "checkpoint").write_text("model-1.jax")
+        serialize_from_file.return_value = {"model": {}, "model_def_script": {}}
+
+        freeze(checkpoint_folder=str(checkpoint_dir), output="frozen_model")
+
+        serialize_from_file.assert_called_once_with(str(checkpoint_dir / "model-1.jax"))
+        deserialize_to_file.assert_called_once_with(
+            "frozen_model.hlo", serialize_from_file.return_value
+        )
+
+    @patch("deepmd.jax.entrypoints.main.freeze")
+    def test_main_dispatches_freeze(self, freeze_entrypoint) -> None:
+        """JAX CLI main imports and dispatches the freeze command."""
+        args = argparse.Namespace(
+            command="freeze",
+            log_level=2,
+            log_path=None,
+            checkpoint_folder=".",
+            output="frozen_model",
+        )
+
+        main(args)
+
+        freeze_entrypoint.assert_called_once()