self-adaptive physics informed solver

GiovanniCanali · GiovanniCanali · commit afc5614a0204 · 2026-06-04T18:09:35.000+02:00
diff --git a/docs/source/_rst/_code.rst b/docs/source/_rst/_code.rst
@@ -91,6 +91,7 @@ Solvers and Mixins
     Physics-Informed Ensemble Solver <solver/physics_informed_ensemble_solver.rst>
     Autoregressive Single-Model Solver <solver/autoregressive_single_model_solver.rst>
     Autoregressive Ensemble Solver <solver/autoregressive_ensemble_solver.rst>
+    Self-Adaptive Physics-Informed Solver <solver/self_adaptive_physics_informed_solver.rst>
     Single-Model Mixin <solver/mixin/single_model_mixin.rst>
     Multi-Model Mixin <solver/mixin/multi_model_mixin.rst>
     Ensemble Mixin <solver/mixin/ensemble_mixin.rst>
diff --git a/docs/source/_rst/solver/self_adaptive_physics_informed_solver.rst b/docs/source/_rst/solver/self_adaptive_physics_informed_solver.rst
@@ -0,0 +1,11 @@
+Self-Adaptive Physics-Informed Solver
+=======================================
+
+.. currentmodule:: pina.solver.self_adaptive_physics_informed_solver
+
+.. automodule:: pina._src.solver.self_adaptive_physics_informed_solver
+
+.. autoclass:: pina._src.solver.self_adaptive_physics_informed_solver.SelfAdaptivePhysicsInformedSolver
+    :members:
+    :show-inheritance:
+        :noindex:
diff --git a/pina/_src/problem/zoo/inverse_poisson_problem.py b/pina/_src/problem/zoo/inverse_poisson_problem.py
@@ -174,3 +174,5 @@ def __init__(self, load=True, data_size=1.0):
                 self.conditions["data"] = Condition(
                     input=input_data[:n_data], target=output_data[:n_data]
                 )
+                self.conditions["data"].problem = self
+                self.conditions["data"].name = "data"
diff --git a/pina/_src/solver/self_adaptive_physics_informed_solver.py b/pina/_src/solver/self_adaptive_physics_informed_solver.py
@@ -0,0 +1,335 @@
+"""Module for the self-adaptive physics-informed multi-model solver."""
+
+import torch
+from pina._src.solver.mixin.physics_informed_mixin import _PhysicsInformedMixin
+from pina._src.condition.input_equation_condition import InputEquationCondition
+from pina._src.condition.input_target_condition import InputTargetCondition
+from pina._src.solver.multi_model_solver import MultiModelSolver
+from pina._src.core.utils import check_consistency
+from pina._src.condition.domain_equation_condition import (
+    DomainEquationCondition,
+)
+
+
+class SelfAdaptivePhysicsInformedSolver(
+    _PhysicsInformedMixin, MultiModelSolver
+):
+    r"""
+    Multi-model solver for self-adaptive physics-informed learning problems.
+
+    This solver approximates the solution of a differential problem using a
+    trainable model together with condition-wise self-adaptive weights. It is
+    intended for problems whose conditions may include supervised data, equation
+    residuals evaluated on input points, and equation residuals sampled from
+    domains.
+
+    Given a model :math:`\mathcal{M}`, the predicted solution is
+
+    .. math::
+
+        \hat{\mathbf{u}}(\mathbf{x}) = \mathcal{M}(\mathbf{x}).
+
+    For each condition, the solver introduces trainable pointwise weights. These
+    weights are passed through a user-defined weight function :math:`m`,
+    typically chosen to keep the effective weights bounded or positive. The
+    resulting weighted objective encourages the model to focus on regions where
+    the residual is larger.
+
+    For a problem with governing equation operator :math:`\mathcal{A}` in the
+    domain :math:`\Omega` and boundary operator :math:`\mathcal{B}` on the
+    boundary :math:`\partial\Omega`, the objective can be written as
+
+    .. math::
+
+        \mathcal{L}_{\mathrm{problem}} = \frac{1}{N_{\Omega}}
+        \sum_{i=1}^{N_{\Omega}} m(\lambda_{\Omega}^{i}) \mathcal{L}
+        \left( \mathcal{A}[\hat{\mathbf{u}}](\mathbf{x}_i) \right)
+        + \frac{1}{N_{\partial\Omega}} \sum_{i=1}^{N_{\partial\Omega}}
+        m(\lambda_{\partial\Omega}^{i})
+        \mathcal{L} \left( \mathcal{B}[\hat{\mathbf{u}}](\mathbf{x}_i) \right),
+
+    where :math:`\lambda_{\Omega}^{i}` and :math:`\lambda_{\partial\Omega}^{i}`
+    are the self-adaptive weights associated with points in :math:`\Omega` and
+    :math:`\partial\Omega`, respectively, and :math:`\mathcal{L}` is the
+    selected loss function, typically the mean squared error.
+
+    The model parameters and the self-adaptive weights are optimized through a
+    min-max problem:
+
+    .. math::
+
+        \min_{\theta} \max_{\lambda} \mathcal{L}_{\mathrm{problem}},
+
+    where :math:`\theta` denotes the model parameters and :math:`\lambda`
+    denotes the collection of self-adaptive weights.
+
+    .. seealso::
+
+        **Original reference**: McClenny, L. D., & Braga-Neto, U. M. (2023).
+        *Self-adaptive physics-informed neural networks.*
+        Journal of Computational Physics, 474, 111722.
+        DOI: `10.1016/j.jcp.2022.111722
+        <https://doi.org/10.1016/j.jcp.2022.111722>`_.
+    """
+
+    # Accepted conditions types for this solver
+    accepted_conditions_types = (
+        InputTargetCondition,
+        InputEquationCondition,
+        DomainEquationCondition,
+    )
+
+    def __init__(
+        self,
+        problem,
+        model,
+        weight_function=torch.nn.Sigmoid(),
+        optimizer_model=None,
+        optimizer_weights=None,
+        scheduler_model=None,
+        scheduler_weights=None,
+        weighting=None,
+        loss=None,
+    ):
+        """
+        Initialization of the :class:`SelfAdaptivePhysicsInformedSolver` class.
+
+        :param BaseProblem problem: The problem to be solved.
+        :param torch.nn.Module model: The model used by the solver.
+        :param torch.nn.Module weight_function: The weight function used to
+            compute self-adaptive weights. Default is ``torch.nn.Sigmoid()``.
+        :param TorchOptimizer optimizer_model: The optimizer of the main model.
+            If ``None``, the ``torch.optim.Adam`` optimizer with a learning rate
+            of ``0.001`` is used. Default is ``None``.
+        :param TorchOptimizer optimizer_weights: The optimizer of the
+            self-adaptive weights. If ``None``, the ``torch.optim.Adam``
+            optimizer with a learning rate of ``0.001`` is used.
+            Default is ``None``.
+        :param TorchScheduler scheduler_model: The scheduler of the main model.
+            If ``None``, the ``torch.optim.lr_scheduler.ConstantLR`` scheduler
+            with a factor of ``1.0`` is used. Default is ``None``.
+        :param TorchScheduler scheduler_weights: The scheduler of the
+            self-adaptive weights. If ``None``, the
+            ``torch.optim.lr_scheduler.ConstantLR`` scheduler with a factor of
+            ``1.0`` is used. Default is ``None``.
+        :param BaseWeighting weighting: The weighting strategy used to combine
+            condition losses. If ``None``, no weighting is applied. Default is
+            ``None``.
+        :param loss: The loss function used to compute residual losses.
+            If ``None``, :class:`torch.nn.MSELoss` is used. Default is ``None``.
+        :raises ValueError: If ``weight_function`` is not a ``torch.nn.Module``.
+        :raises ValueError: If not all domains have been discretised.
+        """
+        # Check consistency
+        check_consistency(weight_function, torch.nn.Module)
+
+        # Check that all domains have been discretised
+        if not problem.are_all_domains_discretised:
+            raise ValueError(
+                "All domains must be discretised before initializing the "
+                "solver."
+            )
+
+        # Compute the number of points for each condition
+        num_points = {
+            cond: (
+                problem._discretised_domains[cond].shape[0]
+                if isinstance(problem.conditions[cond], DomainEquationCondition)
+                else problem.conditions[cond].data.input.shape[0]
+            )
+            for cond in problem.conditions
+        }
+
+        # Initialize weights container and per-condition parameters
+        weights = torch.nn.Module()
+
+        # Attach the weight function as a submodule
+        weights.func = weight_function
+
+        # Register a torch.nn.Parameter for each condition to store the weights
+        for cond in problem.conditions:
+            p = torch.nn.Parameter(torch.zeros(num_points[cond], 1))
+            setattr(weights, cond, p)
+
+        # Prepare optimizers
+        optimizers = (
+            [optimizer_model, optimizer_weights]
+            if any(o is not None for o in (optimizer_model, optimizer_weights))
+            else None
+        )
+
+        # Prepare schedulers
+        schedulers = (
+            [scheduler_model, scheduler_weights]
+            if any(s is not None for s in (scheduler_model, scheduler_weights))
+            else None
+        )
+
+        # Initialize the base solver
+        MultiModelSolver.__init__(
+            self,
+            problem=problem,
+            models=[model, weights],
+            optimizers=optimizers,
+            schedulers=schedulers,
+            weighting=weighting,
+            loss=loss,
+            use_lt=True,
+        )
+
+    def training_step(self, batch, batch_idx):
+        """
+        Solver training step.
+
+        :param list[tuple[str, dict]] batch: A batch of data. Each element is a
+            tuple containing a condition name and a dictionary of points.
+        :param int batch_idx: The index of the current batch.
+        :return: The loss of the training step.
+        :rtype: torch.Tensor
+        """
+        # Zero the gradients of weights optimizer and compute the loss
+        self.optimizer_weights.instance.zero_grad()
+        loss = self.batch_evaluation_step(batch, batch_idx)
+
+        # Perform the backward pass and complete a step for the weights
+        self.manual_backward(-loss)
+        self.optimizer_weights.instance.step()
+        self.scheduler_weights.instance.step()
+
+        # Zero the gradients of model optimizer and compute the loss again
+        self.optimizer_model.instance.zero_grad()
+        loss = self.batch_evaluation_step(batch, batch_idx)
+
+        # Perform the backward pass and complete a step for the model
+        self.manual_backward(loss)
+        self.optimizer_model.instance.step()
+        self.scheduler_model.instance.step()
+
+        # Log the training loss
+        self.log(
+            name="train_loss",
+            value=loss.item(),
+            batch_size=self.get_batch_size(batch),
+            **self.trainer.logging_kwargs,
+        )
+
+        return loss
+
+    def forward(self, x):
+        """
+        Forward pass through the model.
+
+        :param x: The input data.
+        :type x: torch.Tensor | LabelTensor | Data | Graph
+        :return: The output of the model.
+        :rtype: torch.Tensor | LabelTensor | Data | Graph
+        """
+        return self.model(x)
+
+    def _compute_condition_loss(self, condition, data, batch_idx):
+        """
+        Compute the scalar loss for a given condition and its data.
+
+        :param BaseCondition condition: The condition for which to compute the
+            loss.
+        :param dict data: The data corresponding to the condition.
+        :param int batch_idx: The index of the current batch.
+        :return: The scalar loss for the condition.
+        :rtype: torch.Tensor
+        """
+        # Clone the input tensor if it exists to avoid in-place modifications
+        if "input" in data and hasattr(data["input"], "clone"):
+            data = dict(data)
+            data["input"] = data["input"].clone()
+
+        # Compute and store the residual tensor for the condition
+        self.residual_tensor = condition.evaluate(data, self)
+
+        # Retrieve condition name for more complex weighting schemes
+        condition_name = condition.name
+
+        # Apply the activation function to the condition-specific weights
+        weight_param = getattr(self.weights, condition_name)
+        weight_tensor = self.weights.func(weight_param)
+
+        # Compute the tensor loss from the residual tensor
+        condition_tensor_loss = self._loss_from_residual(condition_name)
+
+        # Get the correct indices to retrieve the weights for the current batch
+        len_residuals = self.residual_tensor.shape[0]
+
+        # Get the total number of points, together with the start / end indices
+        total_points = weight_param.shape[0]
+        start = (batch_idx * len_residuals) % total_points
+        end = start + len_residuals
+
+        # Retrieve the weights for the current batch using modular indexing
+        idx = torch.arange(start, end, device=self.residual_tensor.device)
+        idx = idx % total_points
+
+        # Compute the scalar loss from the tensor loss and return it
+        condition_scalar_loss = self._apply_reduction(
+            condition_tensor_loss * weight_tensor[idx]
+        )
+
+        return condition_scalar_loss
+
+    @property
+    def model(self):
+        """
+        The single model used by the solver.
+
+        :return: The single model used by the solver.
+        :rtype: torch.nn.Module
+        """
+        return self._pina_models[0]
+
+    @property
+    def weights(self):
+        """
+        The self-adaptive weights used by the solver.
+
+        :return: The self-adaptive weights used by the solver.
+        :rtype: torch.nn.Module
+        """
+        return self._pina_models[1]
+
+    @property
+    def optimizer_model(self):
+        """
+        The optimizer for the model used by the solver.
+
+        :return: The optimizer for the model used by the solver.
+        :rtype: TorchOptimizer
+        """
+        return self.optimizers[0]
+
+    @property
+    def optimizer_weights(self):
+        """
+        The optimizer for the weights used by the solver.
+
+        :return: The optimizer for the weights used by the solver.
+        :rtype: TorchOptimizer
+        """
+        return self.optimizers[1]
+
+    @property
+    def scheduler_model(self):
+        """
+        The scheduler for the model used by the solver.
+
+        :return: The scheduler for the model used by the solver.
+        :rtype: TorchScheduler
+        """
+        return self.schedulers[0]
+
+    @property
+    def scheduler_weights(self):
+        """
+        The scheduler for the weights used by the solver.
+
+        :return: The scheduler for the weights used by the solver.
+        :rtype: TorchScheduler
+        """
+        return self.schedulers[1]
diff --git a/pina/solver/__init__.py b/pina/solver/__init__.py
@@ -12,6 +12,7 @@
     "PhysicsInformedEnsembleSolver",
     "AutoregressiveSingleModelSolver",
     "AutoregressiveEnsembleSolver",
+    "SelfAdaptivePhysicsInformedSolver",
 ]
 
 
@@ -36,3 +37,6 @@
 from pina._src.solver.autoregressive_ensemble_solver import (
     AutoregressiveEnsembleSolver,
 )
+from pina._src.solver.self_adaptive_physics_informed_solver import (
+    SelfAdaptivePhysicsInformedSolver,
+)
diff --git a/tests/test_solver/test_physics_informed_ensemble_solver.py b/tests/test_solver/test_physics_informed_ensemble_solver.py
@@ -39,7 +39,7 @@ def define_direct_problem_model(n_pts=10, n_models=3):
 def define_inverse_problem_model(n_pts=10, n_models=5):
 
     # Initialize inverse problem
-    problem = InversePoisson2DSquareProblem()
+    problem = InversePoisson2DSquareProblem(load=True, data_size=0.01)
     problem.discretise_domain(n_pts)
 
     # Initialize the models
diff --git a/tests/test_solver/test_physics_informed_single_model_solver.py b/tests/test_solver/test_physics_informed_single_model_solver.py
@@ -38,7 +38,7 @@ def define_direct_problem_model(n_pts=10):
 def define_inverse_problem_model(n_pts=10):
 
     # Initialize inverse problem
-    problem = InversePoisson2DSquareProblem()
+    problem = InversePoisson2DSquareProblem(load=True, data_size=0.01)
     problem.discretise_domain(n_pts)
 
     # Initialize the model
diff --git a/tests/test_solver/test_self_adaptive_physics_informed_solver.py b/tests/test_solver/test_self_adaptive_physics_informed_solver.py

Original file line number	Diff line number	Diff line change
`@@ -174,3 +174,5 @@ def __init__(self, load=True, data_size=1.0):`
`174`	`174`	`self.conditions["data"] = Condition(`
`175`	`175`	`input=input_data[:n_data], target=output_data[:n_data]`
`176`	`176`	`)`
	`177`	`+ self.conditions["data"].problem = self`
	`178`	`+ self.conditions["data"].name = "data"`
Original file line number	Diff line number	Diff line change
`@@ -12,6 +12,7 @@`
`12`	`12`	`"PhysicsInformedEnsembleSolver",`
`13`	`13`	`"AutoregressiveSingleModelSolver",`
`14`	`14`	`"AutoregressiveEnsembleSolver",`
	`15`	`+ "SelfAdaptivePhysicsInformedSolver",`
`15`	`16`	`]`
`16`	`17`
`17`	`18`
`@@ -36,3 +37,6 @@`
`36`	`37`	`from pina._src.solver.autoregressive_ensemble_solver import (`
`37`	`38`	`AutoregressiveEnsembleSolver,`
`38`	`39`	`)`
	`40`	`+from pina._src.solver.self_adaptive_physics_informed_solver import (`
	`41`	`+ SelfAdaptivePhysicsInformedSolver,`
	`42`	`+)`