@@ -72,6 +72,7 @@ def __init__(
         optimizer=None,
         scheduler=None,
         weighting=None,
+        loss=None,
         eta=0.001,
         gamma=0.999,
     ):
@@ -88,6 +89,9 @@ def __init__(
8889 scheduler is used. Default is ``None``.
8990 :param WeightingInterface weighting: The weighting schema to be used.
9091 If ``None``, no weighting schema is used. Default is ``None``.
92+ :param torch.nn.Module loss: The loss function to be minimized.
93+ If ``None``, the :class:`torch.nn.MSELoss` loss is used.
94+ Default is `None`.
9195 :param float | int eta: The learning rate for the weights of the
9296 residuals. Default is ``0.001``.
9397 :param float gamma: The decay parameter in the update of the weights
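
As a quick illustration of the interface the new docstring assumes (plain ``torch`` only; the names below are chosen for the example and are not part of this diff), any standard loss module is a ``torch.nn.Module`` that exposes a ``reduction`` attribute and can be passed in place of the default ``torch.nn.MSELoss``:

```python
import torch

# Candidate loss modules for the new ``loss`` argument; all are torch.nn.Module
# subclasses and all default to reduction="mean".
for candidate in (torch.nn.MSELoss(), torch.nn.L1Loss(), torch.nn.HuberLoss()):
    print(type(candidate).__name__, candidate.reduction)
```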
@@ -102,7 +106,7 @@ def __init__(
             optimizer=optimizer,
             scheduler=scheduler,
             weighting=weighting,
-            loss=torch.nn.MSELoss(reduction="none"),
+            loss=loss,
         )

         # check consistency
@@ -130,6 +134,12 @@ def __init__(
             self.register_buffer(f"weight_{cond}", buffer_tensor)
             self.weights[cond] = getattr(self, f"weight_{cond}")

+        # Extract the reduction method from the loss function
+        self._reduction = self._loss_fn.reduction
+
+        # Set the loss function to return non-aggregated losses
+        self._loss_fn = type(self._loss_fn)(reduction="none")
+
     def training_step(self, batch, batch_idx, **kwargs):
         """
         Solver training step. It computes the optimization cycle and aggregates
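
For clarity, a minimal standalone sketch of the re-instantiation trick added above, using only ``torch`` (variable names here are illustrative, not taken from the diff): the reduction requested by the user is remembered, while the loss object itself is rebuilt with ``reduction="none"`` so that it returns one value per point:

```python
import torch

# A user-supplied loss with its own reduction setting.
user_loss = torch.nn.MSELoss(reduction="sum")

# Remember the requested reduction, then rebuild the same loss class unreduced.
reduction = user_loss.reduction                      # "sum"
pointwise_loss = type(user_loss)(reduction="none")   # same class, per-point output

pred, target = torch.randn(4, 1), torch.zeros(4, 1)
print(pointwise_loss(pred, target).shape)            # torch.Size([4, 1])
```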
@@ -166,7 +176,7 @@ def validation_step(self, batch, **kwargs):

         # Aggregate losses for each condition
         for cond, loss in losses.items():
-            losses[cond] = losses[cond].mean()
+            losses[cond] = self._apply_reduction(loss=losses[cond])

         loss = (sum(losses.values()) / len(losses)).as_subclass(torch.Tensor)
         self.store_log("val_loss", loss, self.get_batch_size(batch))
@@ -189,7 +199,7 @@ def test_step(self, batch, **kwargs):

         # Aggregate losses for each condition
         for cond, loss in losses.items():
-            losses[cond] = losses[cond].mean()
+            losses[cond] = self._apply_reduction(loss=losses[cond])

         loss = (sum(losses.values()) / len(losses)).as_subclass(torch.Tensor)
         self.store_log("test_loss", loss, self.get_batch_size(batch))
@@ -228,7 +238,9 @@ def _optimization_cycle(self, batch, batch_idx, **kwargs):
                 device=res.device,
             ) % len(self.problem.input_pts[cond])

-            losses[cond] = (res * self.weights[cond][idx]).mean()
+            losses[cond] = self._apply_reduction(
+                loss=(res * self.weights[cond][idx])
+            )

         # store log
         self.store_log(
@@ -275,3 +287,26 @@ def _update_weights(self, batch, batch_idx, residuals):
             weights = self.weights[cond]
             update = self.gamma * weights[idx] + r_norm
             weights[idx] = update.detach()
+
+    def _apply_reduction(self, loss):
+        """
+        Apply the specified reduction to the loss. The reduction is deferred
+        until the end of the optimization cycle to allow residual-based weights
+        to be applied to each point beforehand.
+
+        :param torch.Tensor loss: The loss tensor to be reduced.
+        :return: The reduced loss tensor.
+        :rtype: torch.Tensor
+        :raises ValueError: If the reduction method is neither "mean" nor "sum".
+        """
+        # Apply the specified reduction method
+        if self._reduction == "mean":
+            return loss.mean()
+        if self._reduction == "sum":
+            return loss.sum()
+
+        # Raise an error if the reduction method is not recognized
+        raise ValueError(
+            f"Unknown reduction: {self._reduction}."
+            " Supported reductions are 'mean' and 'sum'."
+        )
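
To show why the reduction is deferred, here is a small self-contained sketch (the tensors and names are assumed for illustration, not part of the diff): the per-point losses are first scaled by the residual-based weights, and only then reduced with the reduction the user originally requested:

```python
import torch

loss_fn = torch.nn.MSELoss(reduction="none")   # always unreduced internally
requested_reduction = "mean"                   # reduction taken from the user's loss

# Per-point losses and per-point residual-based weights (illustrative values).
per_point = loss_fn(torch.randn(8, 1), torch.zeros(8, 1))
weights = torch.rand(8, 1)

# Weight each point, then apply the deferred reduction.
weighted = per_point * weights
loss = weighted.mean() if requested_reduction == "mean" else weighted.sum()
print(loss)
```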