Commit 051ed55

Add conformal quantile regression
1 parent 905a6d6 commit 051ed55

File tree

3 files changed (+338, -21 lines)

autoemulate/emulators/conformal.py

Lines changed: 225 additions & 18 deletions
@@ -1,7 +1,8 @@
 import math
+from typing import Literal
 
 import torch
-from torch import Tensor, nn
+from torch import nn
 from torch.optim.lr_scheduler import LRScheduler
 
 from autoemulate.core.device import TorchDeviceMixin
@@ -10,6 +11,69 @@
 from autoemulate.emulators.nn.mlp import MLP
 
 
+class QuantileLoss(nn.Module):
+    """Quantile loss for quantile regression.
+
+    This loss function asymmetrically penalizes over- and under-predictions, enabling
+    the model to learn specific quantiles of the conditional distribution.
+    """
+
+    def __init__(self, quantile: float):
+        """Initialize quantile loss.
+
+        Parameters
+        ----------
+        quantile: float
+            Target quantile level in (0, 1). For example, 0.1 for 10th percentile, 0.5
+            for median, 0.9 for 90th percentile.
+        """
+        super().__init__()
+        if not 0 < quantile < 1:
+            msg = f"Quantile must be in (0, 1), got {quantile}"
+            raise ValueError(msg)
+        self.quantile = quantile
+
+    def forward(self, y_pred: TensorLike, y_true: TensorLike) -> TensorLike:
+        """Compute quantile loss.
+
+        Parameters
+        ----------
+        y_pred: TensorLike
+            Predicted values.
+        y_true: TensorLike
+            True target values.
+
+        Returns
+        -------
+        TensorLike
+            Scalar loss value.
+        """
+        errors = y_true - y_pred
+        return torch.max(self.quantile * errors, (self.quantile - 1) * errors).mean()
+
+
+class QuantileMLP(MLP):
+    """MLP with quantile loss for quantile regression."""
+
+    def __init__(self, quantile: float, **kwargs):
+        """Initialize quantile MLP.
+
+        Parameters
+        ----------
+        quantile: float
+            Target quantile level in (0, 1).
+        **kwargs
+            Keyword arguments passed to MLP parent class.
+        """
+        super().__init__(**kwargs)
+        self.quantile = quantile
+        self.quantile_loss = QuantileLoss(quantile)
+
+    def loss_func(self, y_pred, y_true):
+        """Quantile loss function."""
+        return self.quantile_loss(y_pred, y_true)
+
+
 class Conformal(Emulator):
     """Conformal Uncertainty Quantification (UQ) wrapper for emulators.
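A quick way to sanity-check the added QuantileLoss: minimizing the pinball loss over a constant prediction recovers the empirical quantile of the targets. A minimal standalone sketch in plain torch (the `pinball` helper below just inlines `QuantileLoss.forward` from the diff above):

import torch

def pinball(y_pred, y_true, q):
    # Inlined from QuantileLoss.forward above.
    errors = y_true - y_pred
    return torch.max(q * errors, (q - 1) * errors).mean()

torch.manual_seed(0)
y = torch.randn(10_000)

# Fit a single constant by gradient descent; it should drift towards the
# empirical 0.9 quantile of y (about 1.28 for a standard normal).
theta = torch.zeros(1, requires_grad=True)
opt = torch.optim.SGD([theta], lr=0.1)
for _ in range(2_000):
    opt.zero_grad()
    pinball(theta, y, 0.9).backward()
    opt.step()

print(theta.item(), torch.quantile(y, 0.9).item())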
@@ -26,6 +90,8 @@ def __init__(
         device: DeviceLike | None = None,
         calibration_ratio: float = 0.2,
         n_samples: int = 1000,
+        method: Literal["split", "quantile"] = "split",
+        quantile_emulator_kwargs: dict | None = None,
     ):
         """Initialize a conformal emulator.
@@ -42,8 +108,16 @@ def __init__(
             Fraction of the training data to reserve for calibration if explicit
             validation data is not provided. Must lie in (0, 1). Defaults to 0.2.
         n_samples: int
-            Number of samples used for sampling-based predictions or
-            internal procedures. Defaults to 1000.
+            Number of samples used for sampling-based predictions or internal
+            procedures. Defaults to 1000.
+        method: Literal["split", "quantile"]
+            Conformalization method to use:
+            - "split": Standard split conformal with constant-width intervals
+            - "quantile": Conformalized Quantile Regression (CQR) with input-dependent
+              intervals. Defaults to "split".
+        quantile_emulator_kwargs: dict | None
+            Additional keyword arguments for the quantile emulators when
+            method="quantile". Defaults to None.
         """
         self.emulator = emulator
         self.supports_grad = emulator.supports_grad
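For orientation, this is how the two new arguments documented above would be passed. A hypothetical call, where `my_emulator`, `x`, and `y` are placeholders for a base emulator and training tensors, not names from this diff:

# Hypothetical usage of the signature documented above.
conformal = Conformal(
    emulator=my_emulator,
    alpha=0.9,                  # target 90% predictive coverage
    calibration_ratio=0.2,      # hold out 20% of training data for calibration
    method="quantile",          # CQR instead of standard split conformal
    quantile_emulator_kwargs={"epochs": 200, "lr": 1e-3},
)
conformal.fit(x, y)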
@@ -53,9 +127,14 @@ def __init__(
         if not 0 < calibration_ratio < 1:
             msg = "Calibration ratio must lie strictly between 0 and 1."
             raise ValueError(msg)
+        if method not in {"split", "quantile"}:
+            msg = f"Method must be 'split' or 'quantile', got '{method}'."
+            raise ValueError(msg)
         self.alpha = alpha  # desired predictive coverage (e.g., 0.95)
         self.calibration_ratio = calibration_ratio
         self.n_samples = n_samples
+        self.method = method
+        self.quantile_emulator_kwargs = quantile_emulator_kwargs or {}
         TorchDeviceMixin.__init__(self, device=device)
         self.supports_grad = emulator.supports_grad
 
@@ -98,36 +177,129 @@ def _fit(
         else:
             x_cal, y_true_cal = validation_data
 
+        # Fit the base emulator
         self.emulator.fit(x_train, y_train, validation_data=None)
 
-        with torch.no_grad():
-            n_cal = x_cal.shape[0]
-            # Check calibration data is non-empty
-            if n_cal == 0:
-                msg = "Calibration set must contain at least one sample."
-                raise ValueError(msg)
+        n_cal = x_cal.shape[0]
+        # Check calibration data is non-empty
+        if n_cal == 0:
+            msg = "Calibration set must contain at least one sample."
+            raise ValueError(msg)
 
+        with torch.no_grad():
             # Predict and calculate residuals
             y_pred_cal = self.output_to_tensor(self.emulator.predict(x_cal))
+
+            if self.method == "split":
+                # Standard split conformal: compute global quantile of residuals
                 residuals = torch.abs(y_true_cal - y_pred_cal)
 
-            # Apply finite-sample correction to quantile level to ensure valid coverage
+                # Apply finite-sample correction to quantile level
                 quantile_level = min(1.0, math.ceil((n_cal + 1) * self.alpha) / n_cal)
 
-            # Calibrate over the batch dim with a separate quantile for each output
+                # Calibrate over the batch dim with a separate quantile per output
                 self.q = torch.quantile(residuals, quantile_level, dim=0)
 
+            elif self.method == "quantile":
+                # Conformalized Quantile Regression: train quantile regressors
+                self._fit_quantile_regressors(x_train, y_train, x_cal, y_true_cal)
+
         self.is_fitted_ = True
 
-    def _predict(self, x: Tensor, with_grad: bool) -> DistributionLike:
-        pred = self.emulator.predict(x, with_grad)
-        mean = self.output_to_tensor(pred)
-        q = self.q.to(mean.device)
-        return torch.distributions.Independent(
-            torch.distributions.Uniform(mean - q, mean + q),
-            reinterpreted_batch_ndims=mean.ndim - 1,
+    def _fit_quantile_regressors(
+        self,
+        x_train: TensorLike,
+        y_train: TensorLike,
+        x_cal: TensorLike,
+        y_true_cal: TensorLike,
+    ) -> None:
+        """Fit quantile regressors for CQR method.
+
+        Trains two quantile regressors to predict lower and upper quantiles,
+        then calibrates the width using the calibration set.
+        """
+        # Calculate quantile levels
+        lower_q = (1 - self.alpha) / 2
+        upper_q = 1 - lower_q
+
+        # Create quantile regression emulators
+        mlp_kwargs = {
+            "epochs": 100,
+            "batch_size": 16,
+            "lr": 1e-2,
+            **self.quantile_emulator_kwargs,
+        }
+
+        # Lower quantile emulator
+        self.lower_quantile_emulator = QuantileMLP(
+            lower_q, x=x_train, y=y_train, device=self.device, **mlp_kwargs
         )
 
+        # Upper quantile emulator
+        self.upper_quantile_emulator = QuantileMLP(
+            upper_q, x=x_train, y=y_train, device=self.device, **mlp_kwargs
+        )
+
+        # Fit the quantile emulators
+        self.lower_quantile_emulator.fit(x_train, y_train, validation_data=None)
+        self.upper_quantile_emulator.fit(x_train, y_train, validation_data=None)
+
+        # Predict quantiles on calibration set
+        with torch.no_grad():
+            lower_pred_cal = self.output_to_tensor(
+                self.lower_quantile_emulator.predict(x_cal)
+            )
+            upper_pred_cal = self.output_to_tensor(
+                self.upper_quantile_emulator.predict(x_cal)
+            )
+
+        # Calculate conformalization scores (non-conformity scores)
+        # For CQR, the score is max(lower - y, y - upper)
+        scores = torch.maximum(
+            lower_pred_cal - y_true_cal, y_true_cal - upper_pred_cal
+        )
+
+        # Apply finite-sample correction
+        n_cal = x_cal.shape[0]
+        quantile_level = min(1.0, math.ceil((n_cal + 1) * self.alpha) / n_cal)
+
+        # Compute the correction term per output dimension
+        self.q_cqr = torch.quantile(scores, quantile_level, dim=0)
+
+    def _predict(self, x: TensorLike, with_grad: bool) -> DistributionLike:
+        if self.method == "split":
+            # Standard split conformal: constant-width intervals
+            pred = self.emulator.predict(x, with_grad)
+            mean = self.output_to_tensor(pred)
+            q = self.q.to(mean.device)
+            return torch.distributions.Independent(
+                torch.distributions.Uniform(mean - q, mean + q),
+                reinterpreted_batch_ndims=mean.ndim - 1,
+            )
+
+        if self.method == "quantile":
+            # CQR: input-dependent intervals
+            lower_pred = self.output_to_tensor(
+                self.lower_quantile_emulator.predict(x, with_grad)
+            )
+            upper_pred = self.output_to_tensor(
+                self.upper_quantile_emulator.predict(x, with_grad)
+            )
+            q_cqr = self.q_cqr.to(lower_pred.device)
+
+            # Apply calibration correction
+            lower_bound = lower_pred - q_cqr
+            upper_bound = upper_pred + q_cqr
+
+            # Return uniform distribution over the calibrated interval
+            return torch.distributions.Independent(
+                torch.distributions.Uniform(lower_bound, upper_bound),
+                reinterpreted_batch_ndims=lower_bound.ndim - 1,
+            )
+
+        msg = f"Unknown method: {self.method}"
+        raise ValueError(msg)
+
 
 class ConformalMLP(Conformal, PyTorchBackend):
     """Conformal UQ with an MLP.
@@ -146,6 +318,7 @@ def __init__(
         device: DeviceLike | None = None,
         alpha: float = 0.95,
         calibration_ratio: float = 0.2,
+        method: Literal["split", "quantile"] = "split",
         activation_cls: type[nn.Module] = nn.ReLU,
         loss_fn_cls: type[nn.Module] = nn.MSELoss,
         epochs: int = 100,
@@ -160,6 +333,7 @@ def __init__(
         random_seed: int | None = None,
         scheduler_cls: type[LRScheduler] | None = None,
         scheduler_params: dict | None = None,
+        quantile_emulator_kwargs: dict | None = None,
     ):
         """
         Initialize an ensemble of MLPs.
@@ -181,6 +355,11 @@ def __init__(
         calibration_ratio: float
             Fraction of training samples to hold out for calibration when an explicit
             validation set is not provided.
+        method: Literal["split", "quantile"]
+            Conformalization method:
+            - "split": Standard split conformal (constant-width intervals)
+            - "quantile": Conformalized Quantile Regression (input-dependent intervals)
+            Defaults to "split".
         activation_cls: type[nn.Module]
             Activation function to use in the hidden layers. Defaults to `nn.ReLU`.
         loss_fn_cls: type[nn.Module]
@@ -218,6 +397,9 @@ def __init__(
             None.
         scheduler_params: dict | None
             Additional keyword arguments related to the scheduler.
+        quantile_emulator_kwargs: dict | None
+            Additional keyword arguments for the quantile emulators when
+            method="quantile". Defaults to None.
         """
         nn.Module.__init__(self)
 
@@ -242,12 +424,37 @@ def __init__(
             scheduler_cls=scheduler_cls,
             scheduler_params=scheduler_params,
         )
+
+        quantile_defaults = {
+            "standardize_x": standardize_x,
+            "standardize_y": standardize_y,
+            "activation_cls": activation_cls,
+            "loss_fn_cls": loss_fn_cls,
+            "epochs": epochs,
+            "batch_size": batch_size,
+            "layer_dims": layer_dims,
+            "weight_init": weight_init,
+            "scale": scale,
+            "bias_init": bias_init,
+            "dropout_prob": dropout_prob,
+            "lr": lr,
+            "params_size": params_size,
+            "random_seed": random_seed,
+            "scheduler_cls": scheduler_cls,
+            "scheduler_params": scheduler_params,
+        }
+        merged_quantile_kwargs = {
+            **quantile_defaults,
+            **(quantile_emulator_kwargs or {}),
+        }
         Conformal.__init__(
             self,
             emulator=emulator,
             alpha=alpha,
             device=device,
             calibration_ratio=calibration_ratio,
+            method=method,
+            quantile_emulator_kwargs=merged_quantile_kwargs,
         )
 
     @staticmethod
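Finally, a sketch of exercising the new method end to end, with an empirical coverage check on heteroscedastic data, the case where CQR's input-dependent intervals should pay off. Only the keyword arguments shown in this diff are confirmed by it; the positional `x, y` constructor arguments and reading the interval bounds via `dist.base_dist` (an Independent-wrapped Uniform, per `_predict` above) are assumptions about the surrounding API:

import torch
from autoemulate.emulators.conformal import ConformalMLP

# Toy heteroscedastic data: noise grows with x.
torch.manual_seed(0)
x = torch.rand(1_000, 1)
y = torch.sin(6 * x) + x * torch.randn(1_000, 1)

# Assumed constructor shape (x, y first), matching the QuantileMLP calls above.
emulator = ConformalMLP(x, y, alpha=0.9, method="quantile", epochs=200)
emulator.fit(x, y)

# Empirical coverage on fresh data should land near alpha = 0.9.
x_test = torch.rand(500, 1)
y_test = torch.sin(6 * x_test) + x_test * torch.randn(500, 1)
dist = emulator.predict(x_test)
inside = (y_test >= dist.base_dist.low) & (y_test <= dist.base_dist.high)
print(inside.float().mean())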