Source code for ise.models.iseflow

"""ISEFlow hybrid ice sheet emulator — base class and pretrained variants.

This module is the primary user-facing entry point for running and training
ISEFlow emulators.  It provides:

ISEFlow (base class)
--------------------
A hybrid ``torch.nn.Module`` combining:

- ``NormalizingFlow`` — conditional autoregressive flow trained first via
  maximum likelihood.  At inference time it provides (a) a latent
  representation ``z`` fed as extra context to the ensemble, and (b) the
  **aleatoric** uncertainty estimate via Monte Carlo sampling.
- ``DeepEnsemble`` — ensemble of LSTMs trained on ``[X, z]`` (original
  features concatenated with the NF latent).  Disagreement across members
  gives the **epistemic** uncertainty.

Training is sequential and order-sensitive: the NF must be trained before
the DE so that the latent features ``z`` are meaningful::

    from ise.models.iseflow import ISEFlow
    from ise.models.normalizing_flow import NormalizingFlow
    from ise.models.deep_ensemble import DeepEnsemble

    nf = NormalizingFlow(input_size=83, output_size=1, num_flow_transforms=5)
    de = DeepEnsemble(input_size=83, output_size=1, num_ensemble_members=10)
    model = ISEFlow(de, nf)
    model.fit(X_train, y_train, nf_epochs=500, de_epochs=200, X_val=X_val, y_val=y_val)
    model.save("my_model/")

Uncertainty decomposition::

    predictions, uncertainties = model.predict(X)
    # uncertainties = {"total": ..., "epistemic": ..., "aleatoric": ...}
    # total = epistemic + aleatoric  (scalar sum per timestep)

ISEFlow_AIS / ISEFlow_GrIS (pretrained)
----------------------------------------
Convenience subclasses that load bundled pretrained weights and expose a
simplified ``predict(inputs)`` interface::

    from ise.models.iseflow import ISEFlow_AIS
    from ise.data.inputs import ISEFlowAISInputs

    model = ISEFlow_AIS(version="v1.1.0")   # loads pretrained weights from package
    inputs = ISEFlowAISInputs(...)           # or ISEFlowAISInputs.from_absolute_forcings(...)
    predictions, uncertainties = model.predict(inputs)
    # predictions: numpy array shape (86, 1), SLE in mm, years 2015-2100

Supported versions
------------------
- ``v1.0.0``: AIS only; includes ``mrro_anomaly`` as a forcing variable.
- ``v1.1.0`` (default): AIS + GrIS; ``mrro_anomaly`` removed from AIS inputs.

Output smoothing
----------------
Both ``ISEFlow.predict()`` and ``ISEFlow_AIS/GrIS.predict()`` accept a
``smoothing_window`` argument.  When ``> 0``, a uniform moving-average filter
of that width is applied *after* inverse-scaling so the smoothing acts on
physical SLE values rather than scaled outputs.  Projection boundaries are
respected (no mixing between runs).

Deprecated classes
------------------
``ISEFlow_AIS_DE_v1_0_0``, ``ISEFlow_GrIS_DE_v1_0_0``,
``ISEFlow_AIS_NF_v1_0_0``, ``ISEFlow_GrIS_NF_v1_0_0`` are kept for loading
old v1.0.0 checkpoints only.  Use ``ISEFlow_AIS`` / ``ISEFlow_GrIS`` instead.
"""

import json
import os
import pickle
import shutil
import warnings

import numpy as np
import pandas as pd
import torch
from scipy.ndimage import uniform_filter1d
from sklearn.exceptions import InconsistentVersionWarning
from torch import nn

from ise.data import feature_engineer as fe
from ise.data.inputs import ISEFlowAISInputs, ISEFlowGrISInputs
from ise.models.deep_ensemble import DeepEnsemble
from ise.models.lstm import LSTM
from ise.models.normalizing_flow import NormalizingFlow
from ise.models.pretrained import (
    ISEFLOW_LATEST_MODEL_VERSION,
    ISEFlow_AIS_v1_0_0_variables,
    ISEFlow_AIS_v1_1_0_variables,
    ISEFlow_GrIS_v1_0_0_variables,
    ISEFlow_GrIS_v1_1_0_variables,
    get_model_dir,
)
from ise.utils.functions import get_device, to_tensor



[docs]
class ISEFlow(torch.nn.Module):
    """
    ISEFlow is a hybrid ice sheet emulator that combines a deep ensemble model and a normalizing flow model.

    This class provides methods to train, predict, save, and load hybrid models for ice sheet emulation.
    It integrates a deep ensemble to capture epistemic uncertainties and a normalizing flow to model aleatoric uncertainties.

    Attributes:
        device (str): The computing device ('cuda' if available, else 'cpu').
        deep_ensemble (DeepEnsemble): The deep ensemble model for epistemic uncertainty.
        normalizing_flow (NormalizingFlow): The normalizing flow model for aleatoric uncertainty.
        trained (bool): Flag indicating whether the model has been trained.
        scaler_path (str or None): Path to the scaler used for output transformation.
    """

    def __init__(self, deep_ensemble, normalizing_flow):
        """
        Initializes the ISEFlow model with a deep ensemble and a normalizing flow.

        Args:
            deep_ensemble (DeepEnsemble): A deep ensemble model for epistemic uncertainty estimation.
            normalizing_flow (NormalizingFlow): A normalizing flow model for aleatoric uncertainty estimation.

        Raises:
            ValueError: If `deep_ensemble` is not an instance of DeepEnsemble.
            ValueError: If `normalizing_flow` is not an instance of NormalizingFlow.
        """

        super().__init__()

        self.device = get_device()
        self.to(self.device)

        if not isinstance(deep_ensemble, DeepEnsemble):
            raise ValueError("deep_ensemble must be a DeepEnsemble instance")
        if not isinstance(normalizing_flow, NormalizingFlow):
            raise ValueError("normalizing_flow must be a NormalizingFlow instance")

        self.deep_ensemble = deep_ensemble.to(self.device)
        self.normalizing_flow = normalizing_flow.to(self.device)
        self.trained = self.deep_ensemble.trained and self.normalizing_flow.trained
        self.scaler_path = None
        self.model_dir = getattr(normalizing_flow, "model_dir", None)


[docs]
    def fit(
        self,
        X,
        y,
        nf_epochs,
        de_epochs,
        batch_size=64,
        X_val=None,
        y_val=None,
        save_checkpoints=True,
        checkpoint_path="checkpoint_ensemble",
        early_stopping=True,
        sequence_length=5,
        patience=10,
        verbose=True,
    ):
        """
        Trains the hybrid emulator using the provided data.

        This method trains the normalizing flow model first, then uses its latent representations
        to train the deep ensemble model.

        Args:
            X (array-like): Input feature matrix.
            y (array-like): Target values.
            nf_epochs (int): Number of training epochs for the normalizing flow.
            de_epochs (int): Number of training epochs for the deep ensemble.
            batch_size (int, optional): Batch size for training. Defaults to 64.
            X_val (array-like, optional): Validation feature matrix. Defaults to None.
            y_val (array-like, optional): Validation target values. Defaults to None.
            save_checkpoints (bool, optional): Whether to save training checkpoints. Defaults to True.
            checkpoint_path (str, optional): Path prefix for saving model checkpoints. Defaults to 'checkpoint_ensemble'.
            early_stopping (bool, optional): Whether to use early stopping. Defaults to True.
            sequence_length (int, optional): Sequence length for recurrent architectures. Defaults to 5.
            patience (int, optional): Number of epochs with no improvement before stopping. Defaults to 10.
            verbose (bool, optional): Whether to print training progress. Defaults to True.

        Raises:
            Warning: If the model has already been trained.
        """

        if early_stopping is None:
            early_stopping = X_val is not None and y_val is not None

        X, y = to_tensor(X).to(self.device), to_tensor(y).to(self.device)

        if self.trained:
            warnings.warn("This model has already been trained. Training again.")

        # Train Normalizing Flow
        if not self.normalizing_flow.trained:
            print(
                f"\nTraining Normalizing Flow ({'Maximum ' if early_stopping else ''}{nf_epochs} epochs):"
            )
            self.normalizing_flow.fit(
                X,
                y,
                epochs=nf_epochs,
                batch_size=batch_size,
                save_checkpoints=save_checkpoints,
                checkpoint_path=f"{checkpoint_path}_nf.pth",
                early_stopping=early_stopping,
                patience=patience,
                verbose=verbose,
            )

        # Latent representation
        z = self.normalizing_flow.get_latent(X).detach()
        X_latent = torch.cat((X, z), axis=1)

        X_val_latent = None
        if X_val is not None and y_val is not None:
            X_val, y_val = to_tensor(X_val).to(self.device), to_tensor(y_val).to(self.device)
            z_val = self.normalizing_flow.get_latent(X_val).detach()
            X_val_latent = torch.cat((X_val, z_val), axis=1)

        # Train Deep Ensemble
        if not self.deep_ensemble.trained:
            print(
                f"\nTraining Deep Ensemble ({'Maximum ' if early_stopping else ''}{de_epochs} epochs):"
            )

            self.deep_ensemble.fit(
                X_latent,
                y,
                X_val_latent,
                y_val,
                save_checkpoints,
                f"{checkpoint_path}_de",
                early_stopping,
                de_epochs,
                batch_size,
                sequence_length,
                patience,
                verbose,
            )

        self.trained = True



[docs]
    def forward(
        self,
        x,
    ):
        """Run a forward pass through the hybrid emulator.

        Args:
            x (array-like): Input feature matrix with shape ``(N, num_features)``.

        Returns:
            tuple: ``(prediction, uncertainties)`` where:

            - **prediction** (*numpy.ndarray*): Mean prediction across ensemble members.
            - **uncertainties** (*dict*): Keys ``'total'``, ``'epistemic'``, ``'aleatoric'``
              with numpy arrays giving per-row uncertainty in scaled (model) units.

        Warns:
            UserWarning: If the model has not been trained.
        """

        self.eval()
        x = to_tensor(x).to(self.device)
        if not self.trained:
            warnings.warn("This model has not been trained. Predictions may not be accurate.")
        z = self.normalizing_flow.get_latent(x).detach()
        X_latent = torch.cat((x, z), axis=1)
        prediction, epistemic = self.deep_ensemble(X_latent)
        aleatoric = self.normalizing_flow.aleatoric(x, 100)
        prediction = prediction.detach().cpu().numpy()
        epistemic = epistemic.detach().cpu().numpy()
        uncertainties = dict(
            total=aleatoric + epistemic,
            epistemic=epistemic,
            aleatoric=aleatoric,
        )
        return prediction, uncertainties



[docs]
    def predict(self, x, output_scaler=True, smoothing_window=0):
        """Predict SLE projections and uncertainties, applying inverse scaling and optional smoothing.

        Smoothing is applied to the final unscaled predictions and uncertainties so the
        physical SLE curve is what gets smoothed (rather than scaled values).

        Args:
            x (array-like): Input feature matrix with shape ``(N, num_features)``.
            output_scaler (bool or str, optional): If ``True`` (default), loads the
                scaler bundled with the pretrained model. If ``False``, returns
                un-rescaled predictions. If a string, loads the sklearn scaler at
                that path and uses it to inverse-transform the output.
            smoothing_window (int, optional): Width of a centered moving-average
                smoother applied to the unscaled predictions and uncertainties.
                ``0`` (default) disables smoothing.

        Returns:
            tuple: ``(unscaled_predictions, uncertainties)`` where:

            - **unscaled_predictions** (*numpy.ndarray*): Predictions in mm SLE.
            - **uncertainties** (*dict*): Keys ``'total'``, ``'epistemic'``, ``'aleatoric'``
              with numpy arrays in mm SLE.

        Warns:
            UserWarning: If no scaler is available; predictions and uncertainties are
                then returned in the model's scaled output space rather than mm SLE.
        """
        self.eval()

        # Handle scaler loading
        if output_scaler is True:
            output_scaler = os.path.join(self.model_dir, "scaler_y.pkl")
            with open(output_scaler, "rb") as f:
                with warnings.catch_warnings():
                    warnings.filterwarnings("ignore", category=InconsistentVersionWarning)
                    output_scaler = pickle.load(f)
        elif output_scaler is False and self.scaler_path is None:
            warnings.warn("No scaler path provided, uncertainties are not in units of SLE.")
            predictions, uncertainties = self.forward(x)

            # Apply smoothing to raw predictions and uncertainties if requested
            if smoothing_window > 0:
                predictions = smooth_projections(predictions, smoothing_window)
                for key in uncertainties:
                    uncertainties[key] = smooth_projections(uncertainties[key], smoothing_window)

            return predictions, uncertainties
        elif isinstance(output_scaler, str):
            self.scaler_path = output_scaler
            with open(self.scaler_path, "rb") as f:
                with warnings.catch_warnings():
                    warnings.filterwarnings("ignore", category=InconsistentVersionWarning)
                    output_scaler = pickle.load(f)

        # Get raw predictions and uncertainties (no smoothing yet)
        predictions, uncertainties = self.forward(x)

        # Inverse transform predictions first
        # The upper/lower-then-average pattern below is correct only for monotone scalers
        # (StandardScaler, MinMaxScaler, RobustScaler — all linear), where f(a±b) = f(a)±f'*b.
        unscaled_predictions = output_scaler.inverse_transform(predictions.reshape(-1, 1))

        # Calculate uncertainty bounds in scaled space
        bound_epistemic_upper = predictions + uncertainties["epistemic"]
        bound_epistemic_lower = predictions - uncertainties["epistemic"]
        bound_aleatoric_upper = predictions + uncertainties["aleatoric"]
        bound_aleatoric_lower = predictions - uncertainties["aleatoric"]

        # Inverse transform all bounds
        unscaled_bound_epistemic_upper = output_scaler.inverse_transform(
            bound_epistemic_upper.reshape(-1, 1)
        )
        unscaled_bound_epistemic_lower = output_scaler.inverse_transform(
            bound_epistemic_lower.reshape(-1, 1)
        )
        unscaled_bound_aleatoric_upper = output_scaler.inverse_transform(
            bound_aleatoric_upper.reshape(-1, 1)
        )
        unscaled_bound_aleatoric_lower = output_scaler.inverse_transform(
            bound_aleatoric_lower.reshape(-1, 1)
        )

        # Calculate unscaled uncertainties (symmetric around predictions)
        epistemic_upper = unscaled_bound_epistemic_upper - unscaled_predictions
        epistemic_lower = unscaled_predictions - unscaled_bound_epistemic_lower
        aleatoric_upper = unscaled_bound_aleatoric_upper - unscaled_predictions
        aleatoric_lower = unscaled_predictions - unscaled_bound_aleatoric_lower

        # Use average of upper and lower uncertainties for symmetry
        epistemic = (epistemic_upper + epistemic_lower) / 2
        aleatoric = (aleatoric_upper + aleatoric_lower) / 2

        # NOW apply smoothing to the final unscaled values
        if smoothing_window > 0:
            unscaled_predictions = smooth_projections(unscaled_predictions, smoothing_window)
            epistemic = smooth_projections(epistemic, smoothing_window)
            aleatoric = smooth_projections(aleatoric, smoothing_window)

        # Ensure uncertainties are non-negative
        epistemic = np.abs(epistemic)
        aleatoric = np.abs(aleatoric)

        uncertainties = dict(
            total=epistemic + aleatoric,
            epistemic=epistemic,
            aleatoric=aleatoric,
        )

        return unscaled_predictions, uncertainties



[docs]
    def save(self, save_dir, input_features=None, output_scaler_path=None):
        """
        Saves the trained model and related components to a specified directory.

        Args:
            save_dir (str): Directory where the model should be saved.
            input_features (list, optional): List of input feature names. Defaults to None.
            output_scaler_path (str, optional): Path to the output scaler. Defaults to None.

        Raises:
            ValueError: If the model has not been trained.
            ValueError: If `save_dir` is a file instead of a directory.
            ValueError: If `input_features` is not a list.
        """

        if not self.trained:
            raise ValueError("This model has not been trained yet. Train the model before saving.")
        if save_dir.endswith(".pth"):
            raise ValueError("save_dir must be a directory, not a file")
        os.makedirs(save_dir, exist_ok=True)

        self.deep_ensemble.save(os.path.join(save_dir, "deep_ensemble.pth"))
        self.normalizing_flow.save(os.path.join(save_dir, "normalizing_flow.pth"))

        if input_features is not None:
            if not isinstance(input_features, list):
                raise ValueError("input_features must be a list of feature names")
            with open(os.path.join(save_dir, "input_features.json"), "w") as f:
                json.dump(input_features, f, indent=4)

        if output_scaler_path is not None and output_scaler_path.endswith(".pkl"):
            self.scaler_path = output_scaler_path

        if self.scaler_path is not None:
            shutil.copy(self.scaler_path, os.path.join(save_dir, "scaler_y.pkl"))
            try:
                scaler_x_path = self.scaler_path.replace("scaler_y", "scaler_X")
                shutil.copy(scaler_x_path, os.path.join(save_dir, "scaler_X.pkl"))
            except (FileNotFoundError, OSError):
                warnings.warn(
                    f"Could not copy input scaler (scaler_X) to {save_dir}. "
                    "Inferred path did not exist. Pass a separate scaler_X path if needed.",
                    UserWarning,
                )



[docs]
    @staticmethod
    def load(
        model_dir=None,
        deep_ensemble_path=None,
        normalizing_flow_path=None,
    ):
        """Load a trained ISEFlow from saved deep ensemble and normalizing flow checkpoints.

        Provide either ``model_dir`` (which expects ``deep_ensemble.pth`` and
        ``normalizing_flow.pth`` files inside it) or both ``deep_ensemble_path``
        and ``normalizing_flow_path`` explicitly.

        Args:
            model_dir (str, optional): Directory containing the saved sub-model files.
            deep_ensemble_path (str, optional): Explicit path to the saved deep ensemble.
            normalizing_flow_path (str, optional): Explicit path to the saved normalizing flow.

        Returns:
            ISEFlow: The loaded model, with ``trained=True``.
        """

        if model_dir:
            deep_ensemble_path = os.path.join(model_dir, "deep_ensemble.pth")
            normalizing_flow_path = os.path.join(model_dir, "normalizing_flow.pth")

        deep_ensemble = DeepEnsemble.load(deep_ensemble_path)
        normalizing_flow = NormalizingFlow.load(normalizing_flow_path)
        model = ISEFlow(deep_ensemble, normalizing_flow)
        model.trained = True
        model.model_dir = model_dir

        return model





[docs]
class ISEFlow_AIS(ISEFlow):
    """Pretrained ISEFlow emulator for the Antarctic Ice Sheet (AIS).

    Loads pretrained weights for AIS (18 sectors, 8 km resolution) from HuggingFace Hub
    and exposes ``predict(inputs)`` where ``inputs`` is an ``ISEFlowAISInputs`` instance.

    .. note::
       ``version`` refers to the **ISEFlow model weights version**, not the ise-py
       package version. See ``ise.models.pretrained.ISEFLOW_LATEST_MODEL_VERSION``
       for the current default.

    Supported model versions:

    - ``v1.0.0``: includes ``mrro_anomaly`` as a forcing variable.
    - ``v1.1.0`` (default): ``mrro_anomaly`` removed; improved GrIS+AIS joint training.

    Args:
        version (str, optional): ISEFlow model weights version. One of ``'v1.0.0'`` or
            ``'v1.1.0'``. Defaults to the latest: ``'v1.1.0'``.

    Raises:
        NotImplementedError: If an unsupported version string is provided.
    """

    def __init__(self, version=ISEFLOW_LATEST_MODEL_VERSION):
        """Load pretrained AIS weights for the specified model version.

        Args:
            version (str, optional): ISEFlow model weights version.
                ``'v1.0.0'`` or ``'v1.1.0'``. Defaults to ``'v1.1.0'``.
        """
        self.ice_sheet = "AIS"
        self.version = version

        if version not in ("v1.0.0", "v1.1.0"):
            raise NotImplementedError(f"Version {version} not implemented. Try v1.0.0 or v1.1.0")

        model_dir = get_model_dir(version, "AIS")
        deep_ensemble = DeepEnsemble.load(os.path.join(model_dir, "deep_ensemble.pth"))
        normalizing_flow = NormalizingFlow.load(os.path.join(model_dir, "normalizing_flow.pth"))
        super().__init__(deep_ensemble, normalizing_flow)

        self.model_dir = model_dir
        self.trained = True


[docs]
    def process(
        self,
        inputs: ISEFlowAISInputs,
    ):
        """Preprocess ISEFlowAISInputs into the feature matrix expected by the model.

        Applies input scaling (using the version-specific ``scaler_X.pkl``), adds
        5-step lag variables, one-hot encodes ISM configuration columns, and pads
        any missing one-hot columns with ``False``.

        Args:
            inputs (ISEFlowAISInputs): Validated input dataclass for a single AIS sector.

        Returns:
            pandas.DataFrame: Feature matrix aligned to the column order expected by
            the pretrained model weights for the current version.

        Raises:
            ValueError: If ``mrro_anomaly`` is ``None`` when using v1.0.0.
        """

        if inputs.mrro_anomaly is None and self.version == "v1.0.0":
            raise ValueError("mrro_anomaly is required for version v1.0.0")

        mrro_means = np.array(
            [
                3.61493220e-08,
                2.77753815e-08,
                5.50841177e-08,
                4.17617754e-08,
                5.58558082e-08,
                5.74870861e-08,
                1.07017988e-07,
                7.72183085e-08,
                6.44275121e-08,
                2.10466987e-08,
                5.36071770e-08,
                8.32501757e-08,
                9.31873131e-08,
                7.84747761e-08,
                8.41751157e-08,
                8.56960829e-08,
                7.81743956e-08,
                9.74934761e-08,
                6.04155892e-08,
                8.31572351e-08,
                1.16800344e-07,
                9.96168899e-08,
                1.41262144e-07,
                8.76467771e-08,
                1.03335698e-07,
                1.23414214e-07,
                9.29483909e-08,
                1.95530928e-07,
                1.18321950e-07,
                1.68664275e-07,
                1.56460562e-07,
                1.40309916e-07,
                1.08267844e-07,
                1.85627395e-07,
                1.29400203e-07,
                1.98725020e-07,
                1.39994753e-07,
                1.86775688e-07,
                1.68388442e-07,
                2.04534154e-07,
                1.49715175e-07,
                1.50418319e-07,
                1.44444531e-07,
                1.67211070e-07,
                1.83698063e-07,
                2.05489898e-07,
                2.42246565e-07,
                1.98110423e-07,
                2.40505470e-07,
                2.37863389e-07,
                2.55668987e-07,
                2.93048624e-07,
                2.57849749e-07,
                2.72915753e-07,
                2.82135517e-07,
                2.27647208e-07,
                2.21859448e-07,
                2.07266200e-07,
                2.42241281e-07,
                2.55693726e-07,
                2.52039399e-07,
                2.82802604e-07,
                2.94193847e-07,
                3.00380753e-07,
                3.60152406e-07,
                3.47886784e-07,
                3.58344925e-07,
                3.84398045e-07,
                4.41053179e-07,
                3.84072892e-07,
                4.42520286e-07,
                4.30170222e-07,
                4.34444387e-07,
                4.77483307e-07,
                3.52802246e-07,
                4.96503280e-07,
                5.22078462e-07,
                4.78644041e-07,
                4.86755806e-07,
                5.04600526e-07,
                4.80814514e-07,
                5.38276914e-07,
                5.91539053e-07,
                5.84794672e-07,
                5.33792907e-07,
                5.37435986e-07,
            ]
        )

        data = inputs.to_df()
        dummy_columns = [
            "numerics",
            "stress_balance",
            "resolution",
            "init_method",
            "melt",
            "ice_front",
            "Ocean forcing",
            "Ocean sensitivity",
            "open_melt_param",
            "standard_melt_param",
            "Ice shelf fracture",
        ]

        if self.version == "v1.0.0":
            # v1.0.0 ordering: fill missing mrro -> add lags -> get_dummies -> reindex
            # to ISEFlow_AIS_v1_0_0_variables -> append `outlier=False` -> positional
            # scale (the v1.0.0 scaler was fit on 99 cols including `outlier`) -> drop
            # `outlier`. The v1.0.0 scaler has no feature_names_in_, so master's
            # name-based scale_data() can't be used here.
            # Years in `data` are in model encoding (1..86) per
            # ISEFlowAISInputs._check_inputs (calendar 2015..2100 → 1..86),
            # so the lookup map must be keyed 1..86, not 0..85.
            year_mean_map = {year: mean for year, mean in enumerate(mrro_means, start=1)}
            data["mrro_anomaly"] = data.apply(
                lambda row: (
                    year_mean_map[row["year"]]
                    if pd.isna(row["mrro_anomaly"])
                    else row["mrro_anomaly"]
                ),
                axis=1,
            )
            data = fe.add_lag_variables(data, lag=5, verbose=False)
            data = pd.get_dummies(data, columns=dummy_columns, dtype=bool)

            columns = ISEFlow_AIS_v1_0_0_variables
            for col in columns:
                if col not in data.columns:
                    data[col] = False
            data = data[columns]
            data = data.loc[:, ~data.columns.duplicated()]

            data["outlier"] = False
            with warnings.catch_warnings():
                warnings.simplefilter("ignore", InconsistentVersionWarning)
                with open(f"{self.model_dir}/scaler_X.pkl", "rb") as f:
                    scaler = pickle.load(f)
            scaled = scaler.transform(data.values.astype(float))
            data = pd.DataFrame(scaled, columns=list(data.columns), index=data.index)
            data = data.drop(columns=["outlier"])
            return data

        # v1.1.0 path (unchanged): scale -> lag -> dummies -> reindex
        data = fe.scale_data(data, scaler_path=f"{self.model_dir}/scaler_X.pkl")
        data = fe.add_lag_variables(data, lag=5, verbose=False)
        data = pd.get_dummies(data, columns=dummy_columns, dtype=bool)

        if self.version == "v1.1.0":
            columns = ISEFlow_AIS_v1_1_0_variables
        else:
            raise NotImplementedError(
                f"Version {self.version} not implemented. Use v1.0.0 or v1.1.0"
            )

        for col in columns:
            if col not in data.columns:
                data[col] = False

        data = data[columns]
        data = data.loc[:, ~data.columns.duplicated()]

        return data



[docs]
    def predict(  # type: ignore[override]
        self,
        inputs: ISEFlowAISInputs,
        smoothing_window: int = 0,
    ):
        """
        Predicts AIS sea level contribution using the pretrained ISEFlow_AIS model.

        Internally calls ``process()`` to scale, add lag variables, and one-hot
        encode the inputs before running the hybrid forward pass.

        Args:
            inputs (ISEFlowAISInputs): Validated input dataclass containing climate
                forcings and ISM configuration for a single sector.
            smoothing_window (int, optional): If > 0, applies a uniform moving-average
                smoother of this width to the output time series. Defaults to 0 (no
                smoothing).

        Returns:
            tuple: A tuple containing:

                - **predictions** (*numpy.ndarray*, shape ``(86, 1)``): Unscaled sea
                  level equivalent (SLE) projections in mm for years 2015-2100.
                - **uncertainties** (*dict*): Dictionary with keys:

                  - ``'total'``: total uncertainty (epistemic + aleatoric).
                  - ``'epistemic'``: uncertainty from ensemble disagreement.
                  - ``'aleatoric'``: uncertainty from normalizing-flow sampling.
        """

        data = self.process(
            inputs=inputs,
        )
        X = to_tensor(data).to(self.device)
        return super().predict(
            X, output_scaler=f"{self.model_dir}/scaler_y.pkl", smoothing_window=smoothing_window
        )



[docs]
    def test(
        self,
        X_test,
    ):
        """
        Tests the model on a test dataset.

        Args:
            X_test (array-like): Test feature matrix.

        Returns:
            tuple: A tuple containing:
                - unscaled_predictions (numpy.ndarray): Model predictions in the original scale.
                - uncertainties (dict): Dictionary with keys:
                    - 'total' (numpy.ndarray): Total uncertainty.
                    - 'epistemic' (numpy.ndarray): Epistemic uncertainty.
                    - 'aleatoric' (numpy.ndarray): Aleatoric uncertainty.
        """

        return super().predict(X_test, output_scaler=f"{self.model_dir}/scaler_y.pkl")





[docs]
class ISEFlow_GrIS(ISEFlow):
    """Pretrained ISEFlow emulator for the Greenland Ice Sheet (GrIS).

    Loads pretrained weights for GrIS (6 drainage basins, 5 km resolution) from
    HuggingFace Hub and exposes ``predict(inputs)`` where ``inputs`` is an
    ``ISEFlowGrISInputs`` instance.

    .. note::
       ``version`` refers to the **ISEFlow model weights version**, not the ise-py
       package version. See ``ise.models.pretrained.ISEFLOW_LATEST_MODEL_VERSION``
       for the current default.

    Supported model versions:

    - ``v1.0.0``: initial GrIS release.
    - ``v1.1.0`` (default): improved AIS+GrIS joint training.

    Args:
        version (str, optional): ISEFlow model weights version. One of ``'v1.0.0'`` or
            ``'v1.1.0'``. Defaults to the latest: ``'v1.1.0'``.

    Raises:
        NotImplementedError: If an unsupported version string is provided.
    """

    def __init__(self, version=ISEFLOW_LATEST_MODEL_VERSION):
        """Load pretrained GrIS weights for the specified model version.

        Args:
            version (str, optional): ISEFlow model weights version.
                ``'v1.0.0'`` or ``'v1.1.0'``. Defaults to ``'v1.1.0'``.
        """
        self.ice_sheet = "GrIS"
        self.version = version

        if version not in ("v1.0.0", "v1.1.0"):
            raise NotImplementedError(f"Version {version} not implemented. Try v1.0.0 or v1.1.0")

        model_dir = get_model_dir(version, "GrIS")
        deep_ensemble = DeepEnsemble.load(os.path.join(model_dir, "deep_ensemble.pth"))
        normalizing_flow = NormalizingFlow.load(os.path.join(model_dir, "normalizing_flow.pth"))
        super().__init__(deep_ensemble, normalizing_flow)

        self.model_dir = model_dir
        self.trained = True


[docs]
    def process(
        self,
        inputs: ISEFlowGrISInputs,
    ):
        """Preprocess ISEFlowGrISInputs into the feature matrix expected by the model.

        Applies input scaling (using the version-specific ``scaler_X.pkl``), adds
        5-step lag variables, one-hot encodes ISM configuration columns, and pads
        any missing one-hot columns with ``False``.

        Args:
            inputs (ISEFlowGrISInputs): Validated input dataclass for a single GrIS basin.

        Returns:
            pandas.DataFrame: Feature matrix aligned to the column order expected by
            the pretrained model weights for the current version.
        """

        data = inputs.to_df()
        dummy_columns = [
            "numerics",
            "ice_flow",
            "initialization",
            "initial_smb",
            "velocity",
            "bed",
            "surface_thickness",
            "ghf",
            "res_min",
            "res_max",
            "Ocean forcing",
            "Ocean sensitivity",
            "Ice shelf fracture",
        ]

        if self.version == "v1.0.0":
            # v1.0.0 ordering: add lags -> get_dummies -> reindex to
            # ISEFlow_GrIS_v1_0_0_variables -> append `outlier=False` -> positional
            # scale (the v1.0.0 scaler has 91 cols incl. `outlier` and no
            # feature_names_in_) -> drop `outlier`.
            data = fe.add_lag_variables(data, lag=5, verbose=False)
            data = pd.get_dummies(data, columns=dummy_columns, dtype=bool)

            columns = ISEFlow_GrIS_v1_0_0_variables
            for col in columns:
                if col not in data.columns:
                    data[col] = False
            data = data[columns]
            data = data.loc[:, ~data.columns.duplicated()]

            data["outlier"] = False
            with warnings.catch_warnings():
                warnings.simplefilter("ignore", InconsistentVersionWarning)
                with open(f"{self.model_dir}/scaler_X.pkl", "rb") as f:
                    scaler = pickle.load(f)
            scaled = scaler.transform(data.values.astype(float))
            data = pd.DataFrame(scaled, columns=list(data.columns), index=data.index)
            data = data.drop(columns=["outlier"])
            return data

        # v1.1.0 path (unchanged): scale -> lag -> dummies -> reindex
        data = fe.scale_data(data, scaler_path=f"{self.model_dir}/scaler_X.pkl")
        data = fe.add_lag_variables(data, lag=5, verbose=False)
        data = pd.get_dummies(data, columns=dummy_columns, dtype=bool)

        if self.version == "v1.1.0":
            columns = ISEFlow_GrIS_v1_1_0_variables
        else:
            raise NotImplementedError(
                f"Version {self.version} not implemented. Use v1.0.0 or v1.1.0"
            )

        for col in columns:
            if col not in data.columns:
                data[col] = False

        data = data[columns]
        data = data.loc[:, ~data.columns.duplicated()]
        # print(data.head())
        return data



[docs]
    def predict(  # type: ignore[override]
        self,
        inputs: ISEFlowGrISInputs,
        smoothing_window: int = 0,
    ):
        """Predicts GrIS sea level contribution using the pretrained ISEFlow_GrIS model.

        Internally calls ``process()`` to scale, add lag variables, and one-hot
        encode the inputs before running the hybrid forward pass.

        Args:
            inputs (ISEFlowGrISInputs): Validated input dataclass containing climate
                forcings and ISM configuration for a single GrIS drainage basin.
            smoothing_window (int, optional): If > 0, applies a uniform moving-average
                smoother of this width to the output time series. Defaults to 0 (no
                smoothing).

        Returns:
            tuple: A tuple containing:

                - **predictions** (*numpy.ndarray*, shape ``(86, 1)``): Unscaled sea
                  level equivalent (SLE) projections in mm for years 2015-2100.
                - **uncertainties** (*dict*): Dictionary with keys:

                  - ``'total'``: total uncertainty (epistemic + aleatoric).
                  - ``'epistemic'``: uncertainty from ensemble disagreement.
                  - ``'aleatoric'``: uncertainty from normalizing-flow sampling.
        """
        data = self.process(
            inputs=inputs,
        )
        X = to_tensor(data).to(self.device)
        return super().predict(
            X, output_scaler=f"{self.model_dir}/scaler_y.pkl", smoothing_window=smoothing_window
        )



[docs]
    def test(
        self,
        X_test,
    ):
        """
        Tests the model on a test dataset.

        Args:
            X_test (array-like): Test feature matrix.

        Returns:
            tuple: A tuple containing:
                - unscaled_predictions (numpy.ndarray): Model predictions in the original scale.
                - uncertainties (dict): Dictionary with keys:
                    - 'total' (numpy.ndarray): Total uncertainty.
                    - 'epistemic' (numpy.ndarray): Epistemic uncertainty.
                    - 'aleatoric' (numpy.ndarray): Aleatoric uncertainty.
        """

        return super().predict(X_test, output_scaler=f"{self.model_dir}/scaler_y.pkl")





[docs]
class ISEFlow_AIS_DE_v1_0_0(DeepEnsemble):
    """
    Deprecated AIS deep ensemble (v1.0.0). Use ``ISEFlow_AIS`` instead.

    This hard-coded 10-member LSTM ensemble was used in ISEFlow v1.0.0 for AIS
    emulation (input_size=99, includes ``mrro_anomaly``).  It is kept for
    backward compatibility with saved v1.0.0 checkpoints only.

    .. deprecated::
        Use ``ISEFlow_AIS(version='v1.0.0')`` or ``ISEFlow_AIS(version='v1.1.0')``
        instead.  This class will be removed in a future release.

    Attributes:
        input_size (int): 99 (includes mrro_anomaly).
        output_size (int): 1.
    """

    def __init__(
        self,
    ):
        warnings.warn(
            "ISEFlow_AIS_DE_v1_0_0 is deprecated and will be removed in future versions. Please use ISEFlow_AIS instead.",
            DeprecationWarning,
        )

        self.input_size = 99
        self.output_size = 1
        iseflow_ais_ensemble = [
            LSTM(1, 128, 99, 1, nn.HuberLoss()),
            LSTM(1, 512, 99, 1, nn.HuberLoss()),
            LSTM(1, 512, 99, 1, nn.HuberLoss()),
            LSTM(2, 128, 99, 1, nn.HuberLoss()),
            LSTM(1, 256, 99, 1, nn.L1Loss()),
            LSTM(1, 512, 99, 1, nn.MSELoss()),
            LSTM(2, 128, 99, 1, nn.MSELoss()),
            LSTM(2, 512, 99, 1, nn.MSELoss()),
            LSTM(1, 256, 99, 1, nn.L1Loss()),
            LSTM(1, 64, 99, 1, nn.HuberLoss()),
        ]
        super().__init__(
            ensemble_members=iseflow_ais_ensemble,
            input_size=self.input_size,
            output_size=self.output_size,
            output_sequence_length=86,
        )




[docs]
class ISEFlow_GrIS_DE_v1_0_0(DeepEnsemble):
    """
    Deprecated GrIS deep ensemble (v1.0.0). Use ``ISEFlow_GrIS`` instead.

    This hard-coded 10-member LSTM ensemble was used in ISEFlow v1.0.0 for GrIS
    emulation (input_size=90).  It is kept for backward compatibility with saved
    v1.0.0 checkpoints only.

    .. deprecated::
        Use ``ISEFlow_GrIS(version='v1.0.0')`` or ``ISEFlow_GrIS(version='v1.1.0')``
        instead.  This class will be removed in a future release.

    Attributes:
        input_size (int): 90.
        output_size (int): 1.
    """

    def __init__(
        self,
    ):
        warnings.warn(
            "ISEFlow_GrIS_DE_v1_0_0 is deprecated and will be removed in future versions. Please use ISEFlow_GrIS instead.",
            DeprecationWarning,
        )
        self.input_size = 90
        self.output_size = 1
        iseflow_gris_ensemble = [
            LSTM(2, 128, 99, 1, nn.HuberLoss()),
            LSTM(2, 256, 99, 1, nn.MSELoss()),
            LSTM(2, 128, 99, 1, nn.HuberLoss()),
            LSTM(2, 128, 99, 1, nn.MSELoss()),
            LSTM(2, 256, 99, 1, nn.HuberLoss()),
            LSTM(1, 256, 99, 1, nn.L1Loss()),
            LSTM(1, 128, 99, 1, nn.HuberLoss()),
            LSTM(2, 64, 99, 1, nn.MSELoss()),
            LSTM(2, 256, 99, 1, nn.HuberLoss()),
            LSTM(1, 256, 99, 1, nn.L1Loss()),
        ]
        super().__init__(
            ensemble_members=iseflow_gris_ensemble,
            input_size=self.input_size,
            output_size=self.output_size,
            output_sequence_length=86,
        )




[docs]
class ISEFlow_AIS_NF_v1_0_0(NormalizingFlow):
    """
    Deprecated AIS normalizing flow (v1.0.0). Use ``ISEFlow_AIS`` instead.

    This pre-configured NormalizingFlow was used in ISEFlow v1.0.0 for AIS
    aleatoric uncertainty estimation.

    .. deprecated::
        Use ``ISEFlow_AIS(version='v1.0.0')`` or ``ISEFlow_AIS(version='v1.1.0')``
        instead.  This class will be removed in a future release.
    """

    def __init__(self, version="1.0.0"):
        """
        Initialize with AIS-specific defaults (input_size=99 for v1.0.0, 93 otherwise).
        """
        warnings.warn(
            "ISEFlow_AIS_NF_v1_0_0 is deprecated and will be removed in future versions. Please use ISEFlow_AIS instead.",
            DeprecationWarning,
        )

        self.input_size = 99 if version == "v1.0.0" else 93
        self.output_size = 1
        self.num_flow_transforms = 5
        super().__init__(
            input_size=self.input_size,
            output_size=self.output_size,
            num_flow_transforms=self.num_flow_transforms,
        )




[docs]
class ISEFlow_GrIS_NF_v1_0_0(NormalizingFlow):
    """
    Deprecated GrIS normalizing flow (v1.0.0). Use ``ISEFlow_GrIS`` instead.

    This pre-configured NormalizingFlow was used in ISEFlow v1.0.0 for GrIS
    aleatoric uncertainty estimation (input_size=90).

    .. deprecated::
        Use ``ISEFlow_GrIS(version='v1.0.0')`` or ``ISEFlow_GrIS(version='v1.1.0')``
        instead.  This class will be removed in a future release.
    """

    def __init__(
        self,
    ):
        """Initialize with GrIS-specific defaults (input_size=90, 5 flow transforms)."""
        warnings.warn(
            "ISEFlow_GrIS_NF_v1_0_0 is deprecated and will be removed in future versions. Please use ISEFlow_GrIS instead.",
            DeprecationWarning,
        )
        self.input_size = 90
        self.output_size = 1
        self.num_flow_transforms = 5
        super().__init__(
            input_size=self.input_size,
            output_size=self.output_size,
            num_flow_transforms=self.num_flow_transforms,
        )




[docs]
def smooth_projections(data, window_size, projection_length=86):
    """
    Apply smoothing to projections while respecting projection boundaries.
    Uses scipy's uniform_filter1d for more effective smoothing.

    Args:
        data (np.ndarray): Array of shape (n_samples,) or (n_samples, 1) containing values to smooth
        window_size (int): Size of the smoothing window
        projection_length (int): Length of each projection segment (default: 86 years)

    Returns:
        np.ndarray: Smoothed data with same shape as input
    """
    if window_size <= 0 or window_size == 1:
        return data

    # Ensure window_size is odd for symmetric smoothing
    if window_size % 2 == 0:
        window_size += 1

    # Handle both 1D and 2D arrays
    original_shape = data.shape
    data_was_1d = False
    if data.ndim == 1:
        data = data.reshape(-1, 1)
        data_was_1d = True

    smoothed_data = np.zeros_like(data)
    n_samples = data.shape[0]

    # Calculate number of complete projections
    n_complete_projections = n_samples // projection_length

    # Process each projection separately to avoid boundary mixing
    for proj_idx in range(n_complete_projections):
        start_idx = proj_idx * projection_length
        end_idx = (proj_idx + 1) * projection_length

        # Extract current projection segment
        projection_segment = data[start_idx:end_idx, :]

        # Apply uniform filter for each column
        for col in range(data.shape[1]):
            # Use mode='nearest' at boundaries to avoid edge effects
            smoothed_segment = uniform_filter1d(
                projection_segment[:, col], size=window_size, mode="nearest"
            )
            smoothed_data[start_idx:end_idx, col] = smoothed_segment

    # Handle any remaining samples that don't form a complete projection
    if n_samples % projection_length != 0:
        start_idx = n_complete_projections * projection_length
        remaining_segment = data[start_idx:, :]

        for col in range(data.shape[1]):
            smoothed_segment = uniform_filter1d(
                remaining_segment[:, col],
                size=min(window_size, len(remaining_segment)),
                mode="nearest",
            )
            smoothed_data[start_idx:, col] = smoothed_segment

    # Restore original shape
    if data_was_1d:
        smoothed_data = smoothed_data.flatten()

    return smoothed_data