Source code for fusilli.fusionmodels.base_model

"""
Base lightning module for all fusion models and parent class for all fusion models.
"""

from typing import Any
import lightning.pytorch as pl
import torch
from torch import nn
from torch.nn import functional as F

from fusilli.utils.metrics_utils import MetricsCalculator



[docs]
class BaseModel(pl.LightningModule):
    """Base pytorch lightning model for all fusion models.

    This class takes the specific fusion model as an input and provides the training,
    validation and prediction steps. The loss functions, metrics and output activation
    functions are defined here and selected through the ``prediction_task`` attribute of
    the wrapped fusion model.

    Attributes
    ----------
    model : class
        Fusion model. It is called on the input data in the forward pass and its
        ``prediction_task`` and ``fusion_type`` attributes are read by this class.
    MetricsCalculator : MetricsCalculator
        Metrics helper constructed with this module; the metric functions are looked up on it.
    multiclass_dimensions : int
        Number of classes for multiclass prediction. Taken from the model when its prediction
        task is "multiclass"; otherwise set to 3 so that the metrics dictionary can be built.
    metrics : dict
        Dictionary of metrics, at least two. Key is the name and value is the function from MetricsCalculator.
    metrics_list : list
        List of strings of names of metrics to use for model evaluation. Default None. If None, the metrics will be
        automatically selected based on the prediction task (AUROC, accuracy for binary/multiclass, R2 and MAE for
        regression).
    metric_names_list : list
        Names (keys) of the entries in ``metrics``.
    train_mask : tensor
        Mask for training data, used for the graph fusion methods instead of train/val split.
        Indicates which nodes are training nodes. Set to None by the constructor when the
        model has no ``train_mask`` attribute.
    val_mask : tensor
        Mask for validation data - used for the graph fusion methods instead of train/val split.
        Indicates which nodes are validation nodes. Set to None by the constructor when the
        model has no ``train_mask`` attribute.
    loss_functions : dict
        Dictionary of loss functions, one for each prediction type.
    output_activation_functions : dict
        Dictionary of output activation functions, one for each prediction type.
    batch_val_reals : list
        List of validation reals for each batch. Stored for later concatenation with rest of
        batches and access by Plotter class for plotting.
    batch_val_preds : list
        List of validation preds for each batch. Stored for later concatenation with rest of
        batches and access by Plotter class for plotting.
    batch_val_logits : list
        List of validation logits for each batch. Stored for later concatenation with rest of
        batches and access by Plotter class for plotting.
    batch_train_reals : list
        List of training reals for each batch. Stored for later concatenation with rest of batches
        and access by Plotter class for plotting.
    batch_train_preds : list
        List of training preds for each batch. Stored for later concatenation with rest of batches
        and access by Plotter class for plotting.
    batch_train_logits : list
        List of training logits for each batch. Emptied at the end of every validation epoch.
    val_reals : tensor
        Concatenated validation reals for all batches. Accessed by Plotter class for plotting.
    val_preds : tensor
        Concatenated validation preds for all batches. Accessed by Plotter class for plotting.
    val_logits : tensor
        Concatenated validation logits for all batches. Accessed by Plotter class for plotting.
    train_reals : tensor
        Concatenated training reals for all batches. Accessed by Plotter class for plotting.
    train_preds : tensor
        Concatenated training preds for all batches. Accessed by Plotter class for plotting.
    """


[docs]
    def __init__(self, model, metrics_list=None):
        """
        Wrap a fusion model and prepare losses, activations, metrics and result buffers.

        Parameters
        ----------
        model : class
            Fusion model to wrap. Its ``prediction_task`` attribute must be one of
            "binary", "multiclass" or "regression".
        metrics_list : list or None
            List of metrics to use for model evaluation. Default None.
            If None, the metrics will be automatically selected based on the prediction task
            (AUROC, accuracy for binary/multiclass, R2 and MAE for regression).
            The first metric in the list will be used in the comparison evaluation figures to rank the models' performances.
            Length must be 2 or more.

        Raises
        ------
        ValueError
            If the model's prediction task is not supported.

        Returns
        -------
        None
        """
        super().__init__()
        self.model = model

        # The calculator needs this module, and set_metrics needs the calculator.
        self.MetricsCalculator = MetricsCalculator(self)
        self.metrics_list = metrics_list
        self.set_metrics(metrics_list=metrics_list)

        # 3 is only a placeholder so the metrics dict can be built for non-multiclass tasks
        self.multiclass_dimensions = (
            model.multiclass_dimensions
            if self.model.prediction_task == "multiclass"
            else 3
        )

        if not hasattr(model, "subspace_method"):
            self.model.subspace_method = None

        # Models without a train mask get explicit None masks on this module.
        if not hasattr(model, "train_mask"):
            self.train_mask = None
            self.val_mask = None

        def binary_loss(logits, y):
            # binary_cross_entropy_with_logits applies a sigmoid internally.
            # NOTE(review): confirm the wrapped model emits raw logits rather than probabilities.
            return F.binary_cross_entropy_with_logits(logits, y.float())

        def multiclass_loss(logits, y):
            return F.cross_entropy(self.safe_squeeze(logits), self.safe_squeeze(y))

        self.loss_functions = {
            "binary": binary_loss,
            "multiclass": multiclass_loss,
            "regression": F.mse_loss,
        }

        def multiclass_prediction(x):
            return torch.argmax(F.softmax(x, dim=-1), dim=-1)

        def identity(x):
            return x

        # NOTE(review): torch.round only gives 0/1 labels if the model output is already
        # a probability - confirm against the model's final layer.
        self.output_activation_functions = {
            "binary": torch.round,
            "multiclass": multiclass_prediction,
            "regression": identity,
        }

        supported_tasks = ("binary", "multiclass", "regression")
        if self.model.prediction_task not in supported_tasks:
            raise ValueError(f"Unsupported prediction_task: {self.model.prediction_task}")

        self.metric_names_list = list(self.metrics.keys())

        # Per-batch buffers, filled by the training/validation steps
        self.batch_val_reals = []
        self.batch_val_preds = []
        self.batch_val_logits = []
        self.batch_train_reals = []
        self.batch_train_preds = []
        self.batch_train_logits = []

        # Concatenated results, filled at the end of each validation epoch
        self.val_reals = None
        self.val_preds = None
        self.val_logits = None
        self.train_reals = None
        self.train_preds = None



[docs]
    @staticmethod
    def safe_squeeze(tensor):
        """
        Squeeze tensor if it is not 1D.

        Parameters
        ----------
        tensor : tensor
            Tensor to be squeezed.

        Returns
        -------
        tensor
            Squeezed tensor.
        """
        # Check if the tensor is 1D, in which case, no squeezing is needed
        if len(tensor.shape) == 1:
            return tensor
        # Otherwise, remove the first dimension
        else:
            return tensor.squeeze(dim=0)



[docs]
    def set_metrics(self, metrics_list):
        """
        Set what metrics will be used to log and plot.
        If no metrics are passed, then the default metrics for the prediction task will be used.

        ``self.metrics`` is only replaced once the whole request has been validated, so a
        failed call leaves any previously configured metrics untouched.

        Parameters
        ----------
        metrics_list : list or None
            List of metrics to use for model evaluation. Default None.
            If None, the metrics will be automatically selected based on the prediction task
            (AUROC, accuracy for binary/multiclass, R2 and MAE for regression).
            The first metric in the list will be used in the comparison evaluation figures to rank the models' performances.
            Length must be 2 or more. Names are matched case-insensitively against the
            callables of the metrics calculator, but stored under the name as given.

        Raises
        ------
        ValueError
            If the list has fewer than two entries, if a metric name is not supported, or
            if no list is given and the model's prediction task has no default metrics.
        """
        calculator = self.MetricsCalculator

        # No list given: fall back to the defaults for the prediction task
        if metrics_list is None:
            task = self.model.prediction_task
            if task in ("binary", "multiclass"):
                self.metrics = {"AUROC": calculator.auroc,
                                "Accuracy": calculator.accuracy}
            elif task == "regression":
                self.metrics = {"R2": calculator.r2,
                                "MAE": calculator.mae}
            else:
                # Previously this fell through silently and left self.metrics unset/stale.
                raise ValueError(f"Unsupported prediction_task: {task}")
            return

        if len(metrics_list) < 2:
            raise ValueError("Length of metrics list must be 2 or more.")

        # Public callables of the calculator; computed once rather than once per metric
        supported_metrics = [
            name for name in dir(calculator)
            if callable(getattr(calculator, name)) and not name.startswith("__")
        ]

        selected = {}
        for metric_string in metrics_list:
            lookup_name = metric_string.lower()
            if lookup_name not in supported_metrics:
                raise ValueError(f"Unsupported metric: {metric_string}. Please choose from: {supported_metrics}")
            selected[metric_string] = getattr(calculator, lookup_name)

        self.metrics = selected



[docs]
    def get_data_from_batch(self, batch):
        """
        Split a batch into model input and labels.

        Parameters
        ----------
        batch : tensor
            Batch of data. For graph fusion models an object exposing ``x``, ``edge_index``,
            ``edge_attr`` and ``y``; otherwise a sequence of two items (input, labels) or
            three items (input 1, input 2, labels).

        Returns
        -------
        x : tensor
            Input data. A 3-tuple for graph models, a 2-tuple for three-item batches and
            the single input item for two-item batches.
        y : tensor
            Labels.

        Raises
        ------
        ValueError
            If a non-graph batch does not contain two or three items.
        """
        if self.model.fusion_type == "graph":
            graph_inputs = (batch.x, batch.edge_index, batch.edge_attr)
            return graph_inputs, batch.y

        n_items = len(batch)

        if n_items == 2:
            single_input, labels = batch
            return single_input, labels

        if n_items == 3:
            first_input, second_input, labels = batch
            return (first_input, second_input), labels

        raise ValueError(
            (
                "Batch size is not 2 (preds and labels) or 3 (2 pred data types and labels) "
                "modalities long"
            )
        )



[docs]
    def get_model_outputs(self, x):
        """
        Run the fusion model and split its output into logits and reconstructions.

        Parameters
        ----------
        x : tensor
            Input data.

        Returns
        -------
        logits : tensor
            First model output, with dimension 1 squeezed when the output has more than
            one dimension (``squeeze`` only removes it if it has size 1).
        reconstructions : list
            Remaining model outputs (e.g. reconstructions returned by models with a custom
            loss function such as a subspace method). Empty if the model returned only logits.

        Note
        ----
        The forward output of the fusion model is expected to be [out,] or [out, reconstructions].
        A bare tensor is also accepted and treated as [out,]; without that, star-unpacking
        would iterate over the rows of the tensor and use the first row as the logits.
        """
        model_outputs = self.model(x)

        # Treat a bare tensor as a single-output model instead of unpacking its rows.
        if isinstance(model_outputs, torch.Tensor):
            model_outputs = (model_outputs,)

        logits, *reconstructions = model_outputs

        # 1D (or 0D) logits have no dimension 1 to squeeze; squeezing them would raise.
        if logits.dim() > 1:
            logits = logits.squeeze(dim=1)

        return logits, reconstructions



[docs]
    def get_model_outputs_and_loss(self, x, y, train=True):
        """
        Run the model, apply the task's output activation and compute the loss.

        Parameters
        ----------
        x : tensor
            Input data.
        y : tensor
            Labels.
        train : bool
            Whether the data is training data. Selects ``train_mask`` (True) or
            ``val_mask`` (False) when this module has a ``train_mask`` attribute.

        Returns
        -------
        loss : tensor
            Task loss, plus the model's custom loss when reconstructions are returned and
            ``model.custom_loss`` is not None.
        end_output : tensor
            Final output (activated logits), indexed by the selected mask.
        logits : tensor
            Logits, indexed by the selected mask.
        """
        task = self.model.prediction_task

        logits, reconstructions = self.get_model_outputs(x)
        end_output = self.output_activation_functions[task](logits)

        # Graph-based fusion selects train/validation nodes with masks instead of a data split.
        # When the masks are None, indexing with None adds a leading dimension of size 1.
        if hasattr(self, "train_mask"):
            mask = self.train_mask if train else self.val_mask
            logits = logits[mask]
            y = y[mask]
            end_output = end_output[mask]

        loss = self.loss_functions[task](logits, y)

        has_reconstructions = reconstructions != []
        if has_reconstructions and self.model.custom_loss is not None:
            # x[-1] bc img is always last
            loss += self.model.custom_loss(reconstructions[0], x[-1])

        return loss, end_output, logits



[docs]
    def training_step(self, batch, batch_idx):
        """
        Training step: compute and log the loss and metrics for one batch and store the
        labels, predictions and logits of the batch.

        Parameters
        ----------
        batch : tensor
            Batch of data.
        batch_idx : int
            Batch index.

        Returns
        -------
        loss : tensor
            Loss.
        """

        x, y = self.get_data_from_batch(batch)

        loss, end_output, logits = self.get_model_outputs_and_loss(x, y)

        # For a two-item batch x is the input tensor itself, so x[0] would be the first
        # sample and x[0].shape[0] a feature dimension rather than the batch size.
        batch_size = x.shape[0] if isinstance(x, torch.Tensor) else x[0].shape[0]

        self.log(
            "train_loss",
            loss,
            on_step=False,
            on_epoch=True,
            prog_bar=True,
            logger=True,
            batch_size=batch_size,
        )

        # Squeezed views are the same for every metric, so build them once.
        preds = self.safe_squeeze(end_output)
        squeezed_logits = self.safe_squeeze(logits)
        labels = self.safe_squeeze(y[self.train_mask])

        # if it's a single value, we can't calculate a metric
        if preds.shape[0] != 1 and squeezed_logits.shape[0] != 1:
            for metric_name, metric_func in self.metrics.items():
                train_step_metric = metric_func(
                    preds=preds,
                    labels=labels,
                    logits=squeezed_logits,
                )

                self.log(
                    metric_name + "_train",
                    train_step_metric,
                    logger=True,
                    on_epoch=True,
                    on_step=False,
                    batch_size=batch_size,
                )

        # Store real and predicted values for training
        self.batch_train_reals.append(labels.detach())
        self.batch_train_preds.append(end_output.detach())
        self.batch_train_logits.append(logits.detach())

        return loss



[docs]
    def validation_step(self, batch, batch_idx):
        """
        Validation step: compute and log the validation loss for one batch and store the
        labels, predictions and logits of the batch for the end-of-epoch metrics.

        Parameters
        ----------
        batch : tensor
            Batch of data.
        batch_idx : int
            Batch index.

        Returns
        -------
        None
        """
        x, y = self.get_data_from_batch(batch)

        loss, end_output, logits = self.get_model_outputs_and_loss(x, y, train=False)

        # For a two-item batch x is the input tensor itself, so x[0] would be the first
        # sample and x[0].shape[0] a feature dimension rather than the batch size.
        batch_size = x.shape[0] if isinstance(x, torch.Tensor) else x[0].shape[0]

        self.log(
            "val_loss",
            loss,
            on_step=False,
            on_epoch=True,
            prog_bar=True,
            logger=True,
            batch_size=batch_size,
        )

        # Store real and predicted values for later access
        self.batch_val_reals.append(self.safe_squeeze(y[self.val_mask]).detach())
        self.batch_val_preds.append(self.safe_squeeze(end_output).detach())
        self.batch_val_logits.append(self.safe_squeeze(logits).detach())



[docs]
    def on_validation_epoch_end(self):
        """
        Gets the final validation epoch outputs and metrics.

        When metrics are calculated at the validation step and logged with on_epoch=True,
        the batch metrics are averaged. However, some metrics don't average well (e.g. R2).
        Therefore the validation metrics are calculated here on the full validation set,
        using the per-batch values collected during the epoch. All per-batch buffers are
        emptied afterwards.

        Returns
        -------
        None
        """
        # Join the per-batch validation results into full-epoch tensors
        self.val_reals = torch.cat(self.batch_val_reals, dim=-1)
        self.val_preds = torch.cat(self.batch_val_preds, dim=-1)
        self.val_logits = torch.cat(self.batch_val_logits, dim=0)

        # Best effort for the training results: a RuntimeError from the concatenation
        # (e.g. graph-based fusion, where train/test doesn't work the same as normal)
        # is ignored and the previous values are kept.
        try:
            self.train_reals = torch.cat(self.batch_train_reals, dim=-1)
            self.train_preds = torch.cat(self.batch_train_preds, dim=-1)
        except RuntimeError:
            pass

        for name, compute_metric in self.metrics.items():
            metric_value = compute_metric(
                preds=self.safe_squeeze(self.val_preds),
                labels=self.safe_squeeze(self.val_reals),
                logits=self.safe_squeeze(self.val_logits),
            )
            metric_value = metric_value.to(self.device)

            self.log(
                name + "_val",
                metric_value,
                logger=True,
                on_epoch=True,
                batch_size=self.val_reals.shape[0],
            )

        # Fresh, independent lists for the next epoch
        for buffer_name in (
            "batch_val_reals",
            "batch_val_preds",
            "batch_val_logits",
            "batch_train_reals",
            "batch_train_preds",
            "batch_train_logits",
        ):
            setattr(self, buffer_name, [])



[docs]
    def predict_step(self, batch: Any, batch_idx: int, dataloader_idx: int = 0) -> Any:
        """
        Prediction step: run the model in eval mode on one batch.

        Parameters
        ----------
        batch : tensor
            Batch of data.
        batch_idx : int
            Batch index.
        dataloader_idx : int
            Dataloader index. Not used by this implementation.

        Returns
        -------
        end_output : tensor
            Final output, passed through ``safe_squeeze`` and detached.
        logits : tensor
            Logits, passed through ``safe_squeeze`` and detached.
        """
        self.model.eval()

        inputs, labels = self.get_data_from_batch(batch)

        # The loss is computed as part of the shared forward helper but not needed here.
        _, predictions, raw_logits = self.get_model_outputs_and_loss(
            inputs, labels, train=False
        )

        predictions = self.safe_squeeze(predictions).detach()
        raw_logits = self.safe_squeeze(raw_logits).detach()

        return predictions, raw_logits



[docs]
    def configure_optimizers(self):
        """
        Configure optimizers.

        Returns
        -------
        torch.optim.Adam
            Adam optimizer over all parameters of this module with a learning rate of 1e-3.
        """
        learning_rate = 1e-3
        return torch.optim.Adam(self.parameters(), lr=learning_rate)





[docs]
class ParentFusionModel:
    """
    Parent class for all fusion models.

    Stores the prediction task and data dimensions and offers ``set_*`` helpers that
    build standard layer stacks. The layer attributes listed below only exist after the
    corresponding ``set_*`` method has been called.

    Attributes
    ----------
    prediction_task : str
        Type of prediction to be made. Options: binary, multiclass, regression.
    mod1_dim : int
        Dimension of modality 1.
    mod2_dim : int
        Dimension of modality 2.
    img_dim : tuple
        Dimensions of image modality. If using 2D images, then the dimensions will be (x, y). If using 3D images, then
        the dimensions will be (x, y, z).
    multiclass_dimensions : int
        Number of classes for multiclass prediction. Only set when the prediction task is
        "multiclass".
    final_prediction: nn.Sequential
        Final prediction layers. Set by ``set_final_pred_layers``.
    mod1_layers : nn.ModuleDict
        Modality 1 layers. Set by ``set_mod1_layers``.
    mod2_layers : nn.ModuleDict
        Modality 2 layers. Set by ``set_mod2_layers``.
    img_layers : nn.ModuleDict
        Image layers. Set by ``set_img_layers``.
    fused_layers : nn.Sequential
        Fused layers. Set by ``set_fused_layers``.
    """


[docs]
    def __init__(self, prediction_task, data_dims, multiclass_dimensions):
        """
        Parameters
        ----------
        prediction_task : str
            Type of prediction to be made. Options: binary, multiclass, regression.
        data_dims : list
            List of data dimensions.
        multiclass_dimensions : int
            Number of classes for multiclass prediction.
        """
        super().__init__()
        self.prediction_task = prediction_task
        self.mod1_dim = data_dims[0]
        self.mod2_dim = data_dims[1]
        self.img_dim = data_dims[2]
        if self.prediction_task == "multiclass":
            self.multiclass_dimensions = multiclass_dimensions



[docs]
    def set_final_pred_layers(self, input_dim=64):
        """
        Sets final prediction layers.

        Parameters
        ----------
        input_dim : int
            Input dimension to final layers - may depend on fusion configuration.

        Returns
        -------
        None
        """
        # final predictions
        if self.prediction_task == "binary":
            self.final_prediction = nn.Sequential(nn.Linear(input_dim, 1), nn.Sigmoid())

        elif self.prediction_task == "multiclass":
            self.final_prediction = nn.Sequential(
                nn.Linear(input_dim, self.multiclass_dimensions)
            )

        elif self.prediction_task == "regression":
            self.final_prediction = nn.Sequential(nn.Linear(input_dim, 1))



[docs]
    def set_mod1_layers(self):
        """
        Sets layers for modality 1

        Returns
        -------
        None
        """
        self.mod1_layers = nn.ModuleDict(
            {
                "layer 1": nn.Sequential(
                    nn.Linear(self.mod1_dim, 32),
                    nn.ReLU(),
                ),
                "layer 2": nn.Sequential(
                    nn.Linear(32, 64),
                    nn.ReLU(),
                ),
                "layer 3": nn.Sequential(
                    nn.Linear(64, 128),
                    nn.ReLU(),
                ),
                "layer 4": nn.Sequential(
                    nn.Linear(128, 256),
                    nn.ReLU(),
                ),
                "layer 5": nn.Sequential(
                    nn.Linear(256, 256),
                    nn.ReLU(),
                ),
            }
        )



[docs]
    def set_mod2_layers(self):
        """
        Sets layers for modality 2

        Returns
        -------
        None
        """
        self.mod2_layers = nn.ModuleDict(
            {
                "layer 1": nn.Sequential(
                    nn.Linear(self.mod2_dim, 32),
                    nn.ReLU(),
                ),
                "layer 2": nn.Sequential(
                    nn.Linear(32, 64),
                    nn.ReLU(),
                ),
                "layer 3": nn.Sequential(
                    nn.Linear(64, 128),
                    nn.ReLU(),
                ),
                "layer 4": nn.Sequential(
                    nn.Linear(128, 256),
                    nn.ReLU(),
                ),
                "layer 5": nn.Sequential(
                    nn.Linear(256, 256),
                    nn.ReLU(),
                ),
            }
        )



[docs]
    def set_img_layers(self):
        """
        Sets layers for image modality. If using 2D images, then the layers will use Conv2D layers.
        If using 3D images, then the layers will use Conv3D layers.

        Returns
        -------
        None
        """

        if len(self.img_dim) == 2:  # 2D images
            self.img_layers = nn.ModuleDict(
                {
                    "layer 1": nn.Sequential(
                        nn.Conv2d(1, 32, kernel_size=(3, 3), padding=0),
                        nn.ReLU(),
                        nn.MaxPool2d((2, 2)),
                    ),
                    "layer 2": nn.Sequential(
                        nn.Conv2d(32, 64, kernel_size=(3, 3), padding=0),
                        nn.ReLU(),
                        nn.MaxPool2d((2, 2)),
                    ),
                    "layer 3": nn.Sequential(
                        nn.Conv2d(64, 128, kernel_size=(3, 3), padding=0),
                        nn.ReLU(),
                        nn.MaxPool2d((2, 2)),
                    ),
                    "layer 4": nn.Sequential(
                        nn.Conv2d(128, 256, kernel_size=(3, 3), padding=0),
                        nn.ReLU(),
                        nn.MaxPool2d((2, 2)),
                    ),
                    "layer 5": nn.Sequential(
                        nn.Conv2d(256, 256, kernel_size=(3, 3), padding=0),
                        nn.ReLU(),
                        nn.MaxPool2d((2, 2)),
                    ),
                }
            )

        elif len(self.img_dim) == 3:  # 3D images
            self.img_layers = nn.ModuleDict(
                {
                    "layer 1": nn.Sequential(
                        nn.Conv3d(1, 32, kernel_size=(3, 3, 3), padding=0),
                        nn.ReLU(),
                        nn.MaxPool3d((2, 2, 2)),
                    ),
                    "layer 2": nn.Sequential(
                        nn.Conv3d(32, 64, kernel_size=(3, 3, 3), padding=0),
                        nn.ReLU(),
                        nn.MaxPool3d((2, 2, 2)),
                    ),
                    "layer 3": nn.Sequential(
                        nn.Conv3d(64, 128, kernel_size=(3, 3, 3), padding=0),
                        nn.ReLU(),
                        nn.MaxPool3d((2, 2, 2)),
                    ),
                    "layer 4": nn.Sequential(
                        nn.Conv3d(128, 256, kernel_size=(3, 3, 3), padding=0),
                        nn.ReLU(),
                        nn.MaxPool3d((2, 2, 2)),
                    ),
                    "layer 5": nn.Sequential(
                        nn.Conv3d(256, 256, kernel_size=(3, 3, 3), padding=0),
                        nn.ReLU(),
                        nn.MaxPool3d((2, 2, 2)),
                    ),
                }
            )

        else:
            raise ValueError("Image dimensionality not supported")



[docs]
    def set_fused_layers(self, fused_dim):
        """
        Set layers for fused modality

        Parameters
        ----------
        fused_dim : int
            Dimension of fused modality: how many features are there after fusion?
            e.g. if we have 2 modalities with 64 features each, and the fusion method
            was concatenation, the fused_dim would be 128

        Returns
        -------
        None
        """
        self.fused_layers = nn.Sequential(
            nn.Linear(fused_dim, 256),
            nn.ReLU(),
            nn.Dropout(p=0.15),
            nn.Linear(256, 64),
            nn.ReLU(),
            nn.Dropout(p=0.15),
        )