Source code for alibi.models.pytorch.model

"""
This module tries to provide a class wrapper to mimic the TensorFlow API of `tensorflow.keras.Model`. It
is intended to simplify the training of a model through methods like `compile`, `fit` and `evaluate`, which
allow the user to define custom loss functions, optimizers and evaluation metrics, train a model and
evaluate it. Currently it is used internally to test the functionalities of the Pytorch backend. To be
discussed if the module will be exposed to the user in future versions.
"""

import torch
import torch.nn as nn
import torch.optim as optim
from torch.utils.data import DataLoader

from tqdm import tqdm
from typing import List, Dict, Callable, Union, Tuple, Optional
from alibi.models.pytorch.metrics import Metric, LossContainer


class Model(nn.Module):

    def __init__(self, **kwargs):
        super().__init__(**kwargs)
        self.device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
    def compile(self,
                optimizer: optim.Optimizer,
                loss: Union[Callable, List[Callable]],
                loss_weights: Optional[List[float]] = None,
                metrics: Optional[List[Metric]] = None):
        """
        Compiles a model by setting the optimizer, the loss functions, the loss weights and the metrics
        used to monitor the training of the model.

        Parameters
        ----------
        optimizer
            Optimizer to be used.
        loss
            Loss function to be used. Can be a list of loss functions, which are weighted and summed up
            to compute the total loss.
        loss_weights
            Weights corresponding to each loss function. Only used if the `loss` argument is a list.
        metrics
            Metrics used to monitor the training process.
        """
        self.optimizer = optimizer
        self.metrics = [] if (metrics is None) else metrics
        self.loss_weights = [] if (loss_weights is None) else loss_weights
        self.loss: Union[LossContainer, List[LossContainer]]

        if isinstance(loss, list):
            # check that the number of weights matches the number of partial losses
            if len(self.loss_weights) != len(loss):
                raise ValueError("The number of loss weights differs from the number of losses.")

            self.loss = []
            for i, partial_loss in enumerate(loss):
                self.loss.append(LossContainer(partial_loss, name=f"output_{i+1}_loss"))
        else:
            self.loss = LossContainer(loss, name="loss")
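    # A minimal sketch of compiling a two-headed model (the optimizer, losses and
    # weights below are illustrative assumptions, not part of this module):
    #
    #     model.compile(optimizer=optim.Adam(model.parameters(), lr=1e-3),
    #                   loss=[nn.CrossEntropyLoss(), nn.MSELoss()],
    #                   loss_weights=[1.0, 0.5])
    #
    # Each partial loss is tracked under the name `output_<i>_loss` and the total
    # loss is their weighted sum.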
    def validate_prediction_labels(self,
                                   y_pred: Union[torch.Tensor, List[torch.Tensor]],
                                   y_true: Union[torch.Tensor, List[torch.Tensor]]):
        """
        Validates the loss functions, loss weights, training labels and prediction labels.

        Parameters
        ----------
        y_pred
            Prediction labels.
        y_true
            True labels.
        """
        if isinstance(self.loss, list):
            # check that the prediction is a list
            if not isinstance(y_pred, list):
                raise ValueError("The prediction should be a list since a list of losses has been passed.")

            # check that the labels are a list
            if not isinstance(y_true, list):
                raise ValueError("The labels should be a list since a list of losses has been passed.")

            # check that the number of predictions matches the number of labels
            if len(y_true) != len(y_pred):
                raise ValueError("Number of predictions differs from the number of labels.")

            # check that the number of output heads matches the number of losses
            if len(y_pred) != len(self.loss):
                raise ValueError("Number of model's heads differs from the number of losses.")

            # TODO: remove this case since it is already handled in `compile`
            if len(self.loss_weights) != 0 and (len(self.loss_weights) != len(self.loss)):
                raise ValueError("Number of loss weights should be equal to the number of losses.")
        else:
            # check that the prediction is not a list
            if isinstance(y_pred, list):
                raise ValueError("The prediction is a list but should be a tensor since only one loss has been passed.")

            # check that the labels are not a list
            if isinstance(y_true, list):
                raise ValueError("The label is a list but should be a tensor since only one loss has been passed.")

        # check that the metrics and the predictions agree: multiple output heads
        # require a dictionary of metrics keyed by the output name
        if (len(self.metrics) > 0) and (not isinstance(self.metrics, dict)) and isinstance(y_pred, list):
            raise ValueError("Multiple model's heads require a dictionary of metrics.")
    def compute_loss(self,
                     y_pred: Union[torch.Tensor, List[torch.Tensor]],
                     y_true: Union[torch.Tensor, List[torch.Tensor]]) -> Tuple[torch.Tensor, Dict[str, float]]:
        """
        Computes the loss given the prediction labels and the true labels.

        Parameters
        ----------
        y_pred
            Prediction labels.
        y_true
            True labels.

        Returns
        -------
        A tuple consisting of the total loss, computed as a weighted sum of the individual losses, and a \
        dictionary of the individual losses used for logging.
        """
        # compute loss
        if isinstance(self.loss, list):
            assert isinstance(y_pred, list)
            assert isinstance(y_true, list)

            loss = torch.tensor(0.).to(self.device)  # necessary for mypy, otherwise use `type: ignore`
            results = dict()

            for i, partial_loss in enumerate(self.loss):
                weight = self.loss_weights[i] if len(self.loss_weights) else 1.
                loss += weight * partial_loss(y_pred[i], y_true[i])
                results.update({key: weight * val for key, val in partial_loss.result().items()})

            # compute total loss
            results.update({"loss": sum(results.values())})
        else:
            assert isinstance(y_pred, torch.Tensor)
            assert isinstance(y_true, torch.Tensor)
            loss = self.loss(y_pred, y_true)
            results = self.loss.result()

        return loss, results
    def compute_metrics(self,
                        y_pred: Union[torch.Tensor, List[torch.Tensor]],
                        y_true: Union[torch.Tensor, List[torch.Tensor]]) -> Dict[str, float]:
        """
        Computes the metrics given the prediction labels and the true labels.

        Parameters
        ----------
        y_pred
            Prediction labels.
        y_true
            True labels.

        Returns
        -------
        Dictionary of monitoring metrics.
        """
        results = dict()

        if isinstance(self.metrics, dict):
            for name in self.metrics:
                # metric names are expected to follow the `output_<i>_...` convention
                i = int(name.split("_")[1]) - 1
                self.metrics[name].compute_metric(y_pred=y_pred[i], y_true=y_true[i])

                # add the output prefix in front of the results
                result = {name + "_" + key: val for key, val in self.metrics[name].result().items()}
                results.update(result)
        else:
            # single output head
            assert isinstance(y_pred, torch.Tensor)
            assert isinstance(y_true, torch.Tensor)

            for metric in self.metrics:
                metric.compute_metric(y_pred=y_pred, y_true=y_true)
                results.update(metric.result())

        return results
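    # Note: although `compile` annotates `metrics` as a list, `validate_prediction_labels`
    # requires a dictionary of metrics for multi-headed models, keyed by the output name.
    # A sketch of such a dictionary (`AccuracyMetric` is a hypothetical `Metric`
    # subclass used for illustration):
    #
    #     model.metrics = {"output_1_accuracy": AccuracyMetric(),
    #                      "output_2_accuracy": AccuracyMetric()}
    #
    # `compute_metrics` parses the head index from the `output_<i>_...` key and
    # matches each metric to the corresponding prediction head.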
    def train_step(self, x: torch.Tensor, y: Union[torch.Tensor, List[torch.Tensor]]) -> Dict[str, float]:
        """
        Performs a train step.

        Parameters
        ----------
        x
            Input tensor.
        y
            Label tensor.

        Returns
        -------
        Dictionary of losses and metrics for the current batch.
        """
        # set the model to train mode
        self.train()

        # send tensors to device
        x = x.to(self.device)
        y_true: Union[torch.Tensor, List[torch.Tensor]] = \
            [y_i.to(self.device) for y_i in y] if isinstance(y, list) else y.to(self.device)

        # compute output
        y_pred: Union[torch.Tensor, List[torch.Tensor]] = self.forward(x)

        # validate predictions and labels
        self.validate_prediction_labels(y_pred=y_pred, y_true=y_true)

        # compute loss
        loss, results = self.compute_loss(y_pred=y_pred, y_true=y_true)

        # perform gradient update
        self.optimizer.zero_grad()
        loss.backward()
        self.optimizer.step()

        # update metrics
        metrics = self.compute_metrics(y_pred=y_pred, y_true=y_true)
        results.update(metrics)
        return results
    @torch.no_grad()
    def test_step(self, x: torch.Tensor, y: Union[torch.Tensor, List[torch.Tensor]]) -> Dict[str, float]:
        """
        Performs a test step.

        Parameters
        ----------
        x
            Input tensor.
        y
            Label tensor.

        Returns
        -------
        Dictionary of losses and metrics for the current batch.
        """
        # set the model to evaluation mode
        self.eval()

        # send tensors to device
        x = x.to(self.device)
        y_true: Union[torch.Tensor, List[torch.Tensor]] = \
            [y_i.to(self.device) for y_i in y] if isinstance(y, list) else y.to(self.device)

        # compute output
        y_pred: Union[torch.Tensor, List[torch.Tensor]] = self.forward(x)

        # validate predictions and labels
        self.validate_prediction_labels(y_pred=y_pred, y_true=y_true)

        # compute loss (no gradient update is performed)
        loss, results = self.compute_loss(y_pred=y_pred, y_true=y_true)

        # update metrics
        metrics = self.compute_metrics(y_pred=y_pred, y_true=y_true)
        results.update(metrics)
        return results
    def fit(self, trainloader: DataLoader, epochs: int) -> Dict[str, float]:
        """
        Fit method. Equivalent of a training loop.

        Parameters
        ----------
        trainloader
            Training data loader.
        epochs
            Number of epochs to train the model.

        Returns
        -------
        Final epoch monitoring metrics.
        """
        for epoch in range(epochs):
            print("Epoch %d/%d" % (epoch + 1, epochs))

            # reset losses and metrics at the beginning of each epoch
            self._reset_loss()
            self._reset_metrics()

            # perform train steps in batches
            for data in tqdm(trainloader):
                if len(data) < 2:
                    raise ValueError("An input and at least one label should be provided.")

                x = data[0]
                y = data[1] if len(data) == 2 else data[1:]
                metrics_vals = self.train_step(x, y)

            # print metrics
            print(Model._metrics_to_str(metrics_vals))

        return metrics_vals
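    # `fit` and `evaluate` unpack each batch as `(x, y)` for a single-headed model,
    # or `(x, y_1, ..., y_k)` for a multi-headed one, in which case the labels are
    # forwarded as the tuple `data[1:]`. A sketch of a matching loader for a
    # two-headed model (the tensors and shapes are illustrative assumptions):
    #
    #     from torch.utils.data import TensorDataset
    #
    #     dataset = TensorDataset(x, y_class, y_reg)  # one input, two label tensors
    #     trainloader = DataLoader(dataset, batch_size=32, shuffle=True)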
    def evaluate(self, testloader: DataLoader) -> Dict[str, float]:
        """
        Evaluation function. The function reports the evaluation metrics used to monitor the training loop.

        Parameters
        ----------
        testloader
            Test data loader.

        Returns
        -------
        Evaluation metrics.
        """
        self._reset_loss()
        self._reset_metrics()

        # perform test steps in batches
        for data in tqdm(testloader):
            if len(data) < 2:
                raise ValueError("An input and at least one label should be provided.")

            x = data[0]
            y = data[1] if len(data) == 2 else data[1:]
            metrics_vals = self.test_step(x, y)

        # log losses and metrics
        print(Model._metrics_to_str(metrics_vals))
        return metrics_vals
    @staticmethod
    def _metrics_to_str(metrics: Dict[str, float]) -> str:
        """
        Converts a dictionary of metrics into a string for logging purposes.

        Parameters
        ----------
        metrics
            Dictionary of metrics to be converted into a string.

        Returns
        -------
        String representation of the metrics.
        """
        str_losses = ''
        for key in metrics:
            str_losses += "%s: %.4f\t" % (key, metrics[key])
        return str_losses

    def _reset_loss(self):
        """
        Resets the losses. Called at the beginning of each epoch.
        """
        if isinstance(self.loss, list):
            for partial_loss in self.loss:
                partial_loss.reset()
        else:
            self.loss.reset()

    def _reset_metrics(self):
        """
        Resets the monitoring metrics. Called at the beginning of each epoch.
        """
        metrics = self.metrics.values() if isinstance(self.metrics, dict) else self.metrics
        for metric in metrics:
            metric.reset()
    def save_weights(self, path: str) -> None:
        """
        Saves the weights of the current model.
        """
        torch.save(self.state_dict(), path)
    def load_weights(self, path: str) -> None:
        """
        Loads the weights of the current model.
        """
        self.load_state_dict(torch.load(path))
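# A minimal end-to-end sketch for a single-headed subclass (`MyModel` and the
# random data below are illustrative assumptions, not part of this module):
#
#     from torch.utils.data import TensorDataset
#
#     class MyModel(Model):
#         def __init__(self):
#             super().__init__()
#             self.linear = nn.Linear(16, 2)
#
#         def forward(self, x):
#             return self.linear(x)
#
#     model = MyModel()
#     model.to(model.device)  # the wrapper moves batches, not parameters, to the device
#     model.compile(optimizer=optim.Adam(model.parameters(), lr=1e-3),
#                   loss=nn.CrossEntropyLoss())
#
#     x = torch.randn(128, 16)
#     y = torch.randint(0, 2, (128,))
#     loader = DataLoader(TensorDataset(x, y), batch_size=32)
#
#     model.fit(loader, epochs=5)
#     model.evaluate(loader)
#
#     model.save_weights("model.pt")
#     model.load_weights("model.pt")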