Module `model_interpreter.model_interpreter`

Expand source code

import torch                            # PyTorch to create and apply deep learning models
from torch.autograd import Variable     # Create optimizable PyTorch variables
import pandas as pd                     # Pandas to handle the data in dataframes
import numpy as np                      # NumPy to handle numeric and NaN operations
import shap                             # Module used for the calculation of approximate Shapley values
import warnings                         # Print warnings for bad practices
from tqdm.auto import tqdm              # tqdm allows to track code execution progress
import time                             # Calculate code execution time
import plotly                           # Plotly for interactive and pretty plots
import plotly.graph_objs as go
import plotly.offline as py
import colorlover as cl                 # Get colors from colorscales
from functools import partial           # Enables using functions with some fixed parameters
import data_utils as du                 # Data science and machine learning relevant methods

# Constants
POS_COLOR = 'rgba(255,13,87,1)'
NEG_COLOR = 'rgba(30,136,229,1)'

# Auxiliary hidden methods
def calc_instance_score(model, sequence_data, instance, ref_output, x_length,
                        occlusion_wgt=0.7, id_column=0, inst_column=1):
    '''Calculate the instance importance score for a given instance.

    Parameters
    ----------
    model : nn.Module
        Machine learning model which will be interpreted.
    sequence_data : torch.Tensor
        Data corresponding to the data sequence to which the current instance
        belongs to.
    instance : int
        Number of the instance in the sequence. e.g. in a medical time series,
        the second clinical visit of a patient would be the instance number 1
        (counting starts at 0).
    ref_output : torch.Tensor
        Original model outputs of each instance in the sequence.
    x_length : int
        True sequence length, dismissing padding.
    occlusion_wgt : float, default 0.7
            Weight given to the occlusion part of the instance importance score.
            This scores is calculated as a weighted average of the instance's
            influence on the final output and the variation of the output
            probability, between the current instance and the previous one. As
            such, this weight should have a value between 0 and 1, with the
            output variation receiving the remaining weight (1 - occlusion_wgt),
            where 0 corresponds to not using the occlusion component at all, 0.5
            is a normal, unweighted average and 1 deactivates the use of the
            output variation part. If the value wasn't specified in the
            intepreter's initialization nor in the method argument, it will
            default to 0.7
    id_column : int, default 0
            Number of the column which corresponds to the subject identifier in
            the data tensor.
    inst_column : int, default 1
        Number of the column which corresponds to the instance or timestamp
        identifier in the data tensor.

    Returns
    -------
    inst_score : float
        Instance importance score calculated for the current instance, with the
        specified parameters.
    '''
    # Remove identifier columns from the data
    sequence_data = du.deep_learning.remove_tensor_column(sequence_data, [id_column, inst_column], inplace=True)
    # Indeces without the instance that is being analyzed
    instances_idx = list(range(sequence_data.shape[0]))
    instances_idx.remove(instance)
    # Sequence data without the instance that is being analyzed
    sequence_data = sequence_data[instances_idx, :]
    # Add a third dimension for the data to be readable by the model
    sequence_data = sequence_data.unsqueeze(0)
    # Update the sequence length as the instance is removed
    new_seq_length = x_length-1
    # Calculate the output without the instance that is being analyzed
    new_output = model(sequence_data[:, :new_seq_length, :])
    # Only use the last output (i.e. the one from the last instance of the sequence)
    new_output = new_output[new_seq_length-1].item()
    # Flag that indicates whether the output variation component will be used in the instance importance score
    # (in a weighted average)
    use_outvar_score = ref_output.shape[0] > 1 and instance > 0
    if use_outvar_score:
        # Get the output from the previous instance
        prev_output = ref_output[instance-1].item()
        # Get the output from the current instance
        curr_output = ref_output[instance].item()
    # Get the last output
    ref_output = ref_output[x_length-1].item()
    # The instance importance score is then the difference between the output probability with the instance
    # and the probability without the instance
    inst_score = ref_output - new_output
    if instance > 0 and use_outvar_score:
        # If it's not the first instance, add the output variation characteristic in a weighted average
        inst_score = occlusion_wgt * inst_score + (1 - occlusion_wgt) * (curr_output - prev_output)
    # Apply a tanh function to make even the smaller scores (which are the most frequent) more salient
    inst_score = np.tanh(4 * inst_score)
    return inst_score

class KernelFunction:
    def __init__(self, model, model_type='multivariate_rnn'):
        # Save the model object to be used in the main function
        self.model = model
        # Log the model type
        model_type = model_type.lower()
        if model_type == 'multivariate_rnn' or model_type == 'mlp':
            self.model_type = model_type
        else:
            raise Exception(f'ERROR: Invalid model type. It must be "multivariate_rnn" or "mlp", not {model_type}.')

    def f(self, data, hidden_state=None):
        '''Function that will be used in the SHAP kernel explainer, converting
        a NumPy array into the model's output.

        Parameters
        ----------
        data : numpy.ndarray
            Data corresponding to a single instance (or timestamp, in a time
            series) used in the SHAP kernel explainer.
        hidden_state : torch.Tensor or tuple of two torch.Tensor, default None
            Hidden state coming from the previous recurrent cell. If none is
            specified, the hidden state is initialized as zero.

        Returns
        -------
        output : numpy.ndarray
            Output of the model obtained with the given instance data and
            possible hidden state.
        '''
        if isinstance(data, np.ndarray):
            # Make sure the data is of type float
            data = torch.from_numpy(data).float()
        # Calculate the output
        if self.model_type == 'multivariate_rnn':
            if len(data.shape) < 3:
                data = data.unsqueeze(0)
            output = self.model(data, hidden_state=hidden_state)
        elif self.model_type == 'mlp':
            output = self.model(data)
        else:
            raise Exception(f'ERROR: Invalid model type. It must be "multivariate_rnn" or "mlp", not {self.model_type}.')
        if torch.cuda.is_available():
            return output.detach().cpu().numpy()
        else:
            return output.detach().numpy()

class ModelInterpreter:
    '''A machine learning model interpreter which calculates instance and
    feature importance.

    The current focus of the class is to analyze neural networks built in
    the PyTorch framework, which classify sequential data with potentially
    variable sequence length.

    Parameters
    ----------
    model : nn.Module
        Machine learning model which will be interpreted.
    data : torch.Tensor or pandas.DataFrame, default None
        Data used in the interpretation, either directly by analyzing the
        outputs obtained with each sample or indireclty by using as
        background data in methods such as SHAP explainers. The data will be
        used in PyTorch tensor format, but the user can submit it as a
        pandas dataframe, which is then automatically padded and converted.
    labels : torch.Tensor, default None
        Labels corresponding to the data used, either specified in the input
        or all the data that the interpreter has.
    model_type : string, default 'multivariate_rnn'
        Sets the type of machine learning model. Important to know what type
        of inference and data processing to do. Currently available options
        are ['multivariate_rnn', 'mlp'].
    is_custom : bool, default False
        If set to True, the method will assume that the model being used is a
        custom built one, which won't require sequence length information during
        the feedforward process.
    already_embedded : bool, default False
        If set to True, it means that the categorical features are already
        embedded when fetching a batch, i.e. there's no need to run the embedding
        layer(s) during the model's feedforward.
    seq_len_dict : dict, default None
        Dictionary containing the sequence lengths for each index of the
        original dataframe. This allows to ignore the padding done in
        the fixed sequence length tensor.
    id_column_num : int, default None
        Number of the column which corresponds to the subject identifier in
        the data tensor.
    id_column_name : string, default None
        Name of the column which corresponds to the subject identifier in
        the data tensor.
    inst_column_num : int, default None
        Number of the column which corresponds to the instance or timestamp
        identifier in the data tensor.
    inst_column_name : string, default None
        Name of the column which corresponds to the instance or timestamp
        identifier in the data tensor.
    label_column_num : int, default None
        Number of the column which corresponds to the label in the data
        tensor. Only needed if the data is in dataframe format.
    label_column_name : string, default None
        Name of the column which corresponds to the label in the data
        tensor. Only needed if the data is in dataframe format.
    fast_calc : bool, default True
        If set to True, the algorithm uses less background samples (SHAP)
        or optimization steps (mask filter), in order to do a fast
        interpretation of the model. If set to False, the process takes
        more time in order to get a more precise and truthful
        interpretation of the model's behavior, requiring longer
        computation times.
    SHAP_bkgnd_samples : int, default 'auto'
        Number of samples to use as background data, in case a SHAP
        explainer is applied (fast_calc must be set to False).
    random_seed : integer, default 42
        Seed used when shuffling the data.
    feat_names : list of string, default None
        Column names of the dataframe associated to the data. If no list is
        provided, the dataframe should be given in the data argument, so as
        to fetch the names of the columns.
    padding_value : numeric
        Value to use in the padding, to fill the sequences.
    occlusion_wgt : float, default 0.7
        Weight given to the occlusion part of the instance importance score.
        This scores is calculated as a weighted average of the instance's
        influence on the final output and the variation of the output
        probability, between the current instance and the previous one. As
        such, this weight should have a value between 0 and 1, with the
        output variation receiving the remaining weight (1 - occlusion_wgt),
        where 0 corresponds to not using the occlusion component at all, 0.5
        is a normal, unweighted average and 1 deactivates the use of the
        output variation part.
    total_length : int, default None
        If not None, the feature importance scores will be padded to have
        length total_length.
    '''
    def __init__(self, model, data=None, labels=None, model_type='multivariate_rnn',
                 is_custom=False, already_embedded=False, seq_len_dict=None,
                 id_column_num=None, id_column_name=None, inst_column_num=None,
                 inst_column_name=None, label_column_num=None, label_column_name=None,
                 fast_calc=True, SHAP_bkgnd_samples='auto', random_seed=42,
                 feat_names=None, padding_value=999999, occlusion_wgt=0.7,
                 total_length=None):
        # Initialize parameters according to user input
        self.model = model
        self.data = data
        self.seq_len_dict = seq_len_dict
        self.id_column_num = id_column_num
        self.id_column_name = id_column_name
        self.inst_column_num = inst_column_num
        self.inst_column_name = inst_column_name
        self.label_column_num = label_column_num
        self.label_column_name = label_column_name
        self.fast_calc = fast_calc
        self.SHAP_bkgnd_samples = SHAP_bkgnd_samples
        self.random_seed = random_seed
        self.feat_names = feat_names
        self.padding_value = padding_value
        self.occlusion_wgt = occlusion_wgt
        self.total_length = total_length
        if model_type == 'multivariate_rnn' or model_type == 'mlp':
            self.model_type = model_type
        else:
            raise Exception(f'ERROR: Invalid model type. It must be "multivariate_rnn" or "mlp", not {model_type}.')
        self.is_custom = is_custom
        self.already_embedded = already_embedded

        # Put the model in evaluation mode to deactivate dropout
        self.model.eval()

        if data is not None:
            if type(data) is torch.Tensor:
                self.data = data
                self.labels = labels
                if model_type == 'mlp':
                    self.data = du.deep_learning.remove_tensor_column(data, id_column, inplace=True)
            elif type(data) is np.ndarray:
                # Convert from numpy to pytorch
                self.data = torch.from_numpy(data)
                self.labels = torch.from_numpy(labels)
                if model_type == 'mlp':
                    self.data = du.deep_learning.remove_tensor_column(data, id_column, inplace=True)
            elif type(data) is pd.DataFrame:
                # Fetch the column names, ignoring the ID column
                self.feat_names = list(data.columns)
                if self.id_column_num is None and self.id_column_name is not None:
                    # Find the ID column number
                    self.id_column_num = du.search_explore.find_col_idx(data, self.id_column_name)
                elif self.id_column_num is not None and self.id_column_name is None:
                    # Convert the ID column index to the column name
                    self.id_column_name = self.feat_names[self.id_column_num]
                if self.inst_column_num is None and self.inst_column_name is not None:
                    # Find the instance column number
                    self.inst_column_num = du.search_explore.find_col_idx(data, self.inst_column_name)
                elif self.inst_column_num is not None and self.inst_column_name is None:
                    # Convert the instance column index to the column name
                    self.inst_column_name = self.feat_names[self.inst_column_num]
                if self.total_length is None:
                    # Find the maximum sequence length, so that the ML models and their related methods can handle all sequences, which have varying sequence lengths
                    self.total_length = data.groupby(self.id_column_name)[self.inst_column_name].count().max()
                if self.label_column_num is None:
                    if self.label_column_name is not None:
                        # Find the instance column number
                        self.label_column_num = du.search_explore.find_col_idx(data, self.label_column_name)
                    else:
                        # Counter that indicates in which column we're in when searching for the label column
                        col_num = 0
                        for col in data.columns:
                            if 'label' in col:
                                # Column name corresponding to the label
                                self.label_column_name = col
                                # Column number corresponding to the label
                                self.label_column_num = col_num
                                break
                            col_num += 1
                if self.label_column_name is None:
                    self.label_column_name = self.feat_names[self.label_column_num]
                self.feat_names = du.utils.remove_from_list(self.feat_names,
                                                            to_remove=[self.id_column_name,
                                                                       self.label_column_name],
                                                            update_idx=False)
                # Fetch the column numbers, ignoring the ID column
                self.feat_num = list(range(len(data.columns)))
                self.feat_num = du.utils.remove_from_list(self.feat_num,
                                                          to_remove=self.id_column_num,
                                                          update_idx=False)
                # Also update the idx when removing the label, since the features
                # tensors aren't going to contain the label
                self.feat_num = du.utils.remove_from_list(self.feat_num,
                                                          to_remove=self.label_column_num,
                                                          update_idx=True)
                if self.model_type == 'multivariate_rnn':
                    # Also ignore the instance ID column
                    self.feat_names = du.utils.remove_from_list(self.feat_names,
                                                                to_remove=self.inst_column_name,
                                                                update_idx=False)
                    self.feat_num = du.utils.remove_from_list(self.feat_num,
                                                              to_remove=self.inst_column_num,
                                                              update_idx=False)
                    # Find the sequence lengths of the data
                    self.seq_len_dict = du.padding.get_sequence_length_dict(data, id_column=self.id_column_name, ts_column=self.inst_column_name)
                    # Pad data (to have fixed sequence length) and convert into a PyTorch tensor
                    data_tensor = du.padding.dataframe_to_padded_tensor(data, seq_len_dict=self.seq_len_dict, id_column=self.id_column_name,
                                                                        ts_column=self.inst_column_name, padding_value=padding_value,
                                                                        label_column=self.label_column_name, total_length=self.total_length,
                                                                        inplace=True)
                    # Separate labels from features
                    dataset = du.datasets.Time_Series_Dataset(data, data_tensor,
                                                              seq_len_dict=self.seq_len_dict,
                                                              label_name=self.label_column_name)
                elif self.model_type == 'mlp':
                    # Convert into a PyTorch tensor
                    data_tensor = torch.from_numpy(data.numpy())
                    # Separate labels from features
                    dataset = du.datasets.Tabular_Dataset(data_tensor, data)

                self.data = dataset.X
                self.labels = dataset.y
            else:
                raise Exception('ERROR: Invalid data type. Please provide data in a Pandas DataFrame, PyTorch Tensor or NumPy Array format.')
        else:
            # Convert the column indeces to the column names
            if self.id_column_num is None and self.id_column_name is not None:
                # Find the ID column number
                self.id_column_num = self.feat_names.index(self.id_column_name)
            elif self.id_column_num is not None and self.id_column_name is None:
                # Convert the ID column index to the column name
                self.id_column_name = self.feat_names[self.id_column_num]
            if self.inst_column_num is None and self.inst_column_name is not None:
                # Find the instance column number
                self.inst_column_num =  self.feat_names.index(self.inst_column_name)
            elif self.inst_column_num is not None and self.inst_column_name is None:
                # Convert the instance column index to the column name
                self.inst_column_name = self.feat_names[self.inst_column_num]
            if self.label_column_num is None and self.label_column_name is not None:
                # Find the label column number
                self.label_column_num =  self.feat_names.index(self.label_column_name)
            elif self.label_column_num is not None and self.label_column_name is None:
                # Convert the label column index to the column name
                self.label_column_name = self.feat_names[self.label_column_num]
            # Fetch the column numbers, ignoring the ID column
            self.feat_num = list(range(len(self.feat_names)))
            self.feat_num = du.utils.remove_from_list(self.feat_num,
                                                      to_remove=self.id_column_num,
                                                      update_idx=False)
            self.feat_names = du.utils.remove_from_list(self.feat_names,
                                                        to_remove=self.id_column_name,
                                                        update_idx=False)
            if self.label_column_num is not None:
                # Also update the idx when removing the label, since the features
                # tensors aren't going to contain the label
                self.feat_names = du.utils.remove_from_list(self.feat_names,
                                                            to_remove=self.label_column_name,
                                                            update_idx=False)
                self.feat_num = du.utils.remove_from_list(self.feat_num,
                                                        to_remove=self.label_column_num,
                                                        update_idx=True)
            if self.model_type == 'multivariate_rnn':
                # Also ignore the instance ID column
                self.feat_names = du.utils.remove_from_list(self.feat_names,
                                                            to_remove=self.inst_column_name,
                                                            update_idx=False)
                self.feat_num = du.utils.remove_from_list(self.feat_num,
                                                          to_remove=self.inst_column_num,
                                                          update_idx=False)

        # Declare explainer attribute which will store the SHAP Explainer object
        self.explainer = None
        # Declare attributes that will store importance scores (instance and feature importance)
        self.inst_scores = None
        self.feat_scores = None

    def create_bkgnd_test_sets(self, shuffle_dataset=True):
        '''Distributes the data into background and test sets and returns
        the respective data tensors.

        Parameters
        ----------
        random_seed : integer, default 42
            Seed used when shuffling the data.
        shuffle_dataset : bool, default True
            If set to True, the data of which set is shuffled.

        Returns
        -------
        bkgnd_data : torch.Tensor, default None
            Background data used in the SHAP explainer to estimate conditional
            expectations.
        test_data : torch.Tensor, default None
            A subset of data on which model interpretation will be made (i.e.
            calculating feature and/or instance importance).
        '''
        # Create data indices for training and test splits
        dataset_size = self.data.shape[0]
        indices = list(range(dataset_size))
        if shuffle_dataset:
            # Shuffle data
            np.random.seed(self.random_seed)
            np.random.shuffle(indices)
        bkgnd_indices, test_indices = indices[:self.SHAP_bkgnd_samples], indices[self.SHAP_bkgnd_samples:]

        # Get separate tensors for the background data and the test data
        bkgnd_data = self.data[bkgnd_indices]
        test_data = self.data[test_indices]
        return bkgnd_data, test_data

    def mask_filter_step(self, mask, data, ref_output, l1_coeff=1,
                         hidden_state=None, debug_loss=False):
        '''Perform a single optimization step to calculate a new version of the
        mask filter.

        Parameters
        ----------
        mask : numpy.Array
            Current mask filter, either the initial one or from the previous
            optimization iteration.
        data : torch.Tensor
            Data sample which will be used to determine the most relevant
            features. In case of multivariate sequential data, this must be a
            single instance of a sequence.
        ref_output : torch.Tensor or float
            Model's output to the original instance, with no mask filters applied.
        l1_coeff : int, default 1
            Weight given in the loss function to the L1 norm of the mask filter.
        hidden_state : torch.Tensor or tuple of two torch.Tensor, default None
            Hidden state coming from the previous recurrent cell. If none is
            specified, the hidden state is initialized as zero.
        debug_loss : bool, default False
            Debugging flag, which makes the method also return an array of the
            optimization loss.

        Returns
        -------
        mask : numpy.Array
            Current mask filter, after the performed optimization step.

        if debug_loss is True:

        loss : float
            Current loss value of the mask filter optimization.
        '''
        # Get the model's output for the masked input data
        new_output = self.model((mask * data).unsqueeze(0).unsqueeze(0), hidden_state=hidden_state)
        # Calculate the loss function
        # • Minimize the number of activated mask filter units (occluded features)
        # • Maximize the change made to the output
        loss = l1_coeff * torch.mean(torch.abs(1 - mask)) + 1 - (ref_output - new_output).pow(2)
        # Backpropagate the loss function and run an optimization step (update the mask filter)
        loss.backward(retain_graph=True)
        mask.grad = du.deep_learning.change_grad((-1) * mask.grad, mask.data)
        mask.data = mask.data + mask.grad
        # Make sure that the mask has values either 0 or 1
        mask.data.clamp_(0, 1)
        mask.data.round_()
        if debug_loss:
            return mask, loss.item()
        else:
            return mask

    # [TODO] Confirm that the mask filter is working in every scenario
    def mask_filter(self, data=None, x_lengths=None, max_iter=100, l1_coeff=1,
                    lr=0.001, recur_layer=None, see_progress=True, debug_loss=False):
        '''Calculate a mask filter for the given data samples, through an
        appropriate optimization.

        Parameters
        ----------
        data : torch.Tensor, default None
            Data sample(s) which will be used to determine the most relevant
            features. In case of multivariate sequential data, each instance will
            be analyzed seperately. If None, all data known to the model
            interpreter will be used.
        x_lengths : list of int
            Sorted list of sequence lengths, relative to the input data.
        max_iter : int, default 100
            Maximum number of iterations of the mask filter optimization, for
            each instance.
        l1_coeff : int, default 1
            Weight given in the loss function to the L1 norm of the mask filter.
        lr : float, default 0.001
            Learning rate used in the optimization algorithm.
        recur_layer : torch.nn.LSTM or torch.nn.GRU or torch.nn.RNN, default None
            Pointer to the recurrent layer in the model, if it exists. It should
            either be a LSTM, GRU or RNN network. If none is specified, the
            method will automatically search for a recurrent layer in the model.
        see_progress : bool, default True
            If set to True, a progress bar will show up indicating the execution
            of the feature importance scores calculations.
        debug_loss : bool, default False
            Debugging flag, which makes the method also return an array of the
            optimization loss.

        Returns
        -------
        mask : numpy.Array
            Output mask, after finishing the optimization for every specified
            sample. It will be inverted before returning, so as to be an array
            filled with zeros, except in the indeces corresponding to the most
            relevant features, where it will be one.

        if debug_loss is True:

        loss_mtx : np.Array
            Matrix containing the loss values of the mask filter optimization.
        '''
        # [TODO] Work on an option to use input data different from multivariate sequential
        if data is None:
            # If a subset of data to interpret isn't specified, the interpreter will use all the data
            data = self.data
        if x_lengths is None:
            # Sort the data by sequence length
            data, x_lengths = du.padding.sort_by_seq_len(data, self.seq_len_dict)
        if len(data.shape) > 1 and recur_layer is None:
            # Search for a recurrent layer
            if hasattr(self.model, 'lstm'):
                recur_layer = self.model.lstm
            elif hasattr(self.model, 'gru'):
                recur_layer = self.model.gru
            elif hasattr(self.model, 'rnn'):
                recur_layer = self.model.rnn
            else:
                raise Exception('ERROR: No recurrent layer found. Please specify it in the recur_layer argument.')

        # Confirm that the model is in evaluation mode to deactivate dropout
        self.model.eval()
        # Create a mask filter variable, initialized as an all ones tensor
        mask = torch.ones(data.shape)
        # [DEBUG] Create a loss matrix to analyse the convergence of mask filter optimizations
        loss_mtx = []

        if len(data.shape) == 3:
            # Loop to go through each sequence in the input data
            for seq in tqdm(range(data.shape[0]), disable=not see_progress):
                # Get the true length of the current sequence
                seq_len = x_lengths[seq]
                # Loop to go through each instance in the input sequence
                for inst in tqdm(range(seq_len), disable=not see_progress):
                    hidden_state = None
                    # Get the hidden state that the model receives as an input
                    if inst > 0:
                        # Get the hidden state outputed from the previous recurrent cell
                        _, hidden_state = recur_layer(data[:inst])
                        # Avoid backpropagating through previous instances
                        if type(hidden_state) is tuple:
                            hidden_state = (hidden_state[0].detach(), hidden_state[1].detach())
                        else:
                            hidden_state.detach_()
                    # Temporary mask filter for he current instance
                    tmp_mask = Variable(mask[seq, inst, :], requires_grad=True)
                    # [DEBUG] List of the current optimization's losses
                    tmp_loss_list = []
                    # Mask filter optimization loop
                    for iter in tqdm(range(max_iter), disable=not see_progress):
                        # Calculate the model's output to the original, unchanged instance data
                        ref_output = self.model(data[seq, inst, :].unsqueeze(0).unsqueeze(0), hidden_state=hidden_state)
                        # Prevent mask filter optimization from backpropagating through the reference output
                        ref_output.detach_()
                        # Perform a single optimization step
                        tmp_mask, tmp_loss = self.mask_filter_step(tmp_mask, data[seq, inst, :], ref_output, l1_coeff, hidden_state, debug_loss=debug_loss)
                        tmp_loss_list.append(tmp_loss)
                    # Save the optimized mask filter of the current instance
                    mask[seq, inst, :] = tmp_mask
                    # [DEBUG] Add the current instance's optimization logs to the overall loss matrix
                    loss_mtx.append(tmp_loss_list)

        elif len(data.shape) == 2:
            # Loop to go through each instance in the input sequence
            for inst in tqdm(range(data.shape[0]), disable=not see_progress):
                hidden_state = None
                # Get the hidden state that the model receives as an input
                if inst > 0:
                    # Get the hidden state outputed from the previous recurrent cell
                    _, hidden_state = recur_layer(data[:inst])
                    # Avoid backpropagating through previous instances
                    if type(hidden_state) is tuple:
                        hidden_state = (hidden_state[0].detach(), hidden_state[1].detach())
                    else:
                        hidden_state.detach_()
                # Temporary mask filter for he current instance
                tmp_mask = Variable(mask[inst], requires_grad=True)
                # Mask filter optimization loop
                for iter in tqdm(range(max_iter), disable=not see_progress):
                    # Calculate the model's output to the original, unchanged instance data
                    ref_output = self.model(data[inst].unsqueeze(0).unsqueeze(0), hidden_state=hidden_state)
                    # Prevent mask filter optimization from backpropagating through the reference output
                    ref_output.detach_()
                    # Perform a single optimization step
                    tmp_mask = self.mask_filter_step(tmp_mask, data[inst], ref_output, l1_coeff, hidden_state)
                # Save the optimized mask filter of the current instance
                mask[inst] = tmp_mask

        elif len(data.shape) == 1:
            # Make sure that the mask can be optimized properly
            mask.requires_grad_()
            # Mask filter optimization loop
            for iter in tqdm(range(max_iter), disable=not see_progress):
                # Calculate the model's output to the original, unchanged instance data
                ref_output = self.model(data.unsqueeze(0).unsqueeze(0), hidden_state=hidden_state)
                # Prevent mask filter optimization from backpropagating through the reference output
                ref_output.detach_()
                # Perform a single optimization step
                mask = self.mask_filter_step(mask, data, ref_output, l1_coeff)

        else:
            raise Exception(f'ERROR: Can\'t handle data with more than 3 dimensions. Submitted data with {len(data.shape)} dimensions.')

        # Return the inverted version of the mask, to atrribute 1 (one) to the most relevant features
        if debug_loss:
            return 1 - mask, loss_mtx
        else:
            return 1 - mask

    def instance_importance(self, data=None, labels=None, x_lengths=None,
                            see_progress=True, occlusion_wgt=0.7):
        '''Calculate the instance importance scores to interpret the impact of
        each instance of a sequence on the final output.

        Parameters
        ----------
        data : torch.Tensor, default None
            Optionally, the user can specify a subset of data on which model
            interpretation will be made (i.e. calculating feature and/or
            instance importance). Otherwise, all the data is used.
        labels : torch.Tensor, default None
            Labels corresponding to the data used, either specified in the input
            or all the data that the interpreter has.
        x_lengths : list of int
            Sorted list of sequence lengths, relative to the input data.
        see_progress : bool, default True
            If set to True, a progress bar will show up indicating the execution
            of the instance importance scores calculations.
        occlusion_wgt : float, default 0.7
            Weight given to the occlusion part of the instance importance score.
            This scores is calculated as a weighted average of the instance's
            influence on the final output and the variation of the output
            probability, between the current instance and the previous one. As
            such, this weight should have a value between 0 and 1, with the
            output variation receiving the remaining weight (1 - occlusion_wgt),
            where 0 corresponds to not using the occlusion component at all, 0.5
            is a normal, unweighted average and 1 deactivates the use of the
            output variation part. If the value wasn't specified in the
            intepreter's initialization nor in the method argument, it will
            default to 0.7

        Returns
        -------
        inst_scores : numpy.Array
            Array containing the importance scores of each instance in the
            given input sequences.
        '''
        if occlusion_wgt is None:
            if self.occlusion_wgt is not None:
                # Set to the class's occlusion weight value
                occlusion_wgt = self.occlusion_wgt
            else:
                # Set the occlusion weight value to 0.7 (default)
                occlusion_wgt = 0.7
                self.occlusion_wgt = occlusion_wgt

        # Confirm that the occlusion weight has a valid value (between 0 and 1)
        if occlusion_wgt > 1 or occlusion_wgt < 0:
            raise Exception(f'ERROR: Inserted invalid occlusion weight value {occlusion_wgt}. Please replace with a value between 0 and 1.')

        if occlusion_wgt < 1:
            # If the output variation is used in the calculation of the score,
            # get the reference outputs for all the instances of the sequences
            seq_final_outputs = False
        else:
            # Otherwise, only the final outputs of the sequences are retrieved
            seq_final_outputs = True

        if data is None:
            # If a subset of data to interpret isn't specified, the interpreter will use all the data
            data = self.data
            labels = self.labels
        # Make sure that the data is in type float
        data = data.float()
        # Model output when using all the original instances in the input sequences
        ref_output, _ = du.deep_learning.model_inference(self.model, data=(data, labels),
                                                         metrics=[''], model_type=self.model_type,
                                                         is_custom=self.is_custom,
                                                         seq_len_dict=self.seq_len_dict,
                                                         padding_value=self.padding_value,
                                                         seq_final_outputs=seq_final_outputs,
                                                         cols_to_remove=[self.id_column_num, self.inst_column_num],
                                                         already_embedded=self.already_embedded)

        if not seq_final_outputs:
            # Cumulative sequence lengths (true end of the sequences)
            final_seq_idx = np.cumsum(x_lengths)
            start_idx = np.roll(final_seq_idx, 1)
            start_idx[0] = 0
            ref_output = [ref_output[start_idx[i]:final_seq_idx[i]] for i in range(len(start_idx))]

        inst_scores = [[calc_instance_score(self.model, data[seq_num, :, :], inst, ref_output[seq_num],
                                            x_lengths[seq_num], occlusion_wgt, self.id_column_num,
                                            self.inst_column_num)
                        for inst in range(x_lengths[seq_num])] for seq_num in tqdm(range(data.shape[0]), disable=not see_progress)]
        # DEBUG
        # inst_scores = []
        # for seq_num in tqdm(range(data.shape[0]), disable=not see_progress):
        #     tmp_list = []
        #     for inst in range(x_lengths[seq_num]):
        #         tmp_list.append(calc_instance_score(self.model, data[seq_num, :, :], inst, ref_output[seq_num],
        #                                             x_lengths[seq_num], occlusion_wgt, self.id_column_num, self.inst_column_num))
        #     inst_scores.append(tmp_list)

        # Pad the instance scores lists so that all have the same length
        inst_scores = [du.padding.pad_list(scores_list, data.shape[1], padding_value=self.padding_value)
                       for scores_list in inst_scores]
        # Convert to a NumPy array
        inst_scores = np.array(inst_scores)
        return inst_scores

    def feature_importance(self, test_data=None, model_type=None,
                           method='shap', fast_calc=None, see_progress=True,
                           bkgnd_data=None, max_iter=100, l1_coeff=0, lr=0.001,
                           recur_layer=None, create_new_explainer=True, debug_loss=False,
                           total_length=None):
        '''Calculate the feature importance scores to interpret the impact
        of each feature in each instance's output.

        Parameters
        ----------
        test_data : torch.Tensor, default None
            Optionally, the user can specify a subset of data on which model
            interpretation will be made (i.e. calculating feature and/or
            instance importance). Otherwise, all the data is used.
        model_type : string, default 'multivariate_rnn'
            Sets the type of machine learning model. Important to know what type
            of inference and data processing to do. Currently available options
            are ['multivariate_rnn', 'mlp'].
        method : string, defautl SHAP
            Defines which interpretability technique to use. Current options
            include SHAP Kernel Explainer (default) and mask filter.
        fast_calc : bool, default None
            If set to True, the algorithm uses less background samples (SHAP)
            or optimization steps (mask filter), in order to do a fast
            interpretation of the model. If set to False, the process takes
            more time in order to get a more precise and truthful
            interpretation of the model's behavior, requiring longer
            computation times.
        see_progress : bool, default True
            If set to True, a progress bar will show up indicating the execution
            of the feature importance scores calculations.
        total_length : int, default None
            If not None, the feature importance scores will be padded to have
            length total_length.

        if fast_calc is False:

        bkgnd_data : torch.Tensor, default None
            In case of setting fast_calc to False, which makes the algorithm
            require background data in SHAP during the feature importance, the
            background data used in the explainer can be set through this
            parameter.

        if fast_calc is True:

        max_iter : int, default 100
            Maximum number of iterations of the mask filter optimization, for
            each instance.
        l1_coeff : int, default 1
            Weight given in the loss function to the L1 norm of the mask filter.
        lr : float, default 0.001
            Learning rate used in the optimization algorithm of the mask filter.
        recur_layer : torch.nn.LSTM or torch.nn.GRU or torch.nn.RNN, default None
            Pointer to the recurrent layer in the model, if it exists. It should
            either be a LSTM, GRU or RNN network. If none is specified, the
            method will automatically search for a recurrent layer in the model.
        create_new_explainer : bool, default True
            Sets if we'll create a new SHAP KernelExplainer or if we'll use a
            previously defined one in the current model interpreter object.
        debug_loss : bool, default False
            Debugging flag, which makes the method also return an array of the
            mask filter optimization loss.

        Returns
        -------
        feat_scores : numpy.Array
            Array containing the importance scores of each feature, of each
            instance, in the given input sequences.

        if debug_loss is True:

        loss_mtx : np.Array
            Matrix containing the loss values of the mask filter optimization.
        '''
        if fast_calc is None:
            # Use the predefined option if fast_calc isn't set in the function call
            fast_calc = self.fast_calc
        else:
            self.fast_calc = fast_calc
        if model_type is None:
            # Use the predefined option if model_type isn't set in the function call
            model_type = self.model_type
        else:
            self.model_type = model_type
        if total_length is None:
            # Use the predefined option if total_length isn't set in the function call
            total_length = self.total_length

        if model_type == 'multivariate_rnn':
            # Sort the test data by sequence length
            test_data, x_lengths_test = du.padding.sort_by_seq_len(test_data, self.seq_len_dict)
        # Set an indicator to log that the current model is a RNN
        isRNN = model_type == 'multivariate_rnn'
        # Set an indicator to log that the current model is a bidirectional
        isBidir = self.model.bidir

        if method.lower() == 'shap':
            if create_new_explainer is True:
                # Go through all of the steps of initialiazing a new SHAP KernelExplainer
                if fast_calc:
                    print(f'Attention: you have chosen to interpret the model using SHAP, with one background sample (all zeros), with {self.SHAP_bkgnd_samples} reevalutions per prediction applied to {test_data.shape[0]} test samples. This might take a while. Depending on your computer\'s processing power, you should do a coffee break or even go to sleep!')
                    print('Evaluating the model with a reference value of zero. This should only be done if all the data is processed in a way that, for categorical features, 0 represents missing attribute and, for continuous features, 0 represents the average value of that feature.')
                    # Use a single all zeroes sample as a reference value
                    num_id_features = sum([1 if i is not None else 0 for i in [self.id_column_num, self.inst_column_num]])
                    bkgnd_data = np.zeros((1, len(self.feat_names) + num_id_features))
                else:
                    print(f'Attention: you have chosen to interpret the model using SHAP, with {bkgnd_data.shape[0]} background samples, with {self.SHAP_bkgnd_samples} reevalutions per prediction applied to {test_data.shape[0]} test samples. This might take a while. Depending on your computer\'s processing power, you should do a coffee break or even go to sleep!')
                    if model_type.lower() == 'multivariate_rnn':
                        # Sort the background data by sequence length
                        bkgnd_data, x_lengths_bkgnd = du.padding.sort_by_seq_len(bkgnd_data, self.seq_len_dict)
                        # Convert the background data into a 2D NumPy matrix
                        bkgnd_data = du.deep_learning.ts_tensor_to_np_matrix(bkgnd_data, self.feat_num, self.padding_value)
                    elif model_type.lower() == 'mlp':
                        # Just convert background data into a NumPy matrix
                        bkgnd_data = bkgnd_data.numpy()
                if model_type.lower() == 'multivariate_rnn':
                    # Convert the test data into a 2D NumPy matrix
                    test_data = du.deep_learning.ts_tensor_to_np_matrix(test_data, self.feat_num, self.padding_value)
                elif model_type.lower() == 'mlp':
                    # Remove ID columns from the data
                    bkgnd_data = du.deep_learning.remove_tensor_column(bkgnd_data, [self.id_column_num, self.inst_column_num], inplace=True)
                    test_data = du.deep_learning.remove_tensor_column(test_data, [self.id_column_num, self.inst_column_num], inplace=True)
                    # Convert test data into a NumPy matrix
                    test_data = test_data.numpy()
                # Create a function that represents the model's feedforward operation on a single instance
                kf = KernelFunction(self.model, model_type=model_type)
                # Use the background dataset to integrate over
                print('Creating a SHAP kernel explainer...')
                # [TODO] Removing this part of directly handling pure RNN models, as the `is_custom` parameter collides
                # with other definitions of it; ignoring for now as I'm never using pure RNNs, without any modification
                # or at least wrapping in some class.
                # if self.is_custom is False:
                    # # Let SHAP find the recurrent layer
                    # recur_layer = None
                # else:
                # When using custom models, the whole model behaves as a recurrent layer
                # We just need to make sure that it returns the hidden state
                recur_layer = partial(self.model.forward, get_hidden_state=True)
                self.explainer = shap.KernelExplainer(kf.f, bkgnd_data, isRNN=isRNN, isBidir=isBidir,
                                                      model_obj=self.model, max_bkgnd_samples=100,
                                                      id_col_num=self.id_column_num,
                                                      ts_col_num=self.inst_column_num,
                                                      recur_layer=recur_layer)
            # Count the time that takes to calculate the SHAP values
            start_time = time.time()
            # Explain the predictions of the sequences in the test set
            print('Calculating feature importance scores for each instance in the test data...')
            feat_scores = self.explainer.shap_values(test_data, l1_reg='num_features(10)', nsamples=self.SHAP_bkgnd_samples, max_seq_len=total_length)
            print(f'Calculation of SHAP values took {time.time() - start_time} seconds')
            return feat_scores

        else:
            # [TODO] Fix mask filter feature importance
            # [TODO] Add fast and slower versions of the mask filter
            # Remove identifier columns from the test data
            test_data = test_data[:, :, self.feat_num]
            # Make sure that the test data is in type float
            test_data = test_data.float()
            # Count the time that takes to calculate the SHAP values
            start_time = time.time()
            # Apply mask filter
            feat_scores, loss_mtx = self.mask_filter(test_data, x_lengths_test, max_iter,
                                                     l1_coeff, lr, recur_layer, debug_loss)
            print(f'Calculation of mask filter values took {time.time() - start_time} seconds')
            if debug_loss:
                return feat_scores, loss_mtx
            else:
                return feat_scores
        # [TODO] Add more interpretability techniques, such as LIME and Agglomerative Contextual Decomposition (ACD)

    # [Bonus TODO] Upload model explainer and interpretability plots to Comet.ml
    def interpret_model(self, bkgnd_data=None, test_data=None, test_labels=None,
                        new_data=False, model_type=None, df=None,
                        instance_importance=True, feature_importance=False,
                        fast_calc=None, create_new_explainer=True,
                        see_progress=True, save_data=True, debug_loss=False,
                        total_length=None):
        '''Method to calculate scores of feature and/or instance importance, in
        order to be able to interpret a model on a given data.

        Parameters
        ----------
        bkgnd_data : torch.Tensor, default None
            In case of setting fast_calc to False, which makes the algorithm
            require background data in SHAP during the feature importance, the
            background data used in the explainer can be set through this
            parameter.
        test_data : torch.Tensor, default None
            Optionally, the user can specify a subset of data on which model
            interpretation will be made (i.e. calculating feature and/or
            instance importance) as a PyTorch tensor. Otherwise, all the data is
            used.
        test_labels : torch.Tensor, default None
            Labels corresponding to the data used, either specified in the input
            or all the data that the interpreter has.
        new_data : bool, default False
            If set to True, it indicates that the data that will be interpreted
            hasn't been seen before, i.e. it has different ids than those in the
            original dataset defined in the object initialization. This implies
            that a dataframe of the new data is provided (parameter df) so that
            the sequence lengths are calculated. Otherwise, the original
            sequence lengths known by the model interpreter are used.
        model_type : string, default None
            Sets the type of machine learning model. Important to know what type
            of inference and data processing to do. Currently available options
            are ['multivariate_rnn', 'mlp'].
        df : pandas.DataFrame, default None
            Dataframe containing the new data so as to calculate the sequence
            lengths of the new ids. Only used if new_data is set to True and
            `model_type` is 'multivariate_rnn'.
        instance_importance : bool, default True
            If set to True, instance importance is made on the data. In other
            words, the algorithm will analyze the impact that each instance of
            an input sequence had on the output.
        feature_importance : bool or string, default False
            Defines which feature importance interpretability technique to use.
            The algorithm will analyze the impact that each feature of
            an instance had on the output. This is analyzed instance by instance,
            not in the entire sequence at once. For example, from the feature
            importance alone, it's not straightforward how a value in a previous
            instance impacted the current output. Current options include SHAP
            Kernel Explainer ('shap') and 'mask filter'. If set to False, no
            feature importance will be done.
        fast_calc : bool, default None
            If set to True, the algorithm uses less background samples (SHAP)
            or optimization steps (mask filter), in order to do a fast
            interpretation of the model. If set to False, the process takes
            more time in order to get a more precise and truthful
            interpretation of the model's behavior, requiring longer
            computation times.
        create_new_explainer : bool, default True
            Sets if we'll create a new SHAP KernelExplainer or if we'll use a
            previously defined one in the current model interpreter object.
        see_progress : bool, default True
            If set to True, a progress bar will show up indicating the execution
            of the instance importance scores calculations.
        save_data : bool, default True
            If set to True, the possible background data (used in the SHAP
            explainer) and the test data (on which importance scores are
            calculated) are saved as object attributes.
        debug_loss : bool, default False
            Debugging flag, which makes the method also return an array of the
            mask filter optimization loss.
        total_length : int, default None
            If not None, the feature importance scores will be padded to have
            length total_length.

        Returns
        -------
        inst_scores : numpy.Array
            Array containing the importance scores of each instance in the
            given input sequences. Only calculated if instance_importance is set
            to True.
        feat_scores : numpy.Array
            Array containing the importance scores of each feature, of each
            instance, in the given input sequences. Only calculated if
            feature_importance is set to True.

        if debug_loss is True:

        loss_mtx : np.Array
            Matrix containing the loss values of the mask filter optimization.
        '''
        # Confirm that the model is in evaluation mode to deactivate dropout
        self.model.eval()

        if feature_importance is not None and feature_importance is not False:
            try:
                feature_importance = feature_importance.lower()
                if feature_importance != 'shap' and feature_importance != 'mask filter':
                    raise Exception(f'ERROR: Specified {feature_importance} feature importance method isn\'t valid. Available options are \"shap\" and\"mask filter\".')
            except:
                raise Exception(f'ERROR: {feature_importance} is an incorrectly defined feature importance method, as it should be a string. Available options are \"shap\" and\"mask filter\".')

        if fast_calc is None:
            # Use the predefined option if fast_calc isn't set in the function call
            fast_calc = self.fast_calc
        else:
            self.fast_calc = fast_calc
        if model_type is None:
            # Use the predefined option if model_type isn't set in the function call
            model_type = self.model_type
        else:
            self.model_type = model_type
        if total_length is None:
            # Use the predefined option if total_length isn't set in the function call
            total_length = self.total_length

        if test_labels is not None:
            if type(test_labels) is np.ndarray:
                # Convert from numpy to pytorch
                test_labels = torch.from_numpy(test_labels)

        if test_data is None:
            if fast_calc:
                # If a subset of data to interpret isn't specified, the interpreter will use all the data
                test_data = self.data
                test_labels = self.labels
            else:
                if bkgnd_data is None:
                    # Get the background and test sets from the dataset
                    bkgnd_data, test_data = self.create_bkgnd_test_sets()
                else:
                    # Get the test set from the dataset
                    _, test_data = self.create_bkgnd_test_sets()
        elif type(test_data) is np.ndarray:
            # Convert from numpy to pytorch
            test_data = torch.from_numpy(test_data)

        if model_type == 'multivariate_rnn':
            if new_data is True:
                if df is None:
                    raise Exception('ERROR: A dataframe must be provided in order to work with the new data.')
                # Find the sequence lengths of the new data
                seq_len_dict = du.padding.get_sequence_length_dict(df, id_column=self.id_column_num, ts_column=self.inst_column_num)
                # Sort the data by sequence length
                test_data, test_labels, x_lengths_test = du.padding.sort_by_seq_len(test_data, seq_len_dict, test_labels)
            else:
                # Sort the data by sequence length
                test_data, test_labels, x_lengths_test = du.padding.sort_by_seq_len(test_data, self.seq_len_dict, test_labels)

        if not fast_calc:
            if bkgnd_data is None:
                # Get the background set from the dataset
                bkgnd_data, _ = self.create_bkgnd_test_sets()
            elif type(bkgnd_data) is np.ndarray:
                # Convert from numpy to pytorch
                bkgnd_data = torch.from_numpy(bkgnd_data)

        if save_data:
            # Save the data used in the model interpretation
            self.bkgnd_data = bkgnd_data
            self.test_data = test_data
            self.test_labels = test_labels

        if instance_importance is True:
            print('Calculating instance importance scores...')
            # Calculate the scores of importance of each instance
            self.inst_scores = self.instance_importance(test_data, test_labels, x_lengths_test, see_progress)

        if feature_importance is not False:
            print('Calculating feature importance scores...')
            # Calculate the scores of importance of each feature in each instance
            if feature_importance == 'mask filter' and debug_loss:
                self.feat_scores, loss_mtx = self.feature_importance(test_data, model_type,
                                                                     feature_importance,
                                                                     fast_calc, see_progress,
                                                                     bkgnd_data, debug_loss=True,
                                                                     total_length=total_length)
            else:
                self.feat_scores = self.feature_importance(test_data, model_type, feature_importance,
                                                           fast_calc, see_progress, bkgnd_data,
                                                           create_new_explainer=create_new_explainer,
                                                           debug_loss=False, total_length=total_length)

        print('Done!')

        if instance_importance and feature_importance:
            if fast_calc and debug_loss:
                return self.inst_scores, self.feat_scores, loss_mtx
            else:
                return self.inst_scores, self.feat_scores
        elif instance_importance and not feature_importance:
            return self.inst_scores
        elif not instance_importance and feature_importance:
            if fast_calc and debug_loss:
                return self.feat_scores, loss_mtx
            else:
                return self.feat_scores
        else:
            warnings.warn('Without setting instance_importance nor feature_importance to True, the interpret_model function won\'t do anything relevant.')
            return


    def instance_importance_plot(self, orig_data=None, inst_scores=None, seq_id=None,
                                 pred_prob=None, uniform_spacing=False,
                                 show_pred_prob=True, show_title=True,
                                 show_colorbar=True, click_mode='event+select',
                                 labels=None, seq_len=None, threshold=0,
                                 get_fig_obj=False, tensor_idx=True,
                                 max_seq=10, background_color='white',
                                 font_family='Roboto', font_size=14,
                                 font_color='black'):
        '''Create a bar chart that allows visualizing instance importance scores.

        Parameters
        ----------
        orig_data : torch.Tensor or numpy.Array, default None
            Original data used in the machine learning model. Used here to fetch
            the true ID corresponding to the plotted sequence.
        inst_scores : numpy.Array, default None
            Array containing the instance importance scores to be plotted.
        seq_id : int, default None
            ID or sequence index that select which time series / sequences to
            use in the plot. If it's a single value, the method plots a single
            sequence.
        pred_prob : numpy.Array or torch.Tensor or list of floats, default None
            Array containing the prediction probabilities for each sequence in
            the input data (orig_data). Only relevant if show_pred_prob is True.
        uniform_spacing : bool, default False
            Defines whether or not the sequences are displayed with uniform
            spacing (i.e. fixed distance) between their samples.
        show_pred_prob : bool, default True
            If set to True, a percentage bar chart will be shown to the right of
            the standard instance importance plot. If `pred_prob` isn't
            specified but the labels are, the prediction probabilities will be
            automatically calculated.
        show_title : bool, default True
            If set to True, the plot will have a title displayed above.
        show_colorbar : bool, default True
            If set to True, a bar legend will be shown, corresponding each color
            to each respective value.
        click_mode : string, default 'event+select'
            Determines the mode of single click interactions. "event" is the
            default value and emits the `plotly_click` event. In addition this
            mode emits the `plotly_selected` event in drag modes "lasso" and
            "select", but with no event data attached (kept for compatibility
            reasons). The "select" flag enables selecting single data points via
            click. This mode also supports persistent selections, meaning that
            pressing Shift while clicking, adds to / subtracts from an existing
            selection. "select" with `hovermode`: "x" can be confusing, consider
            explicitly setting `hovermode`: "closest" when using this feature.
            Selection events are sent accordingly as long as "event" flag is set
            as well. When the "event" flag is missing, `plotly_click` and
            `plotly_selected` events are not fired.
        labels : torch.Tensor, default None
            Labels corresponding to the data used, either specified in the input
            or all the data that the interpreter has.
        seq_len : int, default None
            Sequence lengths which represent the true, unpadded size of the
            input sequences.
        threshold : int or float, default 0
            Value to use as a threshold in the plot's color selection. In other
            words, values that exceed this threshold will have one color while the
            remaining have a different one, as specified in the parameters.
        get_fig_obj : bool, default False
            If set to True, the function returns the object that contains the
            displayed plotly figure.
        tensor_idx : bool, default True
            If set to True, the ID specified in the respective parameter
            constitutes the index where the desired sequence resides. Otherwise,
            it's the actual unique identifier that appears in the original data.
        max_seq : int, default 10
            Maximum number of sequences to show in the plot. This is meant to
            prevent cramming too many sequences into the graph window.
        background_color : str, default 'white'
            The plot's background color. Can be set in color name (e.g. 'white'),
            hexadecimal code (e.g. '#555') or RGB (e.g. 'rgb(0,0,255)').
        font_family : str, default 'Roboto'
            Text font family to be used in the numbers shown next to the graph.
        font_size : int, default 14
            Text font size to be used in the numbers shown next to the graph.
        font_color : str, default 'black'
            Text font color to be used in the numbers shown next to the graph. Can
            be set in color name (e.g. 'white'), hexadecimal code (e.g. '#555') or
            GB (e.g. 'rgb(0,0,255)').

        Returns
        -------
        fig : plotly.graph_objs.Figure or None
            If argument get_fig_obj is set to True, the figure object is returned.
            Otherwise, nothing is returned, only the plot is showned.'''
        if orig_data is None:
            # Use all the data if none was specified
            orig_data = self.data

            if labels is None:
                labels = self.labels

        if inst_scores is None:
            if self.inst_scores is None:
                raise Exception('ERROR: No instance importance scores found. If the scores aren\'t specified, then they must have already been calculated through the interpret_model method.')
            # Use all the previously calculated scores if none were specified
            inst_scores = self.inst_scores

        # Plot the instance importance of multiple sequences
        # Convert the instance scores data into a NumPy array
        if type(inst_scores) is torch.Tensor:
            inst_scores = inst_scores.detach().numpy()
        elif type(inst_scores) is list:
            inst_scores = np.array(inst_scores)

        # if is not tensor_idx:
        # [TODO] Search for the index associated to the specific ID asked for by the user
        # [TODO] Allow to search for multiple indeces and generate a multiple patients time series plot from it

        if len(inst_scores.shape) == 1 or (seq_id is not None and type(seq_id) is not list):
            # True sequence length of the current id's data
            if seq_len is None:
                seq_len = self.seq_len_dict[orig_data[seq_id, 0, self.id_column_num].item()]

            # [TODO] Add a prediction probability bar plot like in the multiple sequences case

            # Plot the instance importance of one sequence
            plot_data = [go.Bar(
                            x = list(range(seq_len)),
                            y = inst_scores[seq_id, :seq_len],
                            marker=dict(color=du.utils.set_bar_color(inst_scores, seq_id, seq_len,
                                                                     threshold=threshold,
                                                                     pos_color=POS_COLOR,
                                                                     neg_color=NEG_COLOR))
                          )]
            layout = go.Layout(
                                title=f'Instance importance scores for ID {int(orig_data[id, 0, self.id_column_num])}',
                                xaxis=dict(title='Instance'),
                                yaxis=dict(title='Importance scores')
                              )
        else:
            if seq_id is None:
                # Use all the sequences data if a subset isn't specified
                seq_id = list(range(inst_scores.shape[0]))
            # Select the desired data according to the specified IDs
            inst_scores = inst_scores[seq_id, :]
            orig_data = orig_data[seq_id, :, :]
            # Unique patient IDs in string format
            patients = [str(int(item)) for item in [tensor.item()
                        for tensor in list(orig_data[:, 0, self.id_column_num])]]
            if uniform_spacing is True:
                # Sequence instances count, used as X in the plot
                seq_insts_x = [list(range(inst_scores.shape[1]))
                               for patient in range(len(patients))]
            else:
                # Use the original timestamp values as the X axis
                seq_insts_x = [int(tensor) for seq_list
                               in [list(ts_array) for ts_array in list(orig_data[:, :, self.inst_column_num])]
                               for tensor in seq_list]
            # Patients ids repeated max sequence length times, used as Y in the plot
            patients_y = [[patient]*inst_scores.shape[1] for patient in list(patients)]
            # Flatten seq_insts and patients_y
            seq_insts_x = list(np.array(seq_insts_x).flatten())
            patients_y = list(np.array(patients_y).flatten())
            # Define colors for the data points based on their normalized scores (from 0 to 1 instead of -1 to 1)
            colors = [val for val in inst_scores.flatten()]
            # Count the number of already deleted paddings
            count = 0

            for i in range(inst_scores.shape[0]):
                for j in range(inst_scores.shape[1]):
                    if inst_scores[i, j] == self.padding_value:
                        # Delete elements that represent paddings, not real instances
                        del seq_insts_x[i*inst_scores.shape[1]+j-count]
                        del patients_y[i*inst_scores.shape[1]+j-count]
                        del colors[i*inst_scores.shape[1]+j-count]
                        # Increment the counting of already deleted items
                        count += 1

            if show_pred_prob is True:
                if pred_prob is None:
                    if labels is None:
                        raise Exception('ERROR: By setting `show_pred_prob` to True, either the prediction probabilities (pred_prob) or the labels must be provided.')
                    # Calculate the prediction probabilities for the provided data
                    pred_prob, _ = du.deep_learning.model_inference(self.model, data=(orig_data, labels),
                                                                    metrics=[''], model_type=self.model_type,
                                                                    is_custom=self.is_custom,
                                                                    seq_len_dict=self.seq_len_dict,
                                                                    padding_value=self.padding_value,
                                                                    output_rounded=False,
                                                                    seq_final_outputs=True,
                                                                    cols_to_remove=[self.id_column_num, self.inst_column_num],
                                                                    already_embedded=self.already_embedded)
                # Convert the prediction probability data into a NumPy array
                if type(pred_prob) is torch.Tensor:
                    pred_prob = pred_prob.detach().numpy()
                elif type(pred_prob) is list:
                    pred_prob = np.array(pred_prob)
                # Select the desired data according to the specified IDs
                pred_prob = pred_prob[seq_id]
                # Colors to use in the prediction probability bar plots
                pred_colors = cl.scales['8']['div']['RdYlGn']
                # Create "percentage bar" plots through pairs of unfilled and filled rectangles
                shapes_list = []
                # Starting y coordinate of the first shape
                y0 = -0.25
                # Height of the shapes (y length)
                step = 0.5
                # Maximum width of the shapes
                max_width = 1
                for i in range(len(patients)):
                    # Set the starting x coordinate to after the last data point
                    x0 = inst_scores.shape[1]
                    # Set the filling length of the shape
                    x1_fill = x0 + pred_prob[i] * max_width
                    shape_unfilled = {
                                        'type': 'rect',
                                        'x0': x0,
                                        'y0': y0,
                                        'x1': x0 + max_width,
                                        'y1': y0 + step,
                                        'line': {
                                                    'color': 'rgba(0, 0, 0, 1)',
                                                    'width': 2,
                                                },
                                    }
                    shape_filled = {
                                        'type': 'rect',
                                        'x0': x0,
                                        'y0': y0,
                                        'x1': x1_fill,
                                        'y1': y0 + step,
                                        'fillcolor': pred_colors[int(len(pred_colors)-1-max(pred_prob[i]*len(pred_colors)-1, 0))]
                                    }
                    shapes_list.append(shape_unfilled)
                    shapes_list.append(shape_filled)
                    # Set the starting y coordinate for the next shapes
                    y0 = y0 + 2 * step

                # Getting points along the percentage bar plots
                x_range = [list(np.array(range(0, 10, 1))*0.1+inst_scores.shape[1]) for idx in range(len(patients))]
                # Flatten the list
                text_x = [item for sublist in x_range for item in sublist]
                # Y coordinates of the prediction probability text
                text_y = [patient for patient in patients for idx in range(10)]
                # Prediction probabilities in text form, to appear in the plot
                text_content = [pred_prob[idx] for idx in range(len(pred_prob)) for i in range(10)]
                # [TODO] Ajdust the zoom so that the initial plot doens't block part of the first and last sequences that show up

            # Create plotly chart
            plot_data = [dict(
                x=seq_insts_x,
                y=patients_y,
                marker=dict(
                    color=colors,
                    size=12,
                    line = dict(
                        color = 'black',
                        width = 1
                    ),
                    colorscale=[[0, 'rgba(30,136,229,1)'], [0.5, 'white'], [1, 'rgba(255,13,87,1)']],
                    cmax=1,
                    cmin=-1,
                ),
                mode='markers',
                type='scatter',
                hoverinfo='x+y'
            )]
            layout = dict(
                paper_bgcolor=background_color,
                plot_bgcolor=background_color,
                font=dict(
                    family=font_family,
                    size=font_size,
                    color=font_color
                ),
                xaxis=dict(
                    title='Instance',
                    showgrid=False,
                    zeroline=False
                ),
                yaxis=dict(
                    title='Patient ID',
                    showgrid=False,
                    zeroline=False,
                    type='category'
                ),
                hovermode='closest',
                showlegend=False,
                clickmode=click_mode
            )
            if show_title is True:
                layout['title'] = 'Instance importance'
                layout['margin'] = dict(l=0, r=0, t=30, b=0, pad=0)
            else:
                layout['margin'] = dict(l=0, r=0, t=0, b=0, pad=0)
            if show_colorbar is True:
                layout['meta'] = dict()
                layout['meta']['colorbar'] = dict(title='Scores')
            if show_pred_prob is True:
                # Add hover text to indicate the final output probabilities
                prob_hover_info = go.Scatter(
                    x=text_x,
                    y=text_y,
                    text=text_content,
                    mode='text',
                    textfont=dict(size = 1, color='#ffffff'),
                    hoverinfo='y+text'
                )
                plot_data.append(prob_hover_info)
                # Add final output probabilities bar plots
                layout['shapes'] = shapes_list
            if len(patients) > max_seq:
                # Prevent cramming too many sequences into the plot
                layout['yaxis']['range'] = [patients[max_seq], patients[0]]
        # Show the plot
        fig = go.Figure(plot_data, layout)

        if get_fig_obj:
            # Only return the figure object if specified by the user
            return fig
        else:
            py.iplot(fig)
            return

    # [TODO] Develop function to explain, in text form, why a given input data has a certain output.
    # The results gather with instance and feature importance, as well as counter-examples, should
    # be used.
    # def explain_output(self, data, detailed_explanation=True):
        # if detailed_explanation:
        #     inst_scores, feat_scores = self.interpret_model(test_data=data, instance_importance=True,
        #                                                     feature_importance=True, fast_calc=False)
        #
            # [TODO] Explain the most important instances and most important features on those instances
            # [TODO] Compare with counter-examples, i.e. cases where the classification was different
        # else:
        #     inst_scores, feat_scores = self.interpret_model(test_data=data, instance_importance=True,
        #                                                     feature_importance=True, fast_calc=True)
        #
            # [TODO] Explain the most important instances and most important features on those instances

    # [TODO] Define an automatic method to discover which embedded category was more
    # important by doing inference on individual embeddings of each category separately,
    # seeing which one caused a bigger change in the output.

    def shap_values_df(self):
        '''Create a dataframe that contains both the original data used in the
        interpretation of the model and the resulting SHAP values.

        Returns
        -------
        data_n_shap_df : pandas.DataFrame
            Dataframe that contains both the original data used in the
            interpretation of the model and the resulting SHAP values.'''
        # [TODO] Add option to handle pre-calculated SHAP values
        # (pre-defined data and SHAP values, outside of the Model Interpreter)
        # Join the original data and the features' SHAP values
        data_n_shap = np.concatenate([self.test_data.numpy(), self.test_labels.unsqueeze(2).numpy(), self.feat_scores], axis=2)
        # Reshape into a 2D format
        data_n_shap = data_n_shap.reshape(-1, data_n_shap.shape[-1])
        # Remove padding samples
        data_n_shap = data_n_shap[[self.padding_value not in row for row in data_n_shap]]
        # Define the column names list
        shap_column_names = [f'{feature}_shap' for feature in self.feat_names]
        column_names = ([self.id_column_name] + [self.inst_column_name] + self.feat_names
                        + [self.label_column_name] + shap_column_names)
        # Create the dataframe
        data_n_shap_df = pd.DataFrame(data=data_n_shap, columns=column_names)
        return data_n_shap_df

Functions

def calc_instance_score(model, sequence_data, instance, ref_output, x_length, occlusion_wgt=0.7, id_column=0, inst_column=1)

Calculate the instance importance score for a given instance.

Parameters

model : nn.Module: Machine learning model which will be interpreted.
sequence_data : torch.Tensor: Data corresponding to the data sequence to which the current instance belongs to.
instance : int: Number of the instance in the sequence. e.g. in a medical time series, the second clinical visit of a patient would be the instance number 1 (counting starts at 0).
ref_output : torch.Tensor: Original model outputs of each instance in the sequence.
x_length : int: True sequence length, dismissing padding.
occlusion_wgt : float, default 0.7: Weight given to the occlusion part of the instance importance score. This scores is calculated as a weighted average of the instance's influence on the final output and the variation of the output probability, between the current instance and the previous one. As such, this weight should have a value between 0 and 1, with the output variation receiving the remaining weight (1 - occlusion_wgt), where 0 corresponds to not using the occlusion component at all, 0.5 is a normal, unweighted average and 1 deactivates the use of the output variation part. If the value wasn't specified in the intepreter's initialization nor in the method argument, it will default to 0.7
id_column : int, default 0: Number of the column which corresponds to the subject identifier in the data tensor.
inst_column : int, default 1: Number of the column which corresponds to the instance or timestamp identifier in the data tensor.

Returns

inst_score : float: Instance importance score calculated for the current instance, with the specified parameters.

Expand source code

def calc_instance_score(model, sequence_data, instance, ref_output, x_length,
                        occlusion_wgt=0.7, id_column=0, inst_column=1):
    '''Calculate the instance importance score for a given instance.

    Parameters
    ----------
    model : nn.Module
        Machine learning model which will be interpreted.
    sequence_data : torch.Tensor
        Data corresponding to the data sequence to which the current instance
        belongs to.
    instance : int
        Number of the instance in the sequence. e.g. in a medical time series,
        the second clinical visit of a patient would be the instance number 1
        (counting starts at 0).
    ref_output : torch.Tensor
        Original model outputs of each instance in the sequence.
    x_length : int
        True sequence length, dismissing padding.
    occlusion_wgt : float, default 0.7
            Weight given to the occlusion part of the instance importance score.
            This scores is calculated as a weighted average of the instance's
            influence on the final output and the variation of the output
            probability, between the current instance and the previous one. As
            such, this weight should have a value between 0 and 1, with the
            output variation receiving the remaining weight (1 - occlusion_wgt),
            where 0 corresponds to not using the occlusion component at all, 0.5
            is a normal, unweighted average and 1 deactivates the use of the
            output variation part. If the value wasn't specified in the
            intepreter's initialization nor in the method argument, it will
            default to 0.7
    id_column : int, default 0
            Number of the column which corresponds to the subject identifier in
            the data tensor.
    inst_column : int, default 1
        Number of the column which corresponds to the instance or timestamp
        identifier in the data tensor.

    Returns
    -------
    inst_score : float
        Instance importance score calculated for the current instance, with the
        specified parameters.
    '''
    # Remove identifier columns from the data
    sequence_data = du.deep_learning.remove_tensor_column(sequence_data, [id_column, inst_column], inplace=True)
    # Indeces without the instance that is being analyzed
    instances_idx = list(range(sequence_data.shape[0]))
    instances_idx.remove(instance)
    # Sequence data without the instance that is being analyzed
    sequence_data = sequence_data[instances_idx, :]
    # Add a third dimension for the data to be readable by the model
    sequence_data = sequence_data.unsqueeze(0)
    # Update the sequence length as the instance is removed
    new_seq_length = x_length-1
    # Calculate the output without the instance that is being analyzed
    new_output = model(sequence_data[:, :new_seq_length, :])
    # Only use the last output (i.e. the one from the last instance of the sequence)
    new_output = new_output[new_seq_length-1].item()
    # Flag that indicates whether the output variation component will be used in the instance importance score
    # (in a weighted average)
    use_outvar_score = ref_output.shape[0] > 1 and instance > 0
    if use_outvar_score:
        # Get the output from the previous instance
        prev_output = ref_output[instance-1].item()
        # Get the output from the current instance
        curr_output = ref_output[instance].item()
    # Get the last output
    ref_output = ref_output[x_length-1].item()
    # The instance importance score is then the difference between the output probability with the instance
    # and the probability without the instance
    inst_score = ref_output - new_output
    if instance > 0 and use_outvar_score:
        # If it's not the first instance, add the output variation characteristic in a weighted average
        inst_score = occlusion_wgt * inst_score + (1 - occlusion_wgt) * (curr_output - prev_output)
    # Apply a tanh function to make even the smaller scores (which are the most frequent) more salient
    inst_score = np.tanh(4 * inst_score)
    return inst_score

Classes

class KernelFunction (model, model_type='multivariate_rnn')

Expand source code

class KernelFunction:
    def __init__(self, model, model_type='multivariate_rnn'):
        # Save the model object to be used in the main function
        self.model = model
        # Log the model type
        model_type = model_type.lower()
        if model_type == 'multivariate_rnn' or model_type == 'mlp':
            self.model_type = model_type
        else:
            raise Exception(f'ERROR: Invalid model type. It must be "multivariate_rnn" or "mlp", not {model_type}.')

    def f(self, data, hidden_state=None):
        '''Function that will be used in the SHAP kernel explainer, converting
        a NumPy array into the model's output.

        Parameters
        ----------
        data : numpy.ndarray
            Data corresponding to a single instance (or timestamp, in a time
            series) used in the SHAP kernel explainer.
        hidden_state : torch.Tensor or tuple of two torch.Tensor, default None
            Hidden state coming from the previous recurrent cell. If none is
            specified, the hidden state is initialized as zero.

        Returns
        -------
        output : numpy.ndarray
            Output of the model obtained with the given instance data and
            possible hidden state.
        '''
        if isinstance(data, np.ndarray):
            # Make sure the data is of type float
            data = torch.from_numpy(data).float()
        # Calculate the output
        if self.model_type == 'multivariate_rnn':
            if len(data.shape) < 3:
                data = data.unsqueeze(0)
            output = self.model(data, hidden_state=hidden_state)
        elif self.model_type == 'mlp':
            output = self.model(data)
        else:
            raise Exception(f'ERROR: Invalid model type. It must be "multivariate_rnn" or "mlp", not {self.model_type}.')
        if torch.cuda.is_available():
            return output.detach().cpu().numpy()
        else:
            return output.detach().numpy()

Methods

def f(self, data, hidden_state=None)

Function that will be used in the SHAP kernel explainer, converting a NumPy array into the model's output.

Parameters

data : numpy.ndarray: Data corresponding to a single instance (or timestamp, in a time series) used in the SHAP kernel explainer.
hidden_state : torch.Tensor or tuple of two torch.Tensor, default None: Hidden state coming from the previous recurrent cell. If none is specified, the hidden state is initialized as zero.

Returns

output : numpy.ndarray: Output of the model obtained with the given instance data and possible hidden state.

Expand source code

def f(self, data, hidden_state=None):
    '''Function that will be used in the SHAP kernel explainer, converting
    a NumPy array into the model's output.

    Parameters
    ----------
    data : numpy.ndarray
        Data corresponding to a single instance (or timestamp, in a time
        series) used in the SHAP kernel explainer.
    hidden_state : torch.Tensor or tuple of two torch.Tensor, default None
        Hidden state coming from the previous recurrent cell. If none is
        specified, the hidden state is initialized as zero.

    Returns
    -------
    output : numpy.ndarray
        Output of the model obtained with the given instance data and
        possible hidden state.
    '''
    if isinstance(data, np.ndarray):
        # Make sure the data is of type float
        data = torch.from_numpy(data).float()
    # Calculate the output
    if self.model_type == 'multivariate_rnn':
        if len(data.shape) < 3:
            data = data.unsqueeze(0)
        output = self.model(data, hidden_state=hidden_state)
    elif self.model_type == 'mlp':
        output = self.model(data)
    else:
        raise Exception(f'ERROR: Invalid model type. It must be "multivariate_rnn" or "mlp", not {self.model_type}.')
    if torch.cuda.is_available():
        return output.detach().cpu().numpy()
    else:
        return output.detach().numpy()

class ModelInterpreter (model, data=None, labels=None, model_type='multivariate_rnn', is_custom=False, already_embedded=False, seq_len_dict=None, id_column_num=None, id_column_name=None, inst_column_num=None, inst_column_name=None, label_column_num=None, label_column_name=None, fast_calc=True, SHAP_bkgnd_samples='auto', random_seed=42, feat_names=None, padding_value=999999, occlusion_wgt=0.7, total_length=None)

A machine learning model interpreter which calculates instance and feature importance.

The current focus of the class is to analyze neural networks built in the PyTorch framework, which classify sequential data with potentially variable sequence length.

Parameters

model : nn.Module: Machine learning model which will be interpreted.
data : torch.Tensor or pandas.DataFrame, default None: Data used in the interpretation, either directly by analyzing the outputs obtained with each sample or indireclty by using as background data in methods such as SHAP explainers. The data will be used in PyTorch tensor format, but the user can submit it as a pandas dataframe, which is then automatically padded and converted.
labels : torch.Tensor, default None: Labels corresponding to the data used, either specified in the input or all the data that the interpreter has.
model_type : string, default 'multivariate_rnn': Sets the type of machine learning model. Important to know what type of inference and data processing to do. Currently available options are ['multivariate_rnn', 'mlp'].
is_custom : bool, default False: If set to True, the method will assume that the model being used is a custom built one, which won't require sequence length information during the feedforward process.
already_embedded : bool, default False: If set to True, it means that the categorical features are already embedded when fetching a batch, i.e. there's no need to run the embedding layer(s) during the model's feedforward.
seq_len_dict : dict, default None: Dictionary containing the sequence lengths for each index of the original dataframe. This allows to ignore the padding done in the fixed sequence length tensor.
id_column_num : int, default None: Number of the column which corresponds to the subject identifier in the data tensor.
id_column_name : string, default None: Name of the column which corresponds to the subject identifier in the data tensor.
inst_column_num : int, default None: Number of the column which corresponds to the instance or timestamp identifier in the data tensor.
inst_column_name : string, default None: Name of the column which corresponds to the instance or timestamp identifier in the data tensor.
label_column_num : int, default None: Number of the column which corresponds to the label in the data tensor. Only needed if the data is in dataframe format.
label_column_name : string, default None: Name of the column which corresponds to the label in the data tensor. Only needed if the data is in dataframe format.
fast_calc : bool, default True: If set to True, the algorithm uses less background samples (SHAP) or optimization steps (mask filter), in order to do a fast interpretation of the model. If set to False, the process takes more time in order to get a more precise and truthful interpretation of the model's behavior, requiring longer computation times.
SHAP_bkgnd_samples : int, default 'auto': Number of samples to use as background data, in case a SHAP explainer is applied (fast_calc must be set to False).
random_seed : integer, default 42: Seed used when shuffling the data.
feat_names : list of string, default None: Column names of the dataframe associated to the data. If no list is provided, the dataframe should be given in the data argument, so as to fetch the names of the columns.
padding_value : numeric: Value to use in the padding, to fill the sequences.
occlusion_wgt : float, default 0.7: Weight given to the occlusion part of the instance importance score. This scores is calculated as a weighted average of the instance's influence on the final output and the variation of the output probability, between the current instance and the previous one. As such, this weight should have a value between 0 and 1, with the output variation receiving the remaining weight (1 - occlusion_wgt), where 0 corresponds to not using the occlusion component at all, 0.5 is a normal, unweighted average and 1 deactivates the use of the output variation part.
total_length : int, default None: If not None, the feature importance scores will be padded to have length total_length.

Expand source code

class ModelInterpreter:
    '''A machine learning model interpreter which calculates instance and
    feature importance.

    The current focus of the class is to analyze neural networks built in
    the PyTorch framework, which classify sequential data with potentially
    variable sequence length.

    Parameters
    ----------
    model : nn.Module
        Machine learning model which will be interpreted.
    data : torch.Tensor or pandas.DataFrame, default None
        Data used in the interpretation, either directly by analyzing the
        outputs obtained with each sample or indireclty by using as
        background data in methods such as SHAP explainers. The data will be
        used in PyTorch tensor format, but the user can submit it as a
        pandas dataframe, which is then automatically padded and converted.
    labels : torch.Tensor, default None
        Labels corresponding to the data used, either specified in the input
        or all the data that the interpreter has.
    model_type : string, default 'multivariate_rnn'
        Sets the type of machine learning model. Important to know what type
        of inference and data processing to do. Currently available options
        are ['multivariate_rnn', 'mlp'].
    is_custom : bool, default False
        If set to True, the method will assume that the model being used is a
        custom built one, which won't require sequence length information during
        the feedforward process.
    already_embedded : bool, default False
        If set to True, it means that the categorical features are already
        embedded when fetching a batch, i.e. there's no need to run the embedding
        layer(s) during the model's feedforward.
    seq_len_dict : dict, default None
        Dictionary containing the sequence lengths for each index of the
        original dataframe. This allows to ignore the padding done in
        the fixed sequence length tensor.
    id_column_num : int, default None
        Number of the column which corresponds to the subject identifier in
        the data tensor.
    id_column_name : string, default None
        Name of the column which corresponds to the subject identifier in
        the data tensor.
    inst_column_num : int, default None
        Number of the column which corresponds to the instance or timestamp
        identifier in the data tensor.
    inst_column_name : string, default None
        Name of the column which corresponds to the instance or timestamp
        identifier in the data tensor.
    label_column_num : int, default None
        Number of the column which corresponds to the label in the data
        tensor. Only needed if the data is in dataframe format.
    label_column_name : string, default None
        Name of the column which corresponds to the label in the data
        tensor. Only needed if the data is in dataframe format.
    fast_calc : bool, default True
        If set to True, the algorithm uses less background samples (SHAP)
        or optimization steps (mask filter), in order to do a fast
        interpretation of the model. If set to False, the process takes
        more time in order to get a more precise and truthful
        interpretation of the model's behavior, requiring longer
        computation times.
    SHAP_bkgnd_samples : int, default 'auto'
        Number of samples to use as background data, in case a SHAP
        explainer is applied (fast_calc must be set to False).
    random_seed : integer, default 42
        Seed used when shuffling the data.
    feat_names : list of string, default None
        Column names of the dataframe associated to the data. If no list is
        provided, the dataframe should be given in the data argument, so as
        to fetch the names of the columns.
    padding_value : numeric
        Value to use in the padding, to fill the sequences.
    occlusion_wgt : float, default 0.7
        Weight given to the occlusion part of the instance importance score.
        This scores is calculated as a weighted average of the instance's
        influence on the final output and the variation of the output
        probability, between the current instance and the previous one. As
        such, this weight should have a value between 0 and 1, with the
        output variation receiving the remaining weight (1 - occlusion_wgt),
        where 0 corresponds to not using the occlusion component at all, 0.5
        is a normal, unweighted average and 1 deactivates the use of the
        output variation part.
    total_length : int, default None
        If not None, the feature importance scores will be padded to have
        length total_length.
    '''
    def __init__(self, model, data=None, labels=None, model_type='multivariate_rnn',
                 is_custom=False, already_embedded=False, seq_len_dict=None,
                 id_column_num=None, id_column_name=None, inst_column_num=None,
                 inst_column_name=None, label_column_num=None, label_column_name=None,
                 fast_calc=True, SHAP_bkgnd_samples='auto', random_seed=42,
                 feat_names=None, padding_value=999999, occlusion_wgt=0.7,
                 total_length=None):
        # Initialize parameters according to user input
        self.model = model
        self.data = data
        self.seq_len_dict = seq_len_dict
        self.id_column_num = id_column_num
        self.id_column_name = id_column_name
        self.inst_column_num = inst_column_num
        self.inst_column_name = inst_column_name
        self.label_column_num = label_column_num
        self.label_column_name = label_column_name
        self.fast_calc = fast_calc
        self.SHAP_bkgnd_samples = SHAP_bkgnd_samples
        self.random_seed = random_seed
        self.feat_names = feat_names
        self.padding_value = padding_value
        self.occlusion_wgt = occlusion_wgt
        self.total_length = total_length
        if model_type == 'multivariate_rnn' or model_type == 'mlp':
            self.model_type = model_type
        else:
            raise Exception(f'ERROR: Invalid model type. It must be "multivariate_rnn" or "mlp", not {model_type}.')
        self.is_custom = is_custom
        self.already_embedded = already_embedded

        # Put the model in evaluation mode to deactivate dropout
        self.model.eval()

        if data is not None:
            if type(data) is torch.Tensor:
                self.data = data
                self.labels = labels
                if model_type == 'mlp':
                    self.data = du.deep_learning.remove_tensor_column(data, id_column, inplace=True)
            elif type(data) is np.ndarray:
                # Convert from numpy to pytorch
                self.data = torch.from_numpy(data)
                self.labels = torch.from_numpy(labels)
                if model_type == 'mlp':
                    self.data = du.deep_learning.remove_tensor_column(data, id_column, inplace=True)
            elif type(data) is pd.DataFrame:
                # Fetch the column names, ignoring the ID column
                self.feat_names = list(data.columns)
                if self.id_column_num is None and self.id_column_name is not None:
                    # Find the ID column number
                    self.id_column_num = du.search_explore.find_col_idx(data, self.id_column_name)
                elif self.id_column_num is not None and self.id_column_name is None:
                    # Convert the ID column index to the column name
                    self.id_column_name = self.feat_names[self.id_column_num]
                if self.inst_column_num is None and self.inst_column_name is not None:
                    # Find the instance column number
                    self.inst_column_num = du.search_explore.find_col_idx(data, self.inst_column_name)
                elif self.inst_column_num is not None and self.inst_column_name is None:
                    # Convert the instance column index to the column name
                    self.inst_column_name = self.feat_names[self.inst_column_num]
                if self.total_length is None:
                    # Find the maximum sequence length, so that the ML models and their related methods can handle all sequences, which have varying sequence lengths
                    self.total_length = data.groupby(self.id_column_name)[self.inst_column_name].count().max()
                if self.label_column_num is None:
                    if self.label_column_name is not None:
                        # Find the instance column number
                        self.label_column_num = du.search_explore.find_col_idx(data, self.label_column_name)
                    else:
                        # Counter that indicates in which column we're in when searching for the label column
                        col_num = 0
                        for col in data.columns:
                            if 'label' in col:
                                # Column name corresponding to the label
                                self.label_column_name = col
                                # Column number corresponding to the label
                                self.label_column_num = col_num
                                break
                            col_num += 1
                if self.label_column_name is None:
                    self.label_column_name = self.feat_names[self.label_column_num]
                self.feat_names = du.utils.remove_from_list(self.feat_names,
                                                            to_remove=[self.id_column_name,
                                                                       self.label_column_name],
                                                            update_idx=False)
                # Fetch the column numbers, ignoring the ID column
                self.feat_num = list(range(len(data.columns)))
                self.feat_num = du.utils.remove_from_list(self.feat_num,
                                                          to_remove=self.id_column_num,
                                                          update_idx=False)
                # Also update the idx when removing the label, since the features
                # tensors aren't going to contain the label
                self.feat_num = du.utils.remove_from_list(self.feat_num,
                                                          to_remove=self.label_column_num,
                                                          update_idx=True)
                if self.model_type == 'multivariate_rnn':
                    # Also ignore the instance ID column
                    self.feat_names = du.utils.remove_from_list(self.feat_names,
                                                                to_remove=self.inst_column_name,
                                                                update_idx=False)
                    self.feat_num = du.utils.remove_from_list(self.feat_num,
                                                              to_remove=self.inst_column_num,
                                                              update_idx=False)
                    # Find the sequence lengths of the data
                    self.seq_len_dict = du.padding.get_sequence_length_dict(data, id_column=self.id_column_name, ts_column=self.inst_column_name)
                    # Pad data (to have fixed sequence length) and convert into a PyTorch tensor
                    data_tensor = du.padding.dataframe_to_padded_tensor(data, seq_len_dict=self.seq_len_dict, id_column=self.id_column_name,
                                                                        ts_column=self.inst_column_name, padding_value=padding_value,
                                                                        label_column=self.label_column_name, total_length=self.total_length,
                                                                        inplace=True)
                    # Separate labels from features
                    dataset = du.datasets.Time_Series_Dataset(data, data_tensor,
                                                              seq_len_dict=self.seq_len_dict,
                                                              label_name=self.label_column_name)
                elif self.model_type == 'mlp':
                    # Convert into a PyTorch tensor
                    data_tensor = torch.from_numpy(data.numpy())
                    # Separate labels from features
                    dataset = du.datasets.Tabular_Dataset(data_tensor, data)

                self.data = dataset.X
                self.labels = dataset.y
            else:
                raise Exception('ERROR: Invalid data type. Please provide data in a Pandas DataFrame, PyTorch Tensor or NumPy Array format.')
        else:
            # Convert the column indeces to the column names
            if self.id_column_num is None and self.id_column_name is not None:
                # Find the ID column number
                self.id_column_num = self.feat_names.index(self.id_column_name)
            elif self.id_column_num is not None and self.id_column_name is None:
                # Convert the ID column index to the column name
                self.id_column_name = self.feat_names[self.id_column_num]
            if self.inst_column_num is None and self.inst_column_name is not None:
                # Find the instance column number
                self.inst_column_num =  self.feat_names.index(self.inst_column_name)
            elif self.inst_column_num is not None and self.inst_column_name is None:
                # Convert the instance column index to the column name
                self.inst_column_name = self.feat_names[self.inst_column_num]
            if self.label_column_num is None and self.label_column_name is not None:
                # Find the label column number
                self.label_column_num =  self.feat_names.index(self.label_column_name)
            elif self.label_column_num is not None and self.label_column_name is None:
                # Convert the label column index to the column name
                self.label_column_name = self.feat_names[self.label_column_num]
            # Fetch the column numbers, ignoring the ID column
            self.feat_num = list(range(len(self.feat_names)))
            self.feat_num = du.utils.remove_from_list(self.feat_num,
                                                      to_remove=self.id_column_num,
                                                      update_idx=False)
            self.feat_names = du.utils.remove_from_list(self.feat_names,
                                                        to_remove=self.id_column_name,
                                                        update_idx=False)
            if self.label_column_num is not None:
                # Also update the idx when removing the label, since the features
                # tensors aren't going to contain the label
                self.feat_names = du.utils.remove_from_list(self.feat_names,
                                                            to_remove=self.label_column_name,
                                                            update_idx=False)
                self.feat_num = du.utils.remove_from_list(self.feat_num,
                                                        to_remove=self.label_column_num,
                                                        update_idx=True)
            if self.model_type == 'multivariate_rnn':
                # Also ignore the instance ID column
                self.feat_names = du.utils.remove_from_list(self.feat_names,
                                                            to_remove=self.inst_column_name,
                                                            update_idx=False)
                self.feat_num = du.utils.remove_from_list(self.feat_num,
                                                          to_remove=self.inst_column_num,
                                                          update_idx=False)

        # Declare explainer attribute which will store the SHAP Explainer object
        self.explainer = None
        # Declare attributes that will store importance scores (instance and feature importance)
        self.inst_scores = None
        self.feat_scores = None

    def create_bkgnd_test_sets(self, shuffle_dataset=True):
        '''Distributes the data into background and test sets and returns
        the respective data tensors.

        Parameters
        ----------
        random_seed : integer, default 42
            Seed used when shuffling the data.
        shuffle_dataset : bool, default True
            If set to True, the data of which set is shuffled.

        Returns
        -------
        bkgnd_data : torch.Tensor, default None
            Background data used in the SHAP explainer to estimate conditional
            expectations.
        test_data : torch.Tensor, default None
            A subset of data on which model interpretation will be made (i.e.
            calculating feature and/or instance importance).
        '''
        # Create data indices for training and test splits
        dataset_size = self.data.shape[0]
        indices = list(range(dataset_size))
        if shuffle_dataset:
            # Shuffle data
            np.random.seed(self.random_seed)
            np.random.shuffle(indices)
        bkgnd_indices, test_indices = indices[:self.SHAP_bkgnd_samples], indices[self.SHAP_bkgnd_samples:]

        # Get separate tensors for the background data and the test data
        bkgnd_data = self.data[bkgnd_indices]
        test_data = self.data[test_indices]
        return bkgnd_data, test_data

    def mask_filter_step(self, mask, data, ref_output, l1_coeff=1,
                         hidden_state=None, debug_loss=False):
        '''Perform a single optimization step to calculate a new version of the
        mask filter.

        Parameters
        ----------
        mask : numpy.Array
            Current mask filter, either the initial one or from the previous
            optimization iteration.
        data : torch.Tensor
            Data sample which will be used to determine the most relevant
            features. In case of multivariate sequential data, this must be a
            single instance of a sequence.
        ref_output : torch.Tensor or float
            Model's output to the original instance, with no mask filters applied.
        l1_coeff : int, default 1
            Weight given in the loss function to the L1 norm of the mask filter.
        hidden_state : torch.Tensor or tuple of two torch.Tensor, default None
            Hidden state coming from the previous recurrent cell. If none is
            specified, the hidden state is initialized as zero.
        debug_loss : bool, default False
            Debugging flag, which makes the method also return an array of the
            optimization loss.

        Returns
        -------
        mask : numpy.Array
            Current mask filter, after the performed optimization step.

        if debug_loss is True:

        loss : float
            Current loss value of the mask filter optimization.
        '''
        # Get the model's output for the masked input data
        new_output = self.model((mask * data).unsqueeze(0).unsqueeze(0), hidden_state=hidden_state)
        # Calculate the loss function
        # • Minimize the number of activated mask filter units (occluded features)
        # • Maximize the change made to the output
        loss = l1_coeff * torch.mean(torch.abs(1 - mask)) + 1 - (ref_output - new_output).pow(2)
        # Backpropagate the loss function and run an optimization step (update the mask filter)
        loss.backward(retain_graph=True)
        mask.grad = du.deep_learning.change_grad((-1) * mask.grad, mask.data)
        mask.data = mask.data + mask.grad
        # Make sure that the mask has values either 0 or 1
        mask.data.clamp_(0, 1)
        mask.data.round_()
        if debug_loss:
            return mask, loss.item()
        else:
            return mask

    # [TODO] Confirm that the mask filter is working in every scenario
    def mask_filter(self, data=None, x_lengths=None, max_iter=100, l1_coeff=1,
                    lr=0.001, recur_layer=None, see_progress=True, debug_loss=False):
        '''Calculate a mask filter for the given data samples, through an
        appropriate optimization.

        Parameters
        ----------
        data : torch.Tensor, default None
            Data sample(s) which will be used to determine the most relevant
            features. In case of multivariate sequential data, each instance will
            be analyzed seperately. If None, all data known to the model
            interpreter will be used.
        x_lengths : list of int
            Sorted list of sequence lengths, relative to the input data.
        max_iter : int, default 100
            Maximum number of iterations of the mask filter optimization, for
            each instance.
        l1_coeff : int, default 1
            Weight given in the loss function to the L1 norm of the mask filter.
        lr : float, default 0.001
            Learning rate used in the optimization algorithm.
        recur_layer : torch.nn.LSTM or torch.nn.GRU or torch.nn.RNN, default None
            Pointer to the recurrent layer in the model, if it exists. It should
            either be a LSTM, GRU or RNN network. If none is specified, the
            method will automatically search for a recurrent layer in the model.
        see_progress : bool, default True
            If set to True, a progress bar will show up indicating the execution
            of the feature importance scores calculations.
        debug_loss : bool, default False
            Debugging flag, which makes the method also return an array of the
            optimization loss.

        Returns
        -------
        mask : numpy.Array
            Output mask, after finishing the optimization for every specified
            sample. It will be inverted before returning, so as to be an array
            filled with zeros, except in the indeces corresponding to the most
            relevant features, where it will be one.

        if debug_loss is True:

        loss_mtx : np.Array
            Matrix containing the loss values of the mask filter optimization.
        '''
        # [TODO] Work on an option to use input data different from multivariate sequential
        if data is None:
            # If a subset of data to interpret isn't specified, the interpreter will use all the data
            data = self.data
        if x_lengths is None:
            # Sort the data by sequence length
            data, x_lengths = du.padding.sort_by_seq_len(data, self.seq_len_dict)
        if len(data.shape) > 1 and recur_layer is None:
            # Search for a recurrent layer
            if hasattr(self.model, 'lstm'):
                recur_layer = self.model.lstm
            elif hasattr(self.model, 'gru'):
                recur_layer = self.model.gru
            elif hasattr(self.model, 'rnn'):
                recur_layer = self.model.rnn
            else:
                raise Exception('ERROR: No recurrent layer found. Please specify it in the recur_layer argument.')

        # Confirm that the model is in evaluation mode to deactivate dropout
        self.model.eval()
        # Create a mask filter variable, initialized as an all ones tensor
        mask = torch.ones(data.shape)
        # [DEBUG] Create a loss matrix to analyse the convergence of mask filter optimizations
        loss_mtx = []

        if len(data.shape) == 3:
            # Loop to go through each sequence in the input data
            for seq in tqdm(range(data.shape[0]), disable=not see_progress):
                # Get the true length of the current sequence
                seq_len = x_lengths[seq]
                # Loop to go through each instance in the input sequence
                for inst in tqdm(range(seq_len), disable=not see_progress):
                    hidden_state = None
                    # Get the hidden state that the model receives as an input
                    if inst > 0:
                        # Get the hidden state outputed from the previous recurrent cell
                        _, hidden_state = recur_layer(data[:inst])
                        # Avoid backpropagating through previous instances
                        if type(hidden_state) is tuple:
                            hidden_state = (hidden_state[0].detach(), hidden_state[1].detach())
                        else:
                            hidden_state.detach_()
                    # Temporary mask filter for he current instance
                    tmp_mask = Variable(mask[seq, inst, :], requires_grad=True)
                    # [DEBUG] List of the current optimization's losses
                    tmp_loss_list = []
                    # Mask filter optimization loop
                    for iter in tqdm(range(max_iter), disable=not see_progress):
                        # Calculate the model's output to the original, unchanged instance data
                        ref_output = self.model(data[seq, inst, :].unsqueeze(0).unsqueeze(0), hidden_state=hidden_state)
                        # Prevent mask filter optimization from backpropagating through the reference output
                        ref_output.detach_()
                        # Perform a single optimization step
                        tmp_mask, tmp_loss = self.mask_filter_step(tmp_mask, data[seq, inst, :], ref_output, l1_coeff, hidden_state, debug_loss=debug_loss)
                        tmp_loss_list.append(tmp_loss)
                    # Save the optimized mask filter of the current instance
                    mask[seq, inst, :] = tmp_mask
                    # [DEBUG] Add the current instance's optimization logs to the overall loss matrix
                    loss_mtx.append(tmp_loss_list)

        elif len(data.shape) == 2:
            # Loop to go through each instance in the input sequence
            for inst in tqdm(range(data.shape[0]), disable=not see_progress):
                hidden_state = None
                # Get the hidden state that the model receives as an input
                if inst > 0:
                    # Get the hidden state outputed from the previous recurrent cell
                    _, hidden_state = recur_layer(data[:inst])
                    # Avoid backpropagating through previous instances
                    if type(hidden_state) is tuple:
                        hidden_state = (hidden_state[0].detach(), hidden_state[1].detach())
                    else:
                        hidden_state.detach_()
                # Temporary mask filter for he current instance
                tmp_mask = Variable(mask[inst], requires_grad=True)
                # Mask filter optimization loop
                for iter in tqdm(range(max_iter), disable=not see_progress):
                    # Calculate the model's output to the original, unchanged instance data
                    ref_output = self.model(data[inst].unsqueeze(0).unsqueeze(0), hidden_state=hidden_state)
                    # Prevent mask filter optimization from backpropagating through the reference output
                    ref_output.detach_()
                    # Perform a single optimization step
                    tmp_mask = self.mask_filter_step(tmp_mask, data[inst], ref_output, l1_coeff, hidden_state)
                # Save the optimized mask filter of the current instance
                mask[inst] = tmp_mask

        elif len(data.shape) == 1:
            # Make sure that the mask can be optimized properly
            mask.requires_grad_()
            # Mask filter optimization loop
            for iter in tqdm(range(max_iter), disable=not see_progress):
                # Calculate the model's output to the original, unchanged instance data
                ref_output = self.model(data.unsqueeze(0).unsqueeze(0), hidden_state=hidden_state)
                # Prevent mask filter optimization from backpropagating through the reference output
                ref_output.detach_()
                # Perform a single optimization step
                mask = self.mask_filter_step(mask, data, ref_output, l1_coeff)

        else:
            raise Exception(f'ERROR: Can\'t handle data with more than 3 dimensions. Submitted data with {len(data.shape)} dimensions.')

        # Return the inverted version of the mask, to atrribute 1 (one) to the most relevant features
        if debug_loss:
            return 1 - mask, loss_mtx
        else:
            return 1 - mask

    def instance_importance(self, data=None, labels=None, x_lengths=None,
                            see_progress=True, occlusion_wgt=0.7):
        '''Calculate the instance importance scores to interpret the impact of
        each instance of a sequence on the final output.

        Parameters
        ----------
        data : torch.Tensor, default None
            Optionally, the user can specify a subset of data on which model
            interpretation will be made (i.e. calculating feature and/or
            instance importance). Otherwise, all the data is used.
        labels : torch.Tensor, default None
            Labels corresponding to the data used, either specified in the input
            or all the data that the interpreter has.
        x_lengths : list of int
            Sorted list of sequence lengths, relative to the input data.
        see_progress : bool, default True
            If set to True, a progress bar will show up indicating the execution
            of the instance importance scores calculations.
        occlusion_wgt : float, default 0.7
            Weight given to the occlusion part of the instance importance score.
            This scores is calculated as a weighted average of the instance's
            influence on the final output and the variation of the output
            probability, between the current instance and the previous one. As
            such, this weight should have a value between 0 and 1, with the
            output variation receiving the remaining weight (1 - occlusion_wgt),
            where 0 corresponds to not using the occlusion component at all, 0.5
            is a normal, unweighted average and 1 deactivates the use of the
            output variation part. If the value wasn't specified in the
            intepreter's initialization nor in the method argument, it will
            default to 0.7

        Returns
        -------
        inst_scores : numpy.Array
            Array containing the importance scores of each instance in the
            given input sequences.
        '''
        if occlusion_wgt is None:
            if self.occlusion_wgt is not None:
                # Set to the class's occlusion weight value
                occlusion_wgt = self.occlusion_wgt
            else:
                # Set the occlusion weight value to 0.7 (default)
                occlusion_wgt = 0.7
                self.occlusion_wgt = occlusion_wgt

        # Confirm that the occlusion weight has a valid value (between 0 and 1)
        if occlusion_wgt > 1 or occlusion_wgt < 0:
            raise Exception(f'ERROR: Inserted invalid occlusion weight value {occlusion_wgt}. Please replace with a value between 0 and 1.')

        if occlusion_wgt < 1:
            # If the output variation is used in the calculation of the score,
            # get the reference outputs for all the instances of the sequences
            seq_final_outputs = False
        else:
            # Otherwise, only the final outputs of the sequences are retrieved
            seq_final_outputs = True

        if data is None:
            # If a subset of data to interpret isn't specified, the interpreter will use all the data
            data = self.data
            labels = self.labels
        # Make sure that the data is in type float
        data = data.float()
        # Model output when using all the original instances in the input sequences
        ref_output, _ = du.deep_learning.model_inference(self.model, data=(data, labels),
                                                         metrics=[''], model_type=self.model_type,
                                                         is_custom=self.is_custom,
                                                         seq_len_dict=self.seq_len_dict,
                                                         padding_value=self.padding_value,
                                                         seq_final_outputs=seq_final_outputs,
                                                         cols_to_remove=[self.id_column_num, self.inst_column_num],
                                                         already_embedded=self.already_embedded)

        if not seq_final_outputs:
            # Cumulative sequence lengths (true end of the sequences)
            final_seq_idx = np.cumsum(x_lengths)
            start_idx = np.roll(final_seq_idx, 1)
            start_idx[0] = 0
            ref_output = [ref_output[start_idx[i]:final_seq_idx[i]] for i in range(len(start_idx))]

        inst_scores = [[calc_instance_score(self.model, data[seq_num, :, :], inst, ref_output[seq_num],
                                            x_lengths[seq_num], occlusion_wgt, self.id_column_num,
                                            self.inst_column_num)
                        for inst in range(x_lengths[seq_num])] for seq_num in tqdm(range(data.shape[0]), disable=not see_progress)]
        # DEBUG
        # inst_scores = []
        # for seq_num in tqdm(range(data.shape[0]), disable=not see_progress):
        #     tmp_list = []
        #     for inst in range(x_lengths[seq_num]):
        #         tmp_list.append(calc_instance_score(self.model, data[seq_num, :, :], inst, ref_output[seq_num],
        #                                             x_lengths[seq_num], occlusion_wgt, self.id_column_num, self.inst_column_num))
        #     inst_scores.append(tmp_list)

        # Pad the instance scores lists so that all have the same length
        inst_scores = [du.padding.pad_list(scores_list, data.shape[1], padding_value=self.padding_value)
                       for scores_list in inst_scores]
        # Convert to a NumPy array
        inst_scores = np.array(inst_scores)
        return inst_scores

    def feature_importance(self, test_data=None, model_type=None,
                           method='shap', fast_calc=None, see_progress=True,
                           bkgnd_data=None, max_iter=100, l1_coeff=0, lr=0.001,
                           recur_layer=None, create_new_explainer=True, debug_loss=False,
                           total_length=None):
        '''Calculate the feature importance scores to interpret the impact
        of each feature in each instance's output.

        Parameters
        ----------
        test_data : torch.Tensor, default None
            Optionally, the user can specify a subset of data on which model
            interpretation will be made (i.e. calculating feature and/or
            instance importance). Otherwise, all the data is used.
        model_type : string, default 'multivariate_rnn'
            Sets the type of machine learning model. Important to know what type
            of inference and data processing to do. Currently available options
            are ['multivariate_rnn', 'mlp'].
        method : string, defautl SHAP
            Defines which interpretability technique to use. Current options
            include SHAP Kernel Explainer (default) and mask filter.
        fast_calc : bool, default None
            If set to True, the algorithm uses less background samples (SHAP)
            or optimization steps (mask filter), in order to do a fast
            interpretation of the model. If set to False, the process takes
            more time in order to get a more precise and truthful
            interpretation of the model's behavior, requiring longer
            computation times.
        see_progress : bool, default True
            If set to True, a progress bar will show up indicating the execution
            of the feature importance scores calculations.
        total_length : int, default None
            If not None, the feature importance scores will be padded to have
            length total_length.

        if fast_calc is False:

        bkgnd_data : torch.Tensor, default None
            In case of setting fast_calc to False, which makes the algorithm
            require background data in SHAP during the feature importance, the
            background data used in the explainer can be set through this
            parameter.

        if fast_calc is True:

        max_iter : int, default 100
            Maximum number of iterations of the mask filter optimization, for
            each instance.
        l1_coeff : int, default 1
            Weight given in the loss function to the L1 norm of the mask filter.
        lr : float, default 0.001
            Learning rate used in the optimization algorithm of the mask filter.
        recur_layer : torch.nn.LSTM or torch.nn.GRU or torch.nn.RNN, default None
            Pointer to the recurrent layer in the model, if it exists. It should
            either be a LSTM, GRU or RNN network. If none is specified, the
            method will automatically search for a recurrent layer in the model.
        create_new_explainer : bool, default True
            Sets if we'll create a new SHAP KernelExplainer or if we'll use a
            previously defined one in the current model interpreter object.
        debug_loss : bool, default False
            Debugging flag, which makes the method also return an array of the
            mask filter optimization loss.

        Returns
        -------
        feat_scores : numpy.Array
            Array containing the importance scores of each feature, of each
            instance, in the given input sequences.

        if debug_loss is True:

        loss_mtx : np.Array
            Matrix containing the loss values of the mask filter optimization.
        '''
        if fast_calc is None:
            # Use the predefined option if fast_calc isn't set in the function call
            fast_calc = self.fast_calc
        else:
            self.fast_calc = fast_calc
        if model_type is None:
            # Use the predefined option if model_type isn't set in the function call
            model_type = self.model_type
        else:
            self.model_type = model_type
        if total_length is None:
            # Use the predefined option if total_length isn't set in the function call
            total_length = self.total_length

        if model_type == 'multivariate_rnn':
            # Sort the test data by sequence length
            test_data, x_lengths_test = du.padding.sort_by_seq_len(test_data, self.seq_len_dict)
        # Set an indicator to log that the current model is a RNN
        isRNN = model_type == 'multivariate_rnn'
        # Set an indicator to log that the current model is a bidirectional
        isBidir = self.model.bidir

        if method.lower() == 'shap':
            if create_new_explainer is True:
                # Go through all of the steps of initialiazing a new SHAP KernelExplainer
                if fast_calc:
                    print(f'Attention: you have chosen to interpret the model using SHAP, with one background sample (all zeros), with {self.SHAP_bkgnd_samples} reevalutions per prediction applied to {test_data.shape[0]} test samples. This might take a while. Depending on your computer\'s processing power, you should do a coffee break or even go to sleep!')
                    print('Evaluating the model with a reference value of zero. This should only be done if all the data is processed in a way that, for categorical features, 0 represents missing attribute and, for continuous features, 0 represents the average value of that feature.')
                    # Use a single all zeroes sample as a reference value
                    num_id_features = sum([1 if i is not None else 0 for i in [self.id_column_num, self.inst_column_num]])
                    bkgnd_data = np.zeros((1, len(self.feat_names) + num_id_features))
                else:
                    print(f'Attention: you have chosen to interpret the model using SHAP, with {bkgnd_data.shape[0]} background samples, with {self.SHAP_bkgnd_samples} reevalutions per prediction applied to {test_data.shape[0]} test samples. This might take a while. Depending on your computer\'s processing power, you should do a coffee break or even go to sleep!')
                    if model_type.lower() == 'multivariate_rnn':
                        # Sort the background data by sequence length
                        bkgnd_data, x_lengths_bkgnd = du.padding.sort_by_seq_len(bkgnd_data, self.seq_len_dict)
                        # Convert the background data into a 2D NumPy matrix
                        bkgnd_data = du.deep_learning.ts_tensor_to_np_matrix(bkgnd_data, self.feat_num, self.padding_value)
                    elif model_type.lower() == 'mlp':
                        # Just convert background data into a NumPy matrix
                        bkgnd_data = bkgnd_data.numpy()
                if model_type.lower() == 'multivariate_rnn':
                    # Convert the test data into a 2D NumPy matrix
                    test_data = du.deep_learning.ts_tensor_to_np_matrix(test_data, self.feat_num, self.padding_value)
                elif model_type.lower() == 'mlp':
                    # Remove ID columns from the data
                    bkgnd_data = du.deep_learning.remove_tensor_column(bkgnd_data, [self.id_column_num, self.inst_column_num], inplace=True)
                    test_data = du.deep_learning.remove_tensor_column(test_data, [self.id_column_num, self.inst_column_num], inplace=True)
                    # Convert test data into a NumPy matrix
                    test_data = test_data.numpy()
                # Create a function that represents the model's feedforward operation on a single instance
                kf = KernelFunction(self.model, model_type=model_type)
                # Use the background dataset to integrate over
                print('Creating a SHAP kernel explainer...')
                # [TODO] Removing this part of directly handling pure RNN models, as the `is_custom` parameter collides
                # with other definitions of it; ignoring for now as I'm never using pure RNNs, without any modification
                # or at least wrapping in some class.
                # if self.is_custom is False:
                    # # Let SHAP find the recurrent layer
                    # recur_layer = None
                # else:
                # When using custom models, the whole model behaves as a recurrent layer
                # We just need to make sure that it returns the hidden state
                recur_layer = partial(self.model.forward, get_hidden_state=True)
                self.explainer = shap.KernelExplainer(kf.f, bkgnd_data, isRNN=isRNN, isBidir=isBidir,
                                                      model_obj=self.model, max_bkgnd_samples=100,
                                                      id_col_num=self.id_column_num,
                                                      ts_col_num=self.inst_column_num,
                                                      recur_layer=recur_layer)
            # Count the time that takes to calculate the SHAP values
            start_time = time.time()
            # Explain the predictions of the sequences in the test set
            print('Calculating feature importance scores for each instance in the test data...')
            feat_scores = self.explainer.shap_values(test_data, l1_reg='num_features(10)', nsamples=self.SHAP_bkgnd_samples, max_seq_len=total_length)
            print(f'Calculation of SHAP values took {time.time() - start_time} seconds')
            return feat_scores

        else:
            # [TODO] Fix mask filter feature importance
            # [TODO] Add fast and slower versions of the mask filter
            # Remove identifier columns from the test data
            test_data = test_data[:, :, self.feat_num]
            # Make sure that the test data is in type float
            test_data = test_data.float()
            # Count the time that takes to calculate the SHAP values
            start_time = time.time()
            # Apply mask filter
            feat_scores, loss_mtx = self.mask_filter(test_data, x_lengths_test, max_iter,
                                                     l1_coeff, lr, recur_layer, debug_loss)
            print(f'Calculation of mask filter values took {time.time() - start_time} seconds')
            if debug_loss:
                return feat_scores, loss_mtx
            else:
                return feat_scores
        # [TODO] Add more interpretability techniques, such as LIME and Agglomerative Contextual Decomposition (ACD)

    # [Bonus TODO] Upload model explainer and interpretability plots to Comet.ml
    def interpret_model(self, bkgnd_data=None, test_data=None, test_labels=None,
                        new_data=False, model_type=None, df=None,
                        instance_importance=True, feature_importance=False,
                        fast_calc=None, create_new_explainer=True,
                        see_progress=True, save_data=True, debug_loss=False,
                        total_length=None):
        '''Method to calculate scores of feature and/or instance importance, in
        order to be able to interpret a model on a given data.

        Parameters
        ----------
        bkgnd_data : torch.Tensor, default None
            In case of setting fast_calc to False, which makes the algorithm
            require background data in SHAP during the feature importance, the
            background data used in the explainer can be set through this
            parameter.
        test_data : torch.Tensor, default None
            Optionally, the user can specify a subset of data on which model
            interpretation will be made (i.e. calculating feature and/or
            instance importance) as a PyTorch tensor. Otherwise, all the data is
            used.
        test_labels : torch.Tensor, default None
            Labels corresponding to the data used, either specified in the input
            or all the data that the interpreter has.
        new_data : bool, default False
            If set to True, it indicates that the data that will be interpreted
            hasn't been seen before, i.e. it has different ids than those in the
            original dataset defined in the object initialization. This implies
            that a dataframe of the new data is provided (parameter df) so that
            the sequence lengths are calculated. Otherwise, the original
            sequence lengths known by the model interpreter are used.
        model_type : string, default None
            Sets the type of machine learning model. Important to know what type
            of inference and data processing to do. Currently available options
            are ['multivariate_rnn', 'mlp'].
        df : pandas.DataFrame, default None
            Dataframe containing the new data so as to calculate the sequence
            lengths of the new ids. Only used if new_data is set to True and
            `model_type` is 'multivariate_rnn'.
        instance_importance : bool, default True
            If set to True, instance importance is made on the data. In other
            words, the algorithm will analyze the impact that each instance of
            an input sequence had on the output.
        feature_importance : bool or string, default False
            Defines which feature importance interpretability technique to use.
            The algorithm will analyze the impact that each feature of
            an instance had on the output. This is analyzed instance by instance,
            not in the entire sequence at once. For example, from the feature
            importance alone, it's not straightforward how a value in a previous
            instance impacted the current output. Current options include SHAP
            Kernel Explainer ('shap') and 'mask filter'. If set to False, no
            feature importance will be done.
        fast_calc : bool, default None
            If set to True, the algorithm uses less background samples (SHAP)
            or optimization steps (mask filter), in order to do a fast
            interpretation of the model. If set to False, the process takes
            more time in order to get a more precise and truthful
            interpretation of the model's behavior, requiring longer
            computation times.
        create_new_explainer : bool, default True
            Sets if we'll create a new SHAP KernelExplainer or if we'll use a
            previously defined one in the current model interpreter object.
        see_progress : bool, default True
            If set to True, a progress bar will show up indicating the execution
            of the instance importance scores calculations.
        save_data : bool, default True
            If set to True, the possible background data (used in the SHAP
            explainer) and the test data (on which importance scores are
            calculated) are saved as object attributes.
        debug_loss : bool, default False
            Debugging flag, which makes the method also return an array of the
            mask filter optimization loss.
        total_length : int, default None
            If not None, the feature importance scores will be padded to have
            length total_length.

        Returns
        -------
        inst_scores : numpy.Array
            Array containing the importance scores of each instance in the
            given input sequences. Only calculated if instance_importance is set
            to True.
        feat_scores : numpy.Array
            Array containing the importance scores of each feature, of each
            instance, in the given input sequences. Only calculated if
            feature_importance is set to True.

        if debug_loss is True:

        loss_mtx : np.Array
            Matrix containing the loss values of the mask filter optimization.
        '''
        # Confirm that the model is in evaluation mode to deactivate dropout
        self.model.eval()

        if feature_importance is not None and feature_importance is not False:
            try:
                feature_importance = feature_importance.lower()
                if feature_importance != 'shap' and feature_importance != 'mask filter':
                    raise Exception(f'ERROR: Specified {feature_importance} feature importance method isn\'t valid. Available options are \"shap\" and\"mask filter\".')
            except:
                raise Exception(f'ERROR: {feature_importance} is an incorrectly defined feature importance method, as it should be a string. Available options are \"shap\" and\"mask filter\".')

        if fast_calc is None:
            # Use the predefined option if fast_calc isn't set in the function call
            fast_calc = self.fast_calc
        else:
            self.fast_calc = fast_calc
        if model_type is None:
            # Use the predefined option if model_type isn't set in the function call
            model_type = self.model_type
        else:
            self.model_type = model_type
        if total_length is None:
            # Use the predefined option if total_length isn't set in the function call
            total_length = self.total_length

        if test_labels is not None:
            if type(test_labels) is np.ndarray:
                # Convert from numpy to pytorch
                test_labels = torch.from_numpy(test_labels)

        if test_data is None:
            if fast_calc:
                # If a subset of data to interpret isn't specified, the interpreter will use all the data
                test_data = self.data
                test_labels = self.labels
            else:
                if bkgnd_data is None:
                    # Get the background and test sets from the dataset
                    bkgnd_data, test_data = self.create_bkgnd_test_sets()
                else:
                    # Get the test set from the dataset
                    _, test_data = self.create_bkgnd_test_sets()
        elif type(test_data) is np.ndarray:
            # Convert from numpy to pytorch
            test_data = torch.from_numpy(test_data)

        if model_type == 'multivariate_rnn':
            if new_data is True:
                if df is None:
                    raise Exception('ERROR: A dataframe must be provided in order to work with the new data.')
                # Find the sequence lengths of the new data
                seq_len_dict = du.padding.get_sequence_length_dict(df, id_column=self.id_column_num, ts_column=self.inst_column_num)
                # Sort the data by sequence length
                test_data, test_labels, x_lengths_test = du.padding.sort_by_seq_len(test_data, seq_len_dict, test_labels)
            else:
                # Sort the data by sequence length
                test_data, test_labels, x_lengths_test = du.padding.sort_by_seq_len(test_data, self.seq_len_dict, test_labels)

        if not fast_calc:
            if bkgnd_data is None:
                # Get the background set from the dataset
                bkgnd_data, _ = self.create_bkgnd_test_sets()
            elif type(bkgnd_data) is np.ndarray:
                # Convert from numpy to pytorch
                bkgnd_data = torch.from_numpy(bkgnd_data)

        if save_data:
            # Save the data used in the model interpretation
            self.bkgnd_data = bkgnd_data
            self.test_data = test_data
            self.test_labels = test_labels

        if instance_importance is True:
            print('Calculating instance importance scores...')
            # Calculate the scores of importance of each instance
            self.inst_scores = self.instance_importance(test_data, test_labels, x_lengths_test, see_progress)

        if feature_importance is not False:
            print('Calculating feature importance scores...')
            # Calculate the scores of importance of each feature in each instance
            if feature_importance == 'mask filter' and debug_loss:
                self.feat_scores, loss_mtx = self.feature_importance(test_data, model_type,
                                                                     feature_importance,
                                                                     fast_calc, see_progress,
                                                                     bkgnd_data, debug_loss=True,
                                                                     total_length=total_length)
            else:
                self.feat_scores = self.feature_importance(test_data, model_type, feature_importance,
                                                           fast_calc, see_progress, bkgnd_data,
                                                           create_new_explainer=create_new_explainer,
                                                           debug_loss=False, total_length=total_length)

        print('Done!')

        if instance_importance and feature_importance:
            if fast_calc and debug_loss:
                return self.inst_scores, self.feat_scores, loss_mtx
            else:
                return self.inst_scores, self.feat_scores
        elif instance_importance and not feature_importance:
            return self.inst_scores
        elif not instance_importance and feature_importance:
            if fast_calc and debug_loss:
                return self.feat_scores, loss_mtx
            else:
                return self.feat_scores
        else:
            warnings.warn('Without setting instance_importance nor feature_importance to True, the interpret_model function won\'t do anything relevant.')
            return


    def instance_importance_plot(self, orig_data=None, inst_scores=None, seq_id=None,
                                 pred_prob=None, uniform_spacing=False,
                                 show_pred_prob=True, show_title=True,
                                 show_colorbar=True, click_mode='event+select',
                                 labels=None, seq_len=None, threshold=0,
                                 get_fig_obj=False, tensor_idx=True,
                                 max_seq=10, background_color='white',
                                 font_family='Roboto', font_size=14,
                                 font_color='black'):
        '''Create a bar chart that allows visualizing instance importance scores.

        Parameters
        ----------
        orig_data : torch.Tensor or numpy.Array, default None
            Original data used in the machine learning model. Used here to fetch
            the true ID corresponding to the plotted sequence.
        inst_scores : numpy.Array, default None
            Array containing the instance importance scores to be plotted.
        seq_id : int, default None
            ID or sequence index that select which time series / sequences to
            use in the plot. If it's a single value, the method plots a single
            sequence.
        pred_prob : numpy.Array or torch.Tensor or list of floats, default None
            Array containing the prediction probabilities for each sequence in
            the input data (orig_data). Only relevant if show_pred_prob is True.
        uniform_spacing : bool, default False
            Defines whether or not the sequences are displayed with uniform
            spacing (i.e. fixed distance) between their samples.
        show_pred_prob : bool, default True
            If set to True, a percentage bar chart will be shown to the right of
            the standard instance importance plot. If `pred_prob` isn't
            specified but the labels are, the prediction probabilities will be
            automatically calculated.
        show_title : bool, default True
            If set to True, the plot will have a title displayed above.
        show_colorbar : bool, default True
            If set to True, a bar legend will be shown, corresponding each color
            to each respective value.
        click_mode : string, default 'event+select'
            Determines the mode of single click interactions. "event" is the
            default value and emits the `plotly_click` event. In addition this
            mode emits the `plotly_selected` event in drag modes "lasso" and
            "select", but with no event data attached (kept for compatibility
            reasons). The "select" flag enables selecting single data points via
            click. This mode also supports persistent selections, meaning that
            pressing Shift while clicking, adds to / subtracts from an existing
            selection. "select" with `hovermode`: "x" can be confusing, consider
            explicitly setting `hovermode`: "closest" when using this feature.
            Selection events are sent accordingly as long as "event" flag is set
            as well. When the "event" flag is missing, `plotly_click` and
            `plotly_selected` events are not fired.
        labels : torch.Tensor, default None
            Labels corresponding to the data used, either specified in the input
            or all the data that the interpreter has.
        seq_len : int, default None
            Sequence lengths which represent the true, unpadded size of the
            input sequences.
        threshold : int or float, default 0
            Value to use as a threshold in the plot's color selection. In other
            words, values that exceed this threshold will have one color while the
            remaining have a different one, as specified in the parameters.
        get_fig_obj : bool, default False
            If set to True, the function returns the object that contains the
            displayed plotly figure.
        tensor_idx : bool, default True
            If set to True, the ID specified in the respective parameter
            constitutes the index where the desired sequence resides. Otherwise,
            it's the actual unique identifier that appears in the original data.
        max_seq : int, default 10
            Maximum number of sequences to show in the plot. This is meant to
            prevent cramming too many sequences into the graph window.
        background_color : str, default 'white'
            The plot's background color. Can be set in color name (e.g. 'white'),
            hexadecimal code (e.g. '#555') or RGB (e.g. 'rgb(0,0,255)').
        font_family : str, default 'Roboto'
            Text font family to be used in the numbers shown next to the graph.
        font_size : int, default 14
            Text font size to be used in the numbers shown next to the graph.
        font_color : str, default 'black'
            Text font color to be used in the numbers shown next to the graph. Can
            be set in color name (e.g. 'white'), hexadecimal code (e.g. '#555') or
            GB (e.g. 'rgb(0,0,255)').

        Returns
        -------
        fig : plotly.graph_objs.Figure or None
            If argument get_fig_obj is set to True, the figure object is returned.
            Otherwise, nothing is returned, only the plot is showned.'''
        if orig_data is None:
            # Use all the data if none was specified
            orig_data = self.data

            if labels is None:
                labels = self.labels

        if inst_scores is None:
            if self.inst_scores is None:
                raise Exception('ERROR: No instance importance scores found. If the scores aren\'t specified, then they must have already been calculated through the interpret_model method.')
            # Use all the previously calculated scores if none were specified
            inst_scores = self.inst_scores

        # Plot the instance importance of multiple sequences
        # Convert the instance scores data into a NumPy array
        if type(inst_scores) is torch.Tensor:
            inst_scores = inst_scores.detach().numpy()
        elif type(inst_scores) is list:
            inst_scores = np.array(inst_scores)

        # if is not tensor_idx:
        # [TODO] Search for the index associated to the specific ID asked for by the user
        # [TODO] Allow to search for multiple indeces and generate a multiple patients time series plot from it

        if len(inst_scores.shape) == 1 or (seq_id is not None and type(seq_id) is not list):
            # True sequence length of the current id's data
            if seq_len is None:
                seq_len = self.seq_len_dict[orig_data[seq_id, 0, self.id_column_num].item()]

            # [TODO] Add a prediction probability bar plot like in the multiple sequences case

            # Plot the instance importance of one sequence
            plot_data = [go.Bar(
                            x = list(range(seq_len)),
                            y = inst_scores[seq_id, :seq_len],
                            marker=dict(color=du.utils.set_bar_color(inst_scores, seq_id, seq_len,
                                                                     threshold=threshold,
                                                                     pos_color=POS_COLOR,
                                                                     neg_color=NEG_COLOR))
                          )]
            layout = go.Layout(
                                title=f'Instance importance scores for ID {int(orig_data[id, 0, self.id_column_num])}',
                                xaxis=dict(title='Instance'),
                                yaxis=dict(title='Importance scores')
                              )
        else:
            if seq_id is None:
                # Use all the sequences data if a subset isn't specified
                seq_id = list(range(inst_scores.shape[0]))
            # Select the desired data according to the specified IDs
            inst_scores = inst_scores[seq_id, :]
            orig_data = orig_data[seq_id, :, :]
            # Unique patient IDs in string format
            patients = [str(int(item)) for item in [tensor.item()
                        for tensor in list(orig_data[:, 0, self.id_column_num])]]
            if uniform_spacing is True:
                # Sequence instances count, used as X in the plot
                seq_insts_x = [list(range(inst_scores.shape[1]))
                               for patient in range(len(patients))]
            else:
                # Use the original timestamp values as the X axis
                seq_insts_x = [int(tensor) for seq_list
                               in [list(ts_array) for ts_array in list(orig_data[:, :, self.inst_column_num])]
                               for tensor in seq_list]
            # Patients ids repeated max sequence length times, used as Y in the plot
            patients_y = [[patient]*inst_scores.shape[1] for patient in list(patients)]
            # Flatten seq_insts and patients_y
            seq_insts_x = list(np.array(seq_insts_x).flatten())
            patients_y = list(np.array(patients_y).flatten())
            # Define colors for the data points based on their normalized scores (from 0 to 1 instead of -1 to 1)
            colors = [val for val in inst_scores.flatten()]
            # Count the number of already deleted paddings
            count = 0

            for i in range(inst_scores.shape[0]):
                for j in range(inst_scores.shape[1]):
                    if inst_scores[i, j] == self.padding_value:
                        # Delete elements that represent paddings, not real instances
                        del seq_insts_x[i*inst_scores.shape[1]+j-count]
                        del patients_y[i*inst_scores.shape[1]+j-count]
                        del colors[i*inst_scores.shape[1]+j-count]
                        # Increment the counting of already deleted items
                        count += 1

            if show_pred_prob is True:
                if pred_prob is None:
                    if labels is None:
                        raise Exception('ERROR: By setting `show_pred_prob` to True, either the prediction probabilities (pred_prob) or the labels must be provided.')
                    # Calculate the prediction probabilities for the provided data
                    pred_prob, _ = du.deep_learning.model_inference(self.model, data=(orig_data, labels),
                                                                    metrics=[''], model_type=self.model_type,
                                                                    is_custom=self.is_custom,
                                                                    seq_len_dict=self.seq_len_dict,
                                                                    padding_value=self.padding_value,
                                                                    output_rounded=False,
                                                                    seq_final_outputs=True,
                                                                    cols_to_remove=[self.id_column_num, self.inst_column_num],
                                                                    already_embedded=self.already_embedded)
                # Convert the prediction probability data into a NumPy array
                if type(pred_prob) is torch.Tensor:
                    pred_prob = pred_prob.detach().numpy()
                elif type(pred_prob) is list:
                    pred_prob = np.array(pred_prob)
                # Select the desired data according to the specified IDs
                pred_prob = pred_prob[seq_id]
                # Colors to use in the prediction probability bar plots
                pred_colors = cl.scales['8']['div']['RdYlGn']
                # Create "percentage bar" plots through pairs of unfilled and filled rectangles
                shapes_list = []
                # Starting y coordinate of the first shape
                y0 = -0.25
                # Height of the shapes (y length)
                step = 0.5
                # Maximum width of the shapes
                max_width = 1
                for i in range(len(patients)):
                    # Set the starting x coordinate to after the last data point
                    x0 = inst_scores.shape[1]
                    # Set the filling length of the shape
                    x1_fill = x0 + pred_prob[i] * max_width
                    shape_unfilled = {
                                        'type': 'rect',
                                        'x0': x0,
                                        'y0': y0,
                                        'x1': x0 + max_width,
                                        'y1': y0 + step,
                                        'line': {
                                                    'color': 'rgba(0, 0, 0, 1)',
                                                    'width': 2,
                                                },
                                    }
                    shape_filled = {
                                        'type': 'rect',
                                        'x0': x0,
                                        'y0': y0,
                                        'x1': x1_fill,
                                        'y1': y0 + step,
                                        'fillcolor': pred_colors[int(len(pred_colors)-1-max(pred_prob[i]*len(pred_colors)-1, 0))]
                                    }
                    shapes_list.append(shape_unfilled)
                    shapes_list.append(shape_filled)
                    # Set the starting y coordinate for the next shapes
                    y0 = y0 + 2 * step

                # Getting points along the percentage bar plots
                x_range = [list(np.array(range(0, 10, 1))*0.1+inst_scores.shape[1]) for idx in range(len(patients))]
                # Flatten the list
                text_x = [item for sublist in x_range for item in sublist]
                # Y coordinates of the prediction probability text
                text_y = [patient for patient in patients for idx in range(10)]
                # Prediction probabilities in text form, to appear in the plot
                text_content = [pred_prob[idx] for idx in range(len(pred_prob)) for i in range(10)]
                # [TODO] Ajdust the zoom so that the initial plot doens't block part of the first and last sequences that show up

            # Create plotly chart
            plot_data = [dict(
                x=seq_insts_x,
                y=patients_y,
                marker=dict(
                    color=colors,
                    size=12,
                    line = dict(
                        color = 'black',
                        width = 1
                    ),
                    colorscale=[[0, 'rgba(30,136,229,1)'], [0.5, 'white'], [1, 'rgba(255,13,87,1)']],
                    cmax=1,
                    cmin=-1,
                ),
                mode='markers',
                type='scatter',
                hoverinfo='x+y'
            )]
            layout = dict(
                paper_bgcolor=background_color,
                plot_bgcolor=background_color,
                font=dict(
                    family=font_family,
                    size=font_size,
                    color=font_color
                ),
                xaxis=dict(
                    title='Instance',
                    showgrid=False,
                    zeroline=False
                ),
                yaxis=dict(
                    title='Patient ID',
                    showgrid=False,
                    zeroline=False,
                    type='category'
                ),
                hovermode='closest',
                showlegend=False,
                clickmode=click_mode
            )
            if show_title is True:
                layout['title'] = 'Instance importance'
                layout['margin'] = dict(l=0, r=0, t=30, b=0, pad=0)
            else:
                layout['margin'] = dict(l=0, r=0, t=0, b=0, pad=0)
            if show_colorbar is True:
                layout['meta'] = dict()
                layout['meta']['colorbar'] = dict(title='Scores')
            if show_pred_prob is True:
                # Add hover text to indicate the final output probabilities
                prob_hover_info = go.Scatter(
                    x=text_x,
                    y=text_y,
                    text=text_content,
                    mode='text',
                    textfont=dict(size = 1, color='#ffffff'),
                    hoverinfo='y+text'
                )
                plot_data.append(prob_hover_info)
                # Add final output probabilities bar plots
                layout['shapes'] = shapes_list
            if len(patients) > max_seq:
                # Prevent cramming too many sequences into the plot
                layout['yaxis']['range'] = [patients[max_seq], patients[0]]
        # Show the plot
        fig = go.Figure(plot_data, layout)

        if get_fig_obj:
            # Only return the figure object if specified by the user
            return fig
        else:
            py.iplot(fig)
            return

    # [TODO] Develop function to explain, in text form, why a given input data has a certain output.
    # The results gather with instance and feature importance, as well as counter-examples, should
    # be used.
    # def explain_output(self, data, detailed_explanation=True):
        # if detailed_explanation:
        #     inst_scores, feat_scores = self.interpret_model(test_data=data, instance_importance=True,
        #                                                     feature_importance=True, fast_calc=False)
        #
            # [TODO] Explain the most important instances and most important features on those instances
            # [TODO] Compare with counter-examples, i.e. cases where the classification was different
        # else:
        #     inst_scores, feat_scores = self.interpret_model(test_data=data, instance_importance=True,
        #                                                     feature_importance=True, fast_calc=True)
        #
            # [TODO] Explain the most important instances and most important features on those instances

    # [TODO] Define an automatic method to discover which embedded category was more
    # important by doing inference on individual embeddings of each category separately,
    # seeing which one caused a bigger change in the output.

    def shap_values_df(self):
        '''Create a dataframe that contains both the original data used in the
        interpretation of the model and the resulting SHAP values.

        Returns
        -------
        data_n_shap_df : pandas.DataFrame
            Dataframe that contains both the original data used in the
            interpretation of the model and the resulting SHAP values.'''
        # [TODO] Add option to handle pre-calculated SHAP values
        # (pre-defined data and SHAP values, outside of the Model Interpreter)
        # Join the original data and the features' SHAP values
        data_n_shap = np.concatenate([self.test_data.numpy(), self.test_labels.unsqueeze(2).numpy(), self.feat_scores], axis=2)
        # Reshape into a 2D format
        data_n_shap = data_n_shap.reshape(-1, data_n_shap.shape[-1])
        # Remove padding samples
        data_n_shap = data_n_shap[[self.padding_value not in row for row in data_n_shap]]
        # Define the column names list
        shap_column_names = [f'{feature}_shap' for feature in self.feat_names]
        column_names = ([self.id_column_name] + [self.inst_column_name] + self.feat_names
                        + [self.label_column_name] + shap_column_names)
        # Create the dataframe
        data_n_shap_df = pd.DataFrame(data=data_n_shap, columns=column_names)
        return data_n_shap_df

Methods

def create_bkgnd_test_sets(self, shuffle_dataset=True)

Distributes the data into background and test sets and returns the respective data tensors.

Parameters

random_seed : integer, default 42: Seed used when shuffling the data.
shuffle_dataset : bool, default True: If set to True, the data of which set is shuffled.

Returns

bkgnd_data : torch.Tensor, default None: Background data used in the SHAP explainer to estimate conditional expectations.
test_data : torch.Tensor, default None: A subset of data on which model interpretation will be made (i.e. calculating feature and/or instance importance).

Expand source code

def create_bkgnd_test_sets(self, shuffle_dataset=True):
    '''Distributes the data into background and test sets and returns
    the respective data tensors.

    Parameters
    ----------
    random_seed : integer, default 42
        Seed used when shuffling the data.
    shuffle_dataset : bool, default True
        If set to True, the data of which set is shuffled.

    Returns
    -------
    bkgnd_data : torch.Tensor, default None
        Background data used in the SHAP explainer to estimate conditional
        expectations.
    test_data : torch.Tensor, default None
        A subset of data on which model interpretation will be made (i.e.
        calculating feature and/or instance importance).
    '''
    # Create data indices for training and test splits
    dataset_size = self.data.shape[0]
    indices = list(range(dataset_size))
    if shuffle_dataset:
        # Shuffle data
        np.random.seed(self.random_seed)
        np.random.shuffle(indices)
    bkgnd_indices, test_indices = indices[:self.SHAP_bkgnd_samples], indices[self.SHAP_bkgnd_samples:]

    # Get separate tensors for the background data and the test data
    bkgnd_data = self.data[bkgnd_indices]
    test_data = self.data[test_indices]
    return bkgnd_data, test_data

def feature_importance(self, test_data=None, model_type=None, method='shap', fast_calc=None, see_progress=True, bkgnd_data=None, max_iter=100, l1_coeff=0, lr=0.001, recur_layer=None, create_new_explainer=True, debug_loss=False, total_length=None)

Calculate the feature importance scores to interpret the impact of each feature in each instance's output.

Parameters

test_data : torch.Tensor, default None: Optionally, the user can specify a subset of data on which model interpretation will be made (i.e. calculating feature and/or instance importance). Otherwise, all the data is used.
model_type : string, default 'multivariate_rnn': Sets the type of machine learning model. Important to know what type of inference and data processing to do. Currently available options are ['multivariate_rnn', 'mlp'].
method : string, defautl SHAP: Defines which interpretability technique to use. Current options include SHAP Kernel Explainer (default) and mask filter.
fast_calc : bool, default None: If set to True, the algorithm uses less background samples (SHAP) or optimization steps (mask filter), in order to do a fast interpretation of the model. If set to False, the process takes more time in order to get a more precise and truthful interpretation of the model's behavior, requiring longer computation times.
see_progress : bool, default True: If set to True, a progress bar will show up indicating the execution of the feature importance scores calculations.
total_length : int, default None: If not None, the feature importance scores will be padded to have length total_length.

if fast_calc is False:

bkgnd_data : torch.Tensor, default None: In case of setting fast_calc to False, which makes the algorithm require background data in SHAP during the feature importance, the background data used in the explainer can be set through this parameter.

if fast_calc is True:

max_iter : int, default 100: Maximum number of iterations of the mask filter optimization, for each instance.
l1_coeff : int, default 1: Weight given in the loss function to the L1 norm of the mask filter.
lr : float, default 0.001: Learning rate used in the optimization algorithm of the mask filter.
recur_layer : torch.nn.LSTM or torch.nn.GRU or torch.nn.RNN, default None: Pointer to the recurrent layer in the model, if it exists. It should either be a LSTM, GRU or RNN network. If none is specified, the method will automatically search for a recurrent layer in the model.
create_new_explainer : bool, default True: Sets if we'll create a new SHAP KernelExplainer or if we'll use a previously defined one in the current model interpreter object.
debug_loss : bool, default False: Debugging flag, which makes the method also return an array of the mask filter optimization loss.

Returns

feat_scores : numpy.Array: Array containing the importance scores of each feature, of each instance, in the given input sequences.
if debug_loss is True:
loss_mtx : np.Array: Matrix containing the loss values of the mask filter optimization.

Expand source code

def feature_importance(self, test_data=None, model_type=None,
                       method='shap', fast_calc=None, see_progress=True,
                       bkgnd_data=None, max_iter=100, l1_coeff=0, lr=0.001,
                       recur_layer=None, create_new_explainer=True, debug_loss=False,
                       total_length=None):
    '''Calculate the feature importance scores to interpret the impact
    of each feature in each instance's output.

    Parameters
    ----------
    test_data : torch.Tensor, default None
        Optionally, the user can specify a subset of data on which model
        interpretation will be made (i.e. calculating feature and/or
        instance importance). Otherwise, all the data is used.
    model_type : string, default 'multivariate_rnn'
        Sets the type of machine learning model. Important to know what type
        of inference and data processing to do. Currently available options
        are ['multivariate_rnn', 'mlp'].
    method : string, defautl SHAP
        Defines which interpretability technique to use. Current options
        include SHAP Kernel Explainer (default) and mask filter.
    fast_calc : bool, default None
        If set to True, the algorithm uses less background samples (SHAP)
        or optimization steps (mask filter), in order to do a fast
        interpretation of the model. If set to False, the process takes
        more time in order to get a more precise and truthful
        interpretation of the model's behavior, requiring longer
        computation times.
    see_progress : bool, default True
        If set to True, a progress bar will show up indicating the execution
        of the feature importance scores calculations.
    total_length : int, default None
        If not None, the feature importance scores will be padded to have
        length total_length.

    if fast_calc is False:

    bkgnd_data : torch.Tensor, default None
        In case of setting fast_calc to False, which makes the algorithm
        require background data in SHAP during the feature importance, the
        background data used in the explainer can be set through this
        parameter.

    if fast_calc is True:

    max_iter : int, default 100
        Maximum number of iterations of the mask filter optimization, for
        each instance.
    l1_coeff : int, default 1
        Weight given in the loss function to the L1 norm of the mask filter.
    lr : float, default 0.001
        Learning rate used in the optimization algorithm of the mask filter.
    recur_layer : torch.nn.LSTM or torch.nn.GRU or torch.nn.RNN, default None
        Pointer to the recurrent layer in the model, if it exists. It should
        either be a LSTM, GRU or RNN network. If none is specified, the
        method will automatically search for a recurrent layer in the model.
    create_new_explainer : bool, default True
        Sets if we'll create a new SHAP KernelExplainer or if we'll use a
        previously defined one in the current model interpreter object.
    debug_loss : bool, default False
        Debugging flag, which makes the method also return an array of the
        mask filter optimization loss.

    Returns
    -------
    feat_scores : numpy.Array
        Array containing the importance scores of each feature, of each
        instance, in the given input sequences.

    if debug_loss is True:

    loss_mtx : np.Array
        Matrix containing the loss values of the mask filter optimization.
    '''
    if fast_calc is None:
        # Use the predefined option if fast_calc isn't set in the function call
        fast_calc = self.fast_calc
    else:
        self.fast_calc = fast_calc
    if model_type is None:
        # Use the predefined option if model_type isn't set in the function call
        model_type = self.model_type
    else:
        self.model_type = model_type
    if total_length is None:
        # Use the predefined option if total_length isn't set in the function call
        total_length = self.total_length

    if model_type == 'multivariate_rnn':
        # Sort the test data by sequence length
        test_data, x_lengths_test = du.padding.sort_by_seq_len(test_data, self.seq_len_dict)
    # Set an indicator to log that the current model is a RNN
    isRNN = model_type == 'multivariate_rnn'
    # Set an indicator to log that the current model is a bidirectional
    isBidir = self.model.bidir

    if method.lower() == 'shap':
        if create_new_explainer is True:
            # Go through all of the steps of initialiazing a new SHAP KernelExplainer
            if fast_calc:
                print(f'Attention: you have chosen to interpret the model using SHAP, with one background sample (all zeros), with {self.SHAP_bkgnd_samples} reevalutions per prediction applied to {test_data.shape[0]} test samples. This might take a while. Depending on your computer\'s processing power, you should do a coffee break or even go to sleep!')
                print('Evaluating the model with a reference value of zero. This should only be done if all the data is processed in a way that, for categorical features, 0 represents missing attribute and, for continuous features, 0 represents the average value of that feature.')
                # Use a single all zeroes sample as a reference value
                num_id_features = sum([1 if i is not None else 0 for i in [self.id_column_num, self.inst_column_num]])
                bkgnd_data = np.zeros((1, len(self.feat_names) + num_id_features))
            else:
                print(f'Attention: you have chosen to interpret the model using SHAP, with {bkgnd_data.shape[0]} background samples, with {self.SHAP_bkgnd_samples} reevalutions per prediction applied to {test_data.shape[0]} test samples. This might take a while. Depending on your computer\'s processing power, you should do a coffee break or even go to sleep!')
                if model_type.lower() == 'multivariate_rnn':
                    # Sort the background data by sequence length
                    bkgnd_data, x_lengths_bkgnd = du.padding.sort_by_seq_len(bkgnd_data, self.seq_len_dict)
                    # Convert the background data into a 2D NumPy matrix
                    bkgnd_data = du.deep_learning.ts_tensor_to_np_matrix(bkgnd_data, self.feat_num, self.padding_value)
                elif model_type.lower() == 'mlp':
                    # Just convert background data into a NumPy matrix
                    bkgnd_data = bkgnd_data.numpy()
            if model_type.lower() == 'multivariate_rnn':
                # Convert the test data into a 2D NumPy matrix
                test_data = du.deep_learning.ts_tensor_to_np_matrix(test_data, self.feat_num, self.padding_value)
            elif model_type.lower() == 'mlp':
                # Remove ID columns from the data
                bkgnd_data = du.deep_learning.remove_tensor_column(bkgnd_data, [self.id_column_num, self.inst_column_num], inplace=True)
                test_data = du.deep_learning.remove_tensor_column(test_data, [self.id_column_num, self.inst_column_num], inplace=True)
                # Convert test data into a NumPy matrix
                test_data = test_data.numpy()
            # Create a function that represents the model's feedforward operation on a single instance
            kf = KernelFunction(self.model, model_type=model_type)
            # Use the background dataset to integrate over
            print('Creating a SHAP kernel explainer...')
            # [TODO] Removing this part of directly handling pure RNN models, as the `is_custom` parameter collides
            # with other definitions of it; ignoring for now as I'm never using pure RNNs, without any modification
            # or at least wrapping in some class.
            # if self.is_custom is False:
                # # Let SHAP find the recurrent layer
                # recur_layer = None
            # else:
            # When using custom models, the whole model behaves as a recurrent layer
            # We just need to make sure that it returns the hidden state
            recur_layer = partial(self.model.forward, get_hidden_state=True)
            self.explainer = shap.KernelExplainer(kf.f, bkgnd_data, isRNN=isRNN, isBidir=isBidir,
                                                  model_obj=self.model, max_bkgnd_samples=100,
                                                  id_col_num=self.id_column_num,
                                                  ts_col_num=self.inst_column_num,
                                                  recur_layer=recur_layer)
        # Count the time that takes to calculate the SHAP values
        start_time = time.time()
        # Explain the predictions of the sequences in the test set
        print('Calculating feature importance scores for each instance in the test data...')
        feat_scores = self.explainer.shap_values(test_data, l1_reg='num_features(10)', nsamples=self.SHAP_bkgnd_samples, max_seq_len=total_length)
        print(f'Calculation of SHAP values took {time.time() - start_time} seconds')
        return feat_scores

    else:
        # [TODO] Fix mask filter feature importance
        # [TODO] Add fast and slower versions of the mask filter
        # Remove identifier columns from the test data
        test_data = test_data[:, :, self.feat_num]
        # Make sure that the test data is in type float
        test_data = test_data.float()
        # Count the time that takes to calculate the SHAP values
        start_time = time.time()
        # Apply mask filter
        feat_scores, loss_mtx = self.mask_filter(test_data, x_lengths_test, max_iter,
                                                 l1_coeff, lr, recur_layer, debug_loss)
        print(f'Calculation of mask filter values took {time.time() - start_time} seconds')
        if debug_loss:
            return feat_scores, loss_mtx
        else:
            return feat_scores

def instance_importance(self, data=None, labels=None, x_lengths=None, see_progress=True, occlusion_wgt=0.7)

Calculate the instance importance scores to interpret the impact of each instance of a sequence on the final output.

Parameters

data : torch.Tensor, default None: Optionally, the user can specify a subset of data on which model interpretation will be made (i.e. calculating feature and/or instance importance). Otherwise, all the data is used.
labels : torch.Tensor, default None: Labels corresponding to the data used, either specified in the input or all the data that the interpreter has.
x_lengths : list of int: Sorted list of sequence lengths, relative to the input data.
see_progress : bool, default True: If set to True, a progress bar will show up indicating the execution of the instance importance scores calculations.
occlusion_wgt : float, default 0.7: Weight given to the occlusion part of the instance importance score. This scores is calculated as a weighted average of the instance's influence on the final output and the variation of the output probability, between the current instance and the previous one. As such, this weight should have a value between 0 and 1, with the output variation receiving the remaining weight (1 - occlusion_wgt), where 0 corresponds to not using the occlusion component at all, 0.5 is a normal, unweighted average and 1 deactivates the use of the output variation part. If the value wasn't specified in the intepreter's initialization nor in the method argument, it will default to 0.7

Returns

inst_scores : numpy.Array: Array containing the importance scores of each instance in the given input sequences.

Expand source code

def instance_importance(self, data=None, labels=None, x_lengths=None,
                        see_progress=True, occlusion_wgt=0.7):
    '''Calculate the instance importance scores to interpret the impact of
    each instance of a sequence on the final output.

    Parameters
    ----------
    data : torch.Tensor, default None
        Optionally, the user can specify a subset of data on which model
        interpretation will be made (i.e. calculating feature and/or
        instance importance). Otherwise, all the data is used.
    labels : torch.Tensor, default None
        Labels corresponding to the data used, either specified in the input
        or all the data that the interpreter has.
    x_lengths : list of int
        Sorted list of sequence lengths, relative to the input data.
    see_progress : bool, default True
        If set to True, a progress bar will show up indicating the execution
        of the instance importance scores calculations.
    occlusion_wgt : float, default 0.7
        Weight given to the occlusion part of the instance importance score.
        This scores is calculated as a weighted average of the instance's
        influence on the final output and the variation of the output
        probability, between the current instance and the previous one. As
        such, this weight should have a value between 0 and 1, with the
        output variation receiving the remaining weight (1 - occlusion_wgt),
        where 0 corresponds to not using the occlusion component at all, 0.5
        is a normal, unweighted average and 1 deactivates the use of the
        output variation part. If the value wasn't specified in the
        intepreter's initialization nor in the method argument, it will
        default to 0.7

    Returns
    -------
    inst_scores : numpy.Array
        Array containing the importance scores of each instance in the
        given input sequences.
    '''
    if occlusion_wgt is None:
        if self.occlusion_wgt is not None:
            # Set to the class's occlusion weight value
            occlusion_wgt = self.occlusion_wgt
        else:
            # Set the occlusion weight value to 0.7 (default)
            occlusion_wgt = 0.7
            self.occlusion_wgt = occlusion_wgt

    # Confirm that the occlusion weight has a valid value (between 0 and 1)
    if occlusion_wgt > 1 or occlusion_wgt < 0:
        raise Exception(f'ERROR: Inserted invalid occlusion weight value {occlusion_wgt}. Please replace with a value between 0 and 1.')

    if occlusion_wgt < 1:
        # If the output variation is used in the calculation of the score,
        # get the reference outputs for all the instances of the sequences
        seq_final_outputs = False
    else:
        # Otherwise, only the final outputs of the sequences are retrieved
        seq_final_outputs = True

    if data is None:
        # If a subset of data to interpret isn't specified, the interpreter will use all the data
        data = self.data
        labels = self.labels
    # Make sure that the data is in type float
    data = data.float()
    # Model output when using all the original instances in the input sequences
    ref_output, _ = du.deep_learning.model_inference(self.model, data=(data, labels),
                                                     metrics=[''], model_type=self.model_type,
                                                     is_custom=self.is_custom,
                                                     seq_len_dict=self.seq_len_dict,
                                                     padding_value=self.padding_value,
                                                     seq_final_outputs=seq_final_outputs,
                                                     cols_to_remove=[self.id_column_num, self.inst_column_num],
                                                     already_embedded=self.already_embedded)

    if not seq_final_outputs:
        # Cumulative sequence lengths (true end of the sequences)
        final_seq_idx = np.cumsum(x_lengths)
        start_idx = np.roll(final_seq_idx, 1)
        start_idx[0] = 0
        ref_output = [ref_output[start_idx[i]:final_seq_idx[i]] for i in range(len(start_idx))]

    inst_scores = [[calc_instance_score(self.model, data[seq_num, :, :], inst, ref_output[seq_num],
                                        x_lengths[seq_num], occlusion_wgt, self.id_column_num,
                                        self.inst_column_num)
                    for inst in range(x_lengths[seq_num])] for seq_num in tqdm(range(data.shape[0]), disable=not see_progress)]
    # DEBUG
    # inst_scores = []
    # for seq_num in tqdm(range(data.shape[0]), disable=not see_progress):
    #     tmp_list = []
    #     for inst in range(x_lengths[seq_num]):
    #         tmp_list.append(calc_instance_score(self.model, data[seq_num, :, :], inst, ref_output[seq_num],
    #                                             x_lengths[seq_num], occlusion_wgt, self.id_column_num, self.inst_column_num))
    #     inst_scores.append(tmp_list)

    # Pad the instance scores lists so that all have the same length
    inst_scores = [du.padding.pad_list(scores_list, data.shape[1], padding_value=self.padding_value)
                   for scores_list in inst_scores]
    # Convert to a NumPy array
    inst_scores = np.array(inst_scores)
    return inst_scores

def instance_importance_plot(self, orig_data=None, inst_scores=None, seq_id=None, pred_prob=None, uniform_spacing=False, show_pred_prob=True, show_title=True, show_colorbar=True, click_mode='event+select', labels=None, seq_len=None, threshold=0, get_fig_obj=False, tensor_idx=True, max_seq=10, background_color='white', font_family='Roboto', font_size=14, font_color='black')

Create a bar chart that allows visualizing instance importance scores.

Parameters

orig_data : torch.Tensor or numpy.Array, default None: Original data used in the machine learning model. Used here to fetch the true ID corresponding to the plotted sequence.
inst_scores : numpy.Array, default None: Array containing the instance importance scores to be plotted.
seq_id : int, default None: ID or sequence index that select which time series / sequences to use in the plot. If it's a single value, the method plots a single sequence.
pred_prob : numpy.Array or torch.Tensor or list of floats, default None: Array containing the prediction probabilities for each sequence in the input data (orig_data). Only relevant if show_pred_prob is True.
uniform_spacing : bool, default False: Defines whether or not the sequences are displayed with uniform spacing (i.e. fixed distance) between their samples.
show_pred_prob : bool, default True: If set to True, a percentage bar chart will be shown to the right of the standard instance importance plot. If pred_prob isn't specified but the labels are, the prediction probabilities will be automatically calculated.
show_title : bool, default True: If set to True, the plot will have a title displayed above.
show_colorbar : bool, default True: If set to True, a bar legend will be shown, corresponding each color to each respective value.
click_mode : string, default 'event+select': Determines the mode of single click interactions. "event" is the default value and emits the plotly_click event. In addition this mode emits the plotly_selected event in drag modes "lasso" and "select", but with no event data attached (kept for compatibility reasons). The "select" flag enables selecting single data points via click. This mode also supports persistent selections, meaning that pressing Shift while clicking, adds to / subtracts from an existing selection. "select" with hovermode: "x" can be confusing, consider explicitly setting hovermode: "closest" when using this feature. Selection events are sent accordingly as long as "event" flag is set as well. When the "event" flag is missing, plotly_click and plotly_selected events are not fired.
labels : torch.Tensor, default None: Labels corresponding to the data used, either specified in the input or all the data that the interpreter has.
seq_len : int, default None: Sequence lengths which represent the true, unpadded size of the input sequences.
threshold : int or float, default 0: Value to use as a threshold in the plot's color selection. In other words, values that exceed this threshold will have one color while the remaining have a different one, as specified in the parameters.
get_fig_obj : bool, default False: If set to True, the function returns the object that contains the displayed plotly figure.
tensor_idx : bool, default True: If set to True, the ID specified in the respective parameter constitutes the index where the desired sequence resides. Otherwise, it's the actual unique identifier that appears in the original data.
max_seq : int, default 10: Maximum number of sequences to show in the plot. This is meant to prevent cramming too many sequences into the graph window.
background_color : str, default 'white': The plot's background color. Can be set in color name (e.g. 'white'), hexadecimal code (e.g. '#555') or RGB (e.g. 'rgb(0,0,255)').
font_family : str, default 'Roboto': Text font family to be used in the numbers shown next to the graph.
font_size : int, default 14: Text font size to be used in the numbers shown next to the graph.
font_color : str, default 'black': Text font color to be used in the numbers shown next to the graph. Can be set in color name (e.g. 'white'), hexadecimal code (e.g. '#555') or GB (e.g. 'rgb(0,0,255)').

Returns

fig : plotly.graph_objs.Figure or None: If argument get_fig_obj is set to True, the figure object is returned. Otherwise, nothing is returned, only the plot is showned.

Expand source code

def instance_importance_plot(self, orig_data=None, inst_scores=None, seq_id=None,
                             pred_prob=None, uniform_spacing=False,
                             show_pred_prob=True, show_title=True,
                             show_colorbar=True, click_mode='event+select',
                             labels=None, seq_len=None, threshold=0,
                             get_fig_obj=False, tensor_idx=True,
                             max_seq=10, background_color='white',
                             font_family='Roboto', font_size=14,
                             font_color='black'):
    '''Create a bar chart that allows visualizing instance importance scores.

    Parameters
    ----------
    orig_data : torch.Tensor or numpy.Array, default None
        Original data used in the machine learning model. Used here to fetch
        the true ID corresponding to the plotted sequence.
    inst_scores : numpy.Array, default None
        Array containing the instance importance scores to be plotted.
    seq_id : int, default None
        ID or sequence index that select which time series / sequences to
        use in the plot. If it's a single value, the method plots a single
        sequence.
    pred_prob : numpy.Array or torch.Tensor or list of floats, default None
        Array containing the prediction probabilities for each sequence in
        the input data (orig_data). Only relevant if show_pred_prob is True.
    uniform_spacing : bool, default False
        Defines whether or not the sequences are displayed with uniform
        spacing (i.e. fixed distance) between their samples.
    show_pred_prob : bool, default True
        If set to True, a percentage bar chart will be shown to the right of
        the standard instance importance plot. If `pred_prob` isn't
        specified but the labels are, the prediction probabilities will be
        automatically calculated.
    show_title : bool, default True
        If set to True, the plot will have a title displayed above.
    show_colorbar : bool, default True
        If set to True, a bar legend will be shown, corresponding each color
        to each respective value.
    click_mode : string, default 'event+select'
        Determines the mode of single click interactions. "event" is the
        default value and emits the `plotly_click` event. In addition this
        mode emits the `plotly_selected` event in drag modes "lasso" and
        "select", but with no event data attached (kept for compatibility
        reasons). The "select" flag enables selecting single data points via
        click. This mode also supports persistent selections, meaning that
        pressing Shift while clicking, adds to / subtracts from an existing
        selection. "select" with `hovermode`: "x" can be confusing, consider
        explicitly setting `hovermode`: "closest" when using this feature.
        Selection events are sent accordingly as long as "event" flag is set
        as well. When the "event" flag is missing, `plotly_click` and
        `plotly_selected` events are not fired.
    labels : torch.Tensor, default None
        Labels corresponding to the data used, either specified in the input
        or all the data that the interpreter has.
    seq_len : int, default None
        Sequence lengths which represent the true, unpadded size of the
        input sequences.
    threshold : int or float, default 0
        Value to use as a threshold in the plot's color selection. In other
        words, values that exceed this threshold will have one color while the
        remaining have a different one, as specified in the parameters.
    get_fig_obj : bool, default False
        If set to True, the function returns the object that contains the
        displayed plotly figure.
    tensor_idx : bool, default True
        If set to True, the ID specified in the respective parameter
        constitutes the index where the desired sequence resides. Otherwise,
        it's the actual unique identifier that appears in the original data.
    max_seq : int, default 10
        Maximum number of sequences to show in the plot. This is meant to
        prevent cramming too many sequences into the graph window.
    background_color : str, default 'white'
        The plot's background color. Can be set in color name (e.g. 'white'),
        hexadecimal code (e.g. '#555') or RGB (e.g. 'rgb(0,0,255)').
    font_family : str, default 'Roboto'
        Text font family to be used in the numbers shown next to the graph.
    font_size : int, default 14
        Text font size to be used in the numbers shown next to the graph.
    font_color : str, default 'black'
        Text font color to be used in the numbers shown next to the graph. Can
        be set in color name (e.g. 'white'), hexadecimal code (e.g. '#555') or
        GB (e.g. 'rgb(0,0,255)').

    Returns
    -------
    fig : plotly.graph_objs.Figure or None
        If argument get_fig_obj is set to True, the figure object is returned.
        Otherwise, nothing is returned, only the plot is showned.'''
    if orig_data is None:
        # Use all the data if none was specified
        orig_data = self.data

        if labels is None:
            labels = self.labels

    if inst_scores is None:
        if self.inst_scores is None:
            raise Exception('ERROR: No instance importance scores found. If the scores aren\'t specified, then they must have already been calculated through the interpret_model method.')
        # Use all the previously calculated scores if none were specified
        inst_scores = self.inst_scores

    # Plot the instance importance of multiple sequences
    # Convert the instance scores data into a NumPy array
    if type(inst_scores) is torch.Tensor:
        inst_scores = inst_scores.detach().numpy()
    elif type(inst_scores) is list:
        inst_scores = np.array(inst_scores)

    # if is not tensor_idx:
    # [TODO] Search for the index associated to the specific ID asked for by the user
    # [TODO] Allow to search for multiple indeces and generate a multiple patients time series plot from it

    if len(inst_scores.shape) == 1 or (seq_id is not None and type(seq_id) is not list):
        # True sequence length of the current id's data
        if seq_len is None:
            seq_len = self.seq_len_dict[orig_data[seq_id, 0, self.id_column_num].item()]

        # [TODO] Add a prediction probability bar plot like in the multiple sequences case

        # Plot the instance importance of one sequence
        plot_data = [go.Bar(
                        x = list(range(seq_len)),
                        y = inst_scores[seq_id, :seq_len],
                        marker=dict(color=du.utils.set_bar_color(inst_scores, seq_id, seq_len,
                                                                 threshold=threshold,
                                                                 pos_color=POS_COLOR,
                                                                 neg_color=NEG_COLOR))
                      )]
        layout = go.Layout(
                            title=f'Instance importance scores for ID {int(orig_data[id, 0, self.id_column_num])}',
                            xaxis=dict(title='Instance'),
                            yaxis=dict(title='Importance scores')
                          )
    else:
        if seq_id is None:
            # Use all the sequences data if a subset isn't specified
            seq_id = list(range(inst_scores.shape[0]))
        # Select the desired data according to the specified IDs
        inst_scores = inst_scores[seq_id, :]
        orig_data = orig_data[seq_id, :, :]
        # Unique patient IDs in string format
        patients = [str(int(item)) for item in [tensor.item()
                    for tensor in list(orig_data[:, 0, self.id_column_num])]]
        if uniform_spacing is True:
            # Sequence instances count, used as X in the plot
            seq_insts_x = [list(range(inst_scores.shape[1]))
                           for patient in range(len(patients))]
        else:
            # Use the original timestamp values as the X axis
            seq_insts_x = [int(tensor) for seq_list
                           in [list(ts_array) for ts_array in list(orig_data[:, :, self.inst_column_num])]
                           for tensor in seq_list]
        # Patients ids repeated max sequence length times, used as Y in the plot
        patients_y = [[patient]*inst_scores.shape[1] for patient in list(patients)]
        # Flatten seq_insts and patients_y
        seq_insts_x = list(np.array(seq_insts_x).flatten())
        patients_y = list(np.array(patients_y).flatten())
        # Define colors for the data points based on their normalized scores (from 0 to 1 instead of -1 to 1)
        colors = [val for val in inst_scores.flatten()]
        # Count the number of already deleted paddings
        count = 0

        for i in range(inst_scores.shape[0]):
            for j in range(inst_scores.shape[1]):
                if inst_scores[i, j] == self.padding_value:
                    # Delete elements that represent paddings, not real instances
                    del seq_insts_x[i*inst_scores.shape[1]+j-count]
                    del patients_y[i*inst_scores.shape[1]+j-count]
                    del colors[i*inst_scores.shape[1]+j-count]
                    # Increment the counting of already deleted items
                    count += 1

        if show_pred_prob is True:
            if pred_prob is None:
                if labels is None:
                    raise Exception('ERROR: By setting `show_pred_prob` to True, either the prediction probabilities (pred_prob) or the labels must be provided.')
                # Calculate the prediction probabilities for the provided data
                pred_prob, _ = du.deep_learning.model_inference(self.model, data=(orig_data, labels),
                                                                metrics=[''], model_type=self.model_type,
                                                                is_custom=self.is_custom,
                                                                seq_len_dict=self.seq_len_dict,
                                                                padding_value=self.padding_value,
                                                                output_rounded=False,
                                                                seq_final_outputs=True,
                                                                cols_to_remove=[self.id_column_num, self.inst_column_num],
                                                                already_embedded=self.already_embedded)
            # Convert the prediction probability data into a NumPy array
            if type(pred_prob) is torch.Tensor:
                pred_prob = pred_prob.detach().numpy()
            elif type(pred_prob) is list:
                pred_prob = np.array(pred_prob)
            # Select the desired data according to the specified IDs
            pred_prob = pred_prob[seq_id]
            # Colors to use in the prediction probability bar plots
            pred_colors = cl.scales['8']['div']['RdYlGn']
            # Create "percentage bar" plots through pairs of unfilled and filled rectangles
            shapes_list = []
            # Starting y coordinate of the first shape
            y0 = -0.25
            # Height of the shapes (y length)
            step = 0.5
            # Maximum width of the shapes
            max_width = 1
            for i in range(len(patients)):
                # Set the starting x coordinate to after the last data point
                x0 = inst_scores.shape[1]
                # Set the filling length of the shape
                x1_fill = x0 + pred_prob[i] * max_width
                shape_unfilled = {
                                    'type': 'rect',
                                    'x0': x0,
                                    'y0': y0,
                                    'x1': x0 + max_width,
                                    'y1': y0 + step,
                                    'line': {
                                                'color': 'rgba(0, 0, 0, 1)',
                                                'width': 2,
                                            },
                                }
                shape_filled = {
                                    'type': 'rect',
                                    'x0': x0,
                                    'y0': y0,
                                    'x1': x1_fill,
                                    'y1': y0 + step,
                                    'fillcolor': pred_colors[int(len(pred_colors)-1-max(pred_prob[i]*len(pred_colors)-1, 0))]
                                }
                shapes_list.append(shape_unfilled)
                shapes_list.append(shape_filled)
                # Set the starting y coordinate for the next shapes
                y0 = y0 + 2 * step

            # Getting points along the percentage bar plots
            x_range = [list(np.array(range(0, 10, 1))*0.1+inst_scores.shape[1]) for idx in range(len(patients))]
            # Flatten the list
            text_x = [item for sublist in x_range for item in sublist]
            # Y coordinates of the prediction probability text
            text_y = [patient for patient in patients for idx in range(10)]
            # Prediction probabilities in text form, to appear in the plot
            text_content = [pred_prob[idx] for idx in range(len(pred_prob)) for i in range(10)]
            # [TODO] Ajdust the zoom so that the initial plot doens't block part of the first and last sequences that show up

        # Create plotly chart
        plot_data = [dict(
            x=seq_insts_x,
            y=patients_y,
            marker=dict(
                color=colors,
                size=12,
                line = dict(
                    color = 'black',
                    width = 1
                ),
                colorscale=[[0, 'rgba(30,136,229,1)'], [0.5, 'white'], [1, 'rgba(255,13,87,1)']],
                cmax=1,
                cmin=-1,
            ),
            mode='markers',
            type='scatter',
            hoverinfo='x+y'
        )]
        layout = dict(
            paper_bgcolor=background_color,
            plot_bgcolor=background_color,
            font=dict(
                family=font_family,
                size=font_size,
                color=font_color
            ),
            xaxis=dict(
                title='Instance',
                showgrid=False,
                zeroline=False
            ),
            yaxis=dict(
                title='Patient ID',
                showgrid=False,
                zeroline=False,
                type='category'
            ),
            hovermode='closest',
            showlegend=False,
            clickmode=click_mode
        )
        if show_title is True:
            layout['title'] = 'Instance importance'
            layout['margin'] = dict(l=0, r=0, t=30, b=0, pad=0)
        else:
            layout['margin'] = dict(l=0, r=0, t=0, b=0, pad=0)
        if show_colorbar is True:
            layout['meta'] = dict()
            layout['meta']['colorbar'] = dict(title='Scores')
        if show_pred_prob is True:
            # Add hover text to indicate the final output probabilities
            prob_hover_info = go.Scatter(
                x=text_x,
                y=text_y,
                text=text_content,
                mode='text',
                textfont=dict(size = 1, color='#ffffff'),
                hoverinfo='y+text'
            )
            plot_data.append(prob_hover_info)
            # Add final output probabilities bar plots
            layout['shapes'] = shapes_list
        if len(patients) > max_seq:
            # Prevent cramming too many sequences into the plot
            layout['yaxis']['range'] = [patients[max_seq], patients[0]]
    # Show the plot
    fig = go.Figure(plot_data, layout)

    if get_fig_obj:
        # Only return the figure object if specified by the user
        return fig
    else:
        py.iplot(fig)
        return

def interpret_model(self, bkgnd_data=None, test_data=None, test_labels=None, new_data=False, model_type=None, df=None, instance_importance=True, feature_importance=False, fast_calc=None, create_new_explainer=True, see_progress=True, save_data=True, debug_loss=False, total_length=None)

Method to calculate scores of feature and/or instance importance, in order to be able to interpret a model on a given data.

Parameters

bkgnd_data : torch.Tensor, default None: In case of setting fast_calc to False, which makes the algorithm require background data in SHAP during the feature importance, the background data used in the explainer can be set through this parameter.
test_data : torch.Tensor, default None: Optionally, the user can specify a subset of data on which model interpretation will be made (i.e. calculating feature and/or instance importance) as a PyTorch tensor. Otherwise, all the data is used.
test_labels : torch.Tensor, default None: Labels corresponding to the data used, either specified in the input or all the data that the interpreter has.
new_data : bool, default False: If set to True, it indicates that the data that will be interpreted hasn't been seen before, i.e. it has different ids than those in the original dataset defined in the object initialization. This implies that a dataframe of the new data is provided (parameter df) so that the sequence lengths are calculated. Otherwise, the original sequence lengths known by the model interpreter are used.
model_type : string, default None: Sets the type of machine learning model. Important to know what type of inference and data processing to do. Currently available options are ['multivariate_rnn', 'mlp'].
df : pandas.DataFrame, default None: Dataframe containing the new data so as to calculate the sequence lengths of the new ids. Only used if new_data is set to True and model_type is 'multivariate_rnn'.
instance_importance : bool, default True: If set to True, instance importance is made on the data. In other words, the algorithm will analyze the impact that each instance of an input sequence had on the output.
feature_importance : bool or string, default False: Defines which feature importance interpretability technique to use. The algorithm will analyze the impact that each feature of an instance had on the output. This is analyzed instance by instance, not in the entire sequence at once. For example, from the feature importance alone, it's not straightforward how a value in a previous instance impacted the current output. Current options include SHAP Kernel Explainer ('shap') and 'mask filter'. If set to False, no feature importance will be done.
fast_calc : bool, default None: If set to True, the algorithm uses less background samples (SHAP) or optimization steps (mask filter), in order to do a fast interpretation of the model. If set to False, the process takes more time in order to get a more precise and truthful interpretation of the model's behavior, requiring longer computation times.
create_new_explainer : bool, default True: Sets if we'll create a new SHAP KernelExplainer or if we'll use a previously defined one in the current model interpreter object.
see_progress : bool, default True: If set to True, a progress bar will show up indicating the execution of the instance importance scores calculations.
save_data : bool, default True: If set to True, the possible background data (used in the SHAP explainer) and the test data (on which importance scores are calculated) are saved as object attributes.
debug_loss : bool, default False: Debugging flag, which makes the method also return an array of the mask filter optimization loss.
total_length : int, default None: If not None, the feature importance scores will be padded to have length total_length.

Returns

inst_scores : numpy.Array: Array containing the importance scores of each instance in the given input sequences. Only calculated if instance_importance is set to True.
feat_scores : numpy.Array: Array containing the importance scores of each feature, of each instance, in the given input sequences. Only calculated if feature_importance is set to True.
if debug_loss is True:
loss_mtx : np.Array: Matrix containing the loss values of the mask filter optimization.

Expand source code

def interpret_model(self, bkgnd_data=None, test_data=None, test_labels=None,
                    new_data=False, model_type=None, df=None,
                    instance_importance=True, feature_importance=False,
                    fast_calc=None, create_new_explainer=True,
                    see_progress=True, save_data=True, debug_loss=False,
                    total_length=None):
    '''Method to calculate scores of feature and/or instance importance, in
    order to be able to interpret a model on a given data.

    Parameters
    ----------
    bkgnd_data : torch.Tensor, default None
        In case of setting fast_calc to False, which makes the algorithm
        require background data in SHAP during the feature importance, the
        background data used in the explainer can be set through this
        parameter.
    test_data : torch.Tensor, default None
        Optionally, the user can specify a subset of data on which model
        interpretation will be made (i.e. calculating feature and/or
        instance importance) as a PyTorch tensor. Otherwise, all the data is
        used.
    test_labels : torch.Tensor, default None
        Labels corresponding to the data used, either specified in the input
        or all the data that the interpreter has.
    new_data : bool, default False
        If set to True, it indicates that the data that will be interpreted
        hasn't been seen before, i.e. it has different ids than those in the
        original dataset defined in the object initialization. This implies
        that a dataframe of the new data is provided (parameter df) so that
        the sequence lengths are calculated. Otherwise, the original
        sequence lengths known by the model interpreter are used.
    model_type : string, default None
        Sets the type of machine learning model. Important to know what type
        of inference and data processing to do. Currently available options
        are ['multivariate_rnn', 'mlp'].
    df : pandas.DataFrame, default None
        Dataframe containing the new data so as to calculate the sequence
        lengths of the new ids. Only used if new_data is set to True and
        `model_type` is 'multivariate_rnn'.
    instance_importance : bool, default True
        If set to True, instance importance is made on the data. In other
        words, the algorithm will analyze the impact that each instance of
        an input sequence had on the output.
    feature_importance : bool or string, default False
        Defines which feature importance interpretability technique to use.
        The algorithm will analyze the impact that each feature of
        an instance had on the output. This is analyzed instance by instance,
        not in the entire sequence at once. For example, from the feature
        importance alone, it's not straightforward how a value in a previous
        instance impacted the current output. Current options include SHAP
        Kernel Explainer ('shap') and 'mask filter'. If set to False, no
        feature importance will be done.
    fast_calc : bool, default None
        If set to True, the algorithm uses less background samples (SHAP)
        or optimization steps (mask filter), in order to do a fast
        interpretation of the model. If set to False, the process takes
        more time in order to get a more precise and truthful
        interpretation of the model's behavior, requiring longer
        computation times.
    create_new_explainer : bool, default True
        Sets if we'll create a new SHAP KernelExplainer or if we'll use a
        previously defined one in the current model interpreter object.
    see_progress : bool, default True
        If set to True, a progress bar will show up indicating the execution
        of the instance importance scores calculations.
    save_data : bool, default True
        If set to True, the possible background data (used in the SHAP
        explainer) and the test data (on which importance scores are
        calculated) are saved as object attributes.
    debug_loss : bool, default False
        Debugging flag, which makes the method also return an array of the
        mask filter optimization loss.
    total_length : int, default None
        If not None, the feature importance scores will be padded to have
        length total_length.

    Returns
    -------
    inst_scores : numpy.Array
        Array containing the importance scores of each instance in the
        given input sequences. Only calculated if instance_importance is set
        to True.
    feat_scores : numpy.Array
        Array containing the importance scores of each feature, of each
        instance, in the given input sequences. Only calculated if
        feature_importance is set to True.

    if debug_loss is True:

    loss_mtx : np.Array
        Matrix containing the loss values of the mask filter optimization.
    '''
    # Confirm that the model is in evaluation mode to deactivate dropout
    self.model.eval()

    if feature_importance is not None and feature_importance is not False:
        try:
            feature_importance = feature_importance.lower()
            if feature_importance != 'shap' and feature_importance != 'mask filter':
                raise Exception(f'ERROR: Specified {feature_importance} feature importance method isn\'t valid. Available options are \"shap\" and\"mask filter\".')
        except:
            raise Exception(f'ERROR: {feature_importance} is an incorrectly defined feature importance method, as it should be a string. Available options are \"shap\" and\"mask filter\".')

    if fast_calc is None:
        # Use the predefined option if fast_calc isn't set in the function call
        fast_calc = self.fast_calc
    else:
        self.fast_calc = fast_calc
    if model_type is None:
        # Use the predefined option if model_type isn't set in the function call
        model_type = self.model_type
    else:
        self.model_type = model_type
    if total_length is None:
        # Use the predefined option if total_length isn't set in the function call
        total_length = self.total_length

    if test_labels is not None:
        if type(test_labels) is np.ndarray:
            # Convert from numpy to pytorch
            test_labels = torch.from_numpy(test_labels)

    if test_data is None:
        if fast_calc:
            # If a subset of data to interpret isn't specified, the interpreter will use all the data
            test_data = self.data
            test_labels = self.labels
        else:
            if bkgnd_data is None:
                # Get the background and test sets from the dataset
                bkgnd_data, test_data = self.create_bkgnd_test_sets()
            else:
                # Get the test set from the dataset
                _, test_data = self.create_bkgnd_test_sets()
    elif type(test_data) is np.ndarray:
        # Convert from numpy to pytorch
        test_data = torch.from_numpy(test_data)

    if model_type == 'multivariate_rnn':
        if new_data is True:
            if df is None:
                raise Exception('ERROR: A dataframe must be provided in order to work with the new data.')
            # Find the sequence lengths of the new data
            seq_len_dict = du.padding.get_sequence_length_dict(df, id_column=self.id_column_num, ts_column=self.inst_column_num)
            # Sort the data by sequence length
            test_data, test_labels, x_lengths_test = du.padding.sort_by_seq_len(test_data, seq_len_dict, test_labels)
        else:
            # Sort the data by sequence length
            test_data, test_labels, x_lengths_test = du.padding.sort_by_seq_len(test_data, self.seq_len_dict, test_labels)

    if not fast_calc:
        if bkgnd_data is None:
            # Get the background set from the dataset
            bkgnd_data, _ = self.create_bkgnd_test_sets()
        elif type(bkgnd_data) is np.ndarray:
            # Convert from numpy to pytorch
            bkgnd_data = torch.from_numpy(bkgnd_data)

    if save_data:
        # Save the data used in the model interpretation
        self.bkgnd_data = bkgnd_data
        self.test_data = test_data
        self.test_labels = test_labels

    if instance_importance is True:
        print('Calculating instance importance scores...')
        # Calculate the scores of importance of each instance
        self.inst_scores = self.instance_importance(test_data, test_labels, x_lengths_test, see_progress)

    if feature_importance is not False:
        print('Calculating feature importance scores...')
        # Calculate the scores of importance of each feature in each instance
        if feature_importance == 'mask filter' and debug_loss:
            self.feat_scores, loss_mtx = self.feature_importance(test_data, model_type,
                                                                 feature_importance,
                                                                 fast_calc, see_progress,
                                                                 bkgnd_data, debug_loss=True,
                                                                 total_length=total_length)
        else:
            self.feat_scores = self.feature_importance(test_data, model_type, feature_importance,
                                                       fast_calc, see_progress, bkgnd_data,
                                                       create_new_explainer=create_new_explainer,
                                                       debug_loss=False, total_length=total_length)

    print('Done!')

    if instance_importance and feature_importance:
        if fast_calc and debug_loss:
            return self.inst_scores, self.feat_scores, loss_mtx
        else:
            return self.inst_scores, self.feat_scores
    elif instance_importance and not feature_importance:
        return self.inst_scores
    elif not instance_importance and feature_importance:
        if fast_calc and debug_loss:
            return self.feat_scores, loss_mtx
        else:
            return self.feat_scores
    else:
        warnings.warn('Without setting instance_importance nor feature_importance to True, the interpret_model function won\'t do anything relevant.')
        return

def mask_filter(self, data=None, x_lengths=None, max_iter=100, l1_coeff=1, lr=0.001, recur_layer=None, see_progress=True, debug_loss=False)

Calculate a mask filter for the given data samples, through an appropriate optimization.

Parameters

data : torch.Tensor, default None: Data sample(s) which will be used to determine the most relevant features. In case of multivariate sequential data, each instance will be analyzed seperately. If None, all data known to the model interpreter will be used.
x_lengths : list of int: Sorted list of sequence lengths, relative to the input data.
max_iter : int, default 100: Maximum number of iterations of the mask filter optimization, for each instance.
l1_coeff : int, default 1: Weight given in the loss function to the L1 norm of the mask filter.
lr : float, default 0.001: Learning rate used in the optimization algorithm.
recur_layer : torch.nn.LSTM or torch.nn.GRU or torch.nn.RNN, default None: Pointer to the recurrent layer in the model, if it exists. It should either be a LSTM, GRU or RNN network. If none is specified, the method will automatically search for a recurrent layer in the model.
see_progress : bool, default True: If set to True, a progress bar will show up indicating the execution of the feature importance scores calculations.
debug_loss : bool, default False: Debugging flag, which makes the method also return an array of the optimization loss.

Returns

mask : numpy.Array: Output mask, after finishing the optimization for every specified sample. It will be inverted before returning, so as to be an array filled with zeros, except in the indeces corresponding to the most relevant features, where it will be one.
if debug_loss is True:
loss_mtx : np.Array: Matrix containing the loss values of the mask filter optimization.

Expand source code

def mask_filter(self, data=None, x_lengths=None, max_iter=100, l1_coeff=1,
                lr=0.001, recur_layer=None, see_progress=True, debug_loss=False):
    '''Calculate a mask filter for the given data samples, through an
    appropriate optimization.

    Parameters
    ----------
    data : torch.Tensor, default None
        Data sample(s) which will be used to determine the most relevant
        features. In case of multivariate sequential data, each instance will
        be analyzed seperately. If None, all data known to the model
        interpreter will be used.
    x_lengths : list of int
        Sorted list of sequence lengths, relative to the input data.
    max_iter : int, default 100
        Maximum number of iterations of the mask filter optimization, for
        each instance.
    l1_coeff : int, default 1
        Weight given in the loss function to the L1 norm of the mask filter.
    lr : float, default 0.001
        Learning rate used in the optimization algorithm.
    recur_layer : torch.nn.LSTM or torch.nn.GRU or torch.nn.RNN, default None
        Pointer to the recurrent layer in the model, if it exists. It should
        either be a LSTM, GRU or RNN network. If none is specified, the
        method will automatically search for a recurrent layer in the model.
    see_progress : bool, default True
        If set to True, a progress bar will show up indicating the execution
        of the feature importance scores calculations.
    debug_loss : bool, default False
        Debugging flag, which makes the method also return an array of the
        optimization loss.

    Returns
    -------
    mask : numpy.Array
        Output mask, after finishing the optimization for every specified
        sample. It will be inverted before returning, so as to be an array
        filled with zeros, except in the indeces corresponding to the most
        relevant features, where it will be one.

    if debug_loss is True:

    loss_mtx : np.Array
        Matrix containing the loss values of the mask filter optimization.
    '''
    # [TODO] Work on an option to use input data different from multivariate sequential
    if data is None:
        # If a subset of data to interpret isn't specified, the interpreter will use all the data
        data = self.data
    if x_lengths is None:
        # Sort the data by sequence length
        data, x_lengths = du.padding.sort_by_seq_len(data, self.seq_len_dict)
    if len(data.shape) > 1 and recur_layer is None:
        # Search for a recurrent layer
        if hasattr(self.model, 'lstm'):
            recur_layer = self.model.lstm
        elif hasattr(self.model, 'gru'):
            recur_layer = self.model.gru
        elif hasattr(self.model, 'rnn'):
            recur_layer = self.model.rnn
        else:
            raise Exception('ERROR: No recurrent layer found. Please specify it in the recur_layer argument.')

    # Confirm that the model is in evaluation mode to deactivate dropout
    self.model.eval()
    # Create a mask filter variable, initialized as an all ones tensor
    mask = torch.ones(data.shape)
    # [DEBUG] Create a loss matrix to analyse the convergence of mask filter optimizations
    loss_mtx = []

    if len(data.shape) == 3:
        # Loop to go through each sequence in the input data
        for seq in tqdm(range(data.shape[0]), disable=not see_progress):
            # Get the true length of the current sequence
            seq_len = x_lengths[seq]
            # Loop to go through each instance in the input sequence
            for inst in tqdm(range(seq_len), disable=not see_progress):
                hidden_state = None
                # Get the hidden state that the model receives as an input
                if inst > 0:
                    # Get the hidden state outputed from the previous recurrent cell
                    _, hidden_state = recur_layer(data[:inst])
                    # Avoid backpropagating through previous instances
                    if type(hidden_state) is tuple:
                        hidden_state = (hidden_state[0].detach(), hidden_state[1].detach())
                    else:
                        hidden_state.detach_()
                # Temporary mask filter for he current instance
                tmp_mask = Variable(mask[seq, inst, :], requires_grad=True)
                # [DEBUG] List of the current optimization's losses
                tmp_loss_list = []
                # Mask filter optimization loop
                for iter in tqdm(range(max_iter), disable=not see_progress):
                    # Calculate the model's output to the original, unchanged instance data
                    ref_output = self.model(data[seq, inst, :].unsqueeze(0).unsqueeze(0), hidden_state=hidden_state)
                    # Prevent mask filter optimization from backpropagating through the reference output
                    ref_output.detach_()
                    # Perform a single optimization step
                    tmp_mask, tmp_loss = self.mask_filter_step(tmp_mask, data[seq, inst, :], ref_output, l1_coeff, hidden_state, debug_loss=debug_loss)
                    tmp_loss_list.append(tmp_loss)
                # Save the optimized mask filter of the current instance
                mask[seq, inst, :] = tmp_mask
                # [DEBUG] Add the current instance's optimization logs to the overall loss matrix
                loss_mtx.append(tmp_loss_list)

    elif len(data.shape) == 2:
        # Loop to go through each instance in the input sequence
        for inst in tqdm(range(data.shape[0]), disable=not see_progress):
            hidden_state = None
            # Get the hidden state that the model receives as an input
            if inst > 0:
                # Get the hidden state outputed from the previous recurrent cell
                _, hidden_state = recur_layer(data[:inst])
                # Avoid backpropagating through previous instances
                if type(hidden_state) is tuple:
                    hidden_state = (hidden_state[0].detach(), hidden_state[1].detach())
                else:
                    hidden_state.detach_()
            # Temporary mask filter for he current instance
            tmp_mask = Variable(mask[inst], requires_grad=True)
            # Mask filter optimization loop
            for iter in tqdm(range(max_iter), disable=not see_progress):
                # Calculate the model's output to the original, unchanged instance data
                ref_output = self.model(data[inst].unsqueeze(0).unsqueeze(0), hidden_state=hidden_state)
                # Prevent mask filter optimization from backpropagating through the reference output
                ref_output.detach_()
                # Perform a single optimization step
                tmp_mask = self.mask_filter_step(tmp_mask, data[inst], ref_output, l1_coeff, hidden_state)
            # Save the optimized mask filter of the current instance
            mask[inst] = tmp_mask

    elif len(data.shape) == 1:
        # Make sure that the mask can be optimized properly
        mask.requires_grad_()
        # Mask filter optimization loop
        for iter in tqdm(range(max_iter), disable=not see_progress):
            # Calculate the model's output to the original, unchanged instance data
            ref_output = self.model(data.unsqueeze(0).unsqueeze(0), hidden_state=hidden_state)
            # Prevent mask filter optimization from backpropagating through the reference output
            ref_output.detach_()
            # Perform a single optimization step
            mask = self.mask_filter_step(mask, data, ref_output, l1_coeff)

    else:
        raise Exception(f'ERROR: Can\'t handle data with more than 3 dimensions. Submitted data with {len(data.shape)} dimensions.')

    # Return the inverted version of the mask, to atrribute 1 (one) to the most relevant features
    if debug_loss:
        return 1 - mask, loss_mtx
    else:
        return 1 - mask

def mask_filter_step(self, mask, data, ref_output, l1_coeff=1, hidden_state=None, debug_loss=False)

Perform a single optimization step to calculate a new version of the mask filter.

Parameters

mask : numpy.Array: Current mask filter, either the initial one or from the previous optimization iteration.
data : torch.Tensor: Data sample which will be used to determine the most relevant features. In case of multivariate sequential data, this must be a single instance of a sequence.
ref_output : torch.Tensor or float: Model's output to the original instance, with no mask filters applied.
l1_coeff : int, default 1: Weight given in the loss function to the L1 norm of the mask filter.
hidden_state : torch.Tensor or tuple of two torch.Tensor, default None: Hidden state coming from the previous recurrent cell. If none is specified, the hidden state is initialized as zero.
debug_loss : bool, default False: Debugging flag, which makes the method also return an array of the optimization loss.

Returns

mask : numpy.Array: Current mask filter, after the performed optimization step.
if debug_loss is True:
loss : float: Current loss value of the mask filter optimization.

Expand source code

def mask_filter_step(self, mask, data, ref_output, l1_coeff=1,
                     hidden_state=None, debug_loss=False):
    '''Perform a single optimization step to calculate a new version of the
    mask filter.

    Parameters
    ----------
    mask : numpy.Array
        Current mask filter, either the initial one or from the previous
        optimization iteration.
    data : torch.Tensor
        Data sample which will be used to determine the most relevant
        features. In case of multivariate sequential data, this must be a
        single instance of a sequence.
    ref_output : torch.Tensor or float
        Model's output to the original instance, with no mask filters applied.
    l1_coeff : int, default 1
        Weight given in the loss function to the L1 norm of the mask filter.
    hidden_state : torch.Tensor or tuple of two torch.Tensor, default None
        Hidden state coming from the previous recurrent cell. If none is
        specified, the hidden state is initialized as zero.
    debug_loss : bool, default False
        Debugging flag, which makes the method also return an array of the
        optimization loss.

    Returns
    -------
    mask : numpy.Array
        Current mask filter, after the performed optimization step.

    if debug_loss is True:

    loss : float
        Current loss value of the mask filter optimization.
    '''
    # Get the model's output for the masked input data
    new_output = self.model((mask * data).unsqueeze(0).unsqueeze(0), hidden_state=hidden_state)
    # Calculate the loss function
    # • Minimize the number of activated mask filter units (occluded features)
    # • Maximize the change made to the output
    loss = l1_coeff * torch.mean(torch.abs(1 - mask)) + 1 - (ref_output - new_output).pow(2)
    # Backpropagate the loss function and run an optimization step (update the mask filter)
    loss.backward(retain_graph=True)
    mask.grad = du.deep_learning.change_grad((-1) * mask.grad, mask.data)
    mask.data = mask.data + mask.grad
    # Make sure that the mask has values either 0 or 1
    mask.data.clamp_(0, 1)
    mask.data.round_()
    if debug_loss:
        return mask, loss.item()
    else:
        return mask

def shap_values_df(self)

Create a dataframe that contains both the original data used in the interpretation of the model and the resulting SHAP values.

Returns

data_n_shap_df : pandas.DataFrame: Dataframe that contains both the original data used in the interpretation of the model and the resulting SHAP values.

Expand source code

def shap_values_df(self):
    '''Create a dataframe that contains both the original data used in the
    interpretation of the model and the resulting SHAP values.

    Returns
    -------
    data_n_shap_df : pandas.DataFrame
        Dataframe that contains both the original data used in the
        interpretation of the model and the resulting SHAP values.'''
    # [TODO] Add option to handle pre-calculated SHAP values
    # (pre-defined data and SHAP values, outside of the Model Interpreter)
    # Join the original data and the features' SHAP values
    data_n_shap = np.concatenate([self.test_data.numpy(), self.test_labels.unsqueeze(2).numpy(), self.feat_scores], axis=2)
    # Reshape into a 2D format
    data_n_shap = data_n_shap.reshape(-1, data_n_shap.shape[-1])
    # Remove padding samples
    data_n_shap = data_n_shap[[self.padding_value not in row for row in data_n_shap]]
    # Define the column names list
    shap_column_names = [f'{feature}_shap' for feature in self.feat_names]
    column_names = ([self.id_column_name] + [self.inst_column_name] + self.feat_names
                    + [self.label_column_name] + shap_column_names)
    # Create the dataframe
    data_n_shap_df = pd.DataFrame(data=data_n_shap, columns=column_names)
    return data_n_shap_df