Source code for model_architectures.rnn_base_model.predict.prediction

"""Prediction of recurrent neural network model.

Functions
---------
predict
    Make predictions with recurrent neural network model for given dataset.
compute_sample_prediction_loss
    Compute loss of sample output features prediction.
"""
#
#                                                                       Modules
# =============================================================================
# Standard
import os
import random
import time
import datetime
# Third-party
import torch
import tqdm
import numpy as np
# Local
from time_series_data.time_dataset import get_time_series_data_loader
from model_architectures.rnn_base_model.model.gru_model import GRURNNModel
from model_architectures.procedures.model_prediction import \
    make_predictions_subdir, save_sample_predictions, \
    write_prediction_summary_file
from model_architectures.procedures.model_data_scaling import \
    data_scaler_transform
from model_architectures.procedures.model_state_files import load_model_state
from utilities.loss_functions import get_pytorch_loss
from utilities.data_loaders import seed_worker
#
#                                                          Authorship & Credits
# =============================================================================
__author__ = 'Bernardo Ferreira (bernardo_ferreira@brown.edu)'
__credits__ = ['Bernardo Ferreira', ]
__status__ = 'Stable'
# =============================================================================
#
# =============================================================================
[docs]def predict(dataset, model_directory, model=None, predict_directory=None,
            model_load_state=None, loss_nature='features_out',
            loss_type='mse', loss_kwargs={}, is_normalized_loss=False,
            batch_size=1, dataset_file_path=None, device_type='cpu', seed=None,
            is_verbose=False):
    """Make predictions with recurrent neural network model for given dataset.
    
    Parameters
    ----------
    dataset : torch.utils.data.Dataset
        Time series data set. Each sample is stored as a dictionary where
        each feature (key, str) data is a torch.Tensor(2d) of shape
        (sequence_length, n_features).
    model_directory : str
        Directory where model is stored.
    model : GRURNNModel, default=None
        Hybrid material constitutive model. If None, then model is initialized
        from the initialization file and the state is loaded from the state
        file. In both cases the model is set to evaluation mode.
    predict_directory : str, default=None
        Directory where model predictions results are stored. If None, then
        all output files are supressed.
    model_load_state : {'default', 'init', int, 'best', 'last'},
                       default='default'
        Available model state to be loaded from the model directory.
        Options:
        
        'default'   : Model default state file
        
        'init'      : Model initial state
        
        int         : Model state of given training epoch
        
        'best'      : Model state of best performance
        
        'last'      : Model state of latest training epoch

    loss_nature : {'features_out',}, default='features_out'
        Loss nature:
        
        'features_out' : Based on output features

    loss_type : {'mse',}, default='mse'
        Loss function type:
        
        'mse'  : MSE (torch.nn.MSELoss)
        
    loss_kwargs : dict, default={}
        Arguments of torch.nn._Loss initializer.
    is_normalized_loss : bool, default=False
        If True, then samples prediction loss are computed from normalized
        output data, False otherwise. Normalization of output data requires
        that model data scalers are available.
    batch_size : int, default=1
        Number of samples loaded per batch.
    dataset_file_path : str, default=None
        Time series data set file path if such file exists. Only used for
        output purposes.
    device_type : {'cpu', 'cuda'}, default='cpu'
        Type of device on which torch.Tensor is allocated.
    seed : int, default=None
        Seed used to initialize the random number generators of Python and
        other libraries (e.g., NumPy, PyTorch) for all devices to preserve
        reproducibility. Does also set workers seed in PyTorch data loaders.
    is_verbose : bool, default=False
        If True, enable verbose output.
        
    Returns
    -------
    predict_subdir : str
        Subdirectory where samples predictions results files are stored.
    avg_predict_loss : float
        Average prediction loss per sample. Defaults to None if ground-truth is
        not available for all data set samples.
    """
    # Set random number generators initialization for reproducibility
    if isinstance(seed, int):
        random.seed(seed)
        np.random.seed(seed)
        generator = torch.Generator().manual_seed(seed)
    # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
    # Set device
    device = torch.device(device_type)
    # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
    start_time_sec = time.time()
    if is_verbose:
        print('\nRecurrent Neural Network model prediction'
              '\n-----------------------------------------')
    # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
    # Check model directory
    if not os.path.exists(model_directory):
        raise RuntimeError('The model directory has not been found:\n\n'
                           + model_directory)
    # Check prediction directory
    if predict_directory is not None and not os.path.exists(predict_directory):
        raise RuntimeError('The model prediction directory has not been '
                           'found:\n\n' + predict_directory)
    # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
    # Initialize model and load model state if not provided
    if model is None:
        if is_verbose:
            print('\n> Loading Recurrent Neural Network model...')
        # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
        # Initialize recurrent neural network model
        model = GRURNNModel.init_model_from_file(
            model_directory=model_directory)
        # Set model device
        model.set_device(device_type)
        # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
        # Load recurrent neural network model state
        _ = load_model_state(model, model_load_state=model_load_state,
                             is_remove_posterior=False)
    # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
    # Get model input and output features normalization
    is_model_in_normalized = model.is_model_in_normalized
    is_model_out_normalized = model.is_model_out_normalized
    # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
    # Move model to device
    model.to(device=device)
    # Set model in evaluation mode
    model.eval()
    # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
    # Create model predictions subdirectory for current prediction process
    predict_subdir = None
    if predict_directory is not None:
        predict_subdir = make_predictions_subdir(predict_directory)
    # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
    # Set data loader
    if isinstance(seed, int):
        data_loader = get_time_series_data_loader(
            dataset=dataset, batch_size=batch_size,
            kwargs={'worker_init_fn': seed_worker, 'generator': generator})
    else:
        data_loader = get_time_series_data_loader(
            dataset=dataset, batch_size=batch_size)
    # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
    # Initialize loss function
    loss_function = get_pytorch_loss(loss_type, **loss_kwargs)
    # Initialize samples prediction loss
    loss_samples = []
    # Initialize sample ID
    sample_id = 0
    # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
    if is_verbose:
        print('\n\n> Starting prediction process...\n')
    # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
    # Set context manager to avoid creation of computation graphs during the
    # model evaluation (forward propagation)
    with torch.no_grad():
        # Loop over samples
        for _, batch in enumerate(tqdm.tqdm(data_loader,
                                            desc='> Predictions (batches): ',
                                            disable=not is_verbose)):
            # Move batch to device
            for key in batch.keys():
                batch[key] = batch[key].to(device)
            # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
            # Get input features
            if is_model_in_normalized:
                # Normalize features ground-truth
                features_in = \
                    data_scaler_transform(model, tensor=batch['features_in'],
                                          features_type='features_in',
                                          mode='normalize')
            else:
                features_in = batch['features_in']
            # Get initial hidden state features
            if 'hidden_features_in' in batch.keys():
                hidden_features_in = batch['hidden_features_in']
            else:
                hidden_features_in = None
            # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
            # Get output features ground-truth (None if not available)
            targets = batch['features_out']
            # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
            # Get number of batched samples
            batch_n_sample = batch['features_in'].shape[1]
            # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
            # Initialize batched samples results
            samples_results = []
            # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
            # Compute output features predictions (forward propagation)
            if loss_nature == 'features_out':
                # Compute output features
                features_out, _ = model(features_in, hidden_features_in)
                # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
                # Denormalize output features data
                if is_model_out_normalized:
                    features_out = \
                        data_scaler_transform(model, tensor=features_out,
                                              features_type='features_out',
                                              mode='denormalize')
                # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
                # Loop over batched samples
                for j in range(batch_n_sample):
                    # Initialize sample results
                    sample_results = {}
                    # Build sample results (removing batch dimension)
                    sample_results['features_out'] = \
                        features_out[:, j, :].detach().clone().cpu()
                    sample_results['targets'] = None
                    if targets is not None:
                        sample_results['targets'] = \
                            targets[:, j, :].detach().clone().cpu()
                    # Store sample results
                    samples_results.append(sample_results)
            # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
            else:
                raise RuntimeError('Unknown loss nature.')
            # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
            # Loop over batched samples
            for sample_results in samples_results:
                # Compute sample output features prediction loss
                loss = compute_sample_prediction_loss(
                    model, loss_function, sample_results['features_out'],
                    sample_results['targets'],
                    is_normalized_loss=is_normalized_loss)
                # Store prediction loss data
                sample_results['prediction_loss_data'] = \
                    (loss_nature, loss_type, loss, is_normalized_loss)
                # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
                # Assemble sample prediction loss if ground-truth is available
                if loss is not None:
                    loss_samples.append(loss.detach().clone().cpu())
                # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
                # Save sample predictions results
                if predict_directory is not None:
                    save_sample_predictions(predictions_dir=predict_subdir,
                                            sample_id=sample_id,
                                            sample_results=sample_results)
                # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
                # Increment sample ID
                sample_id += 1
    # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
    if is_verbose:
        print('\n> Finished prediction process!\n')
    # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
    # Compute average prediction loss per sample
    avg_predict_loss = None
    if isinstance(loss_samples, list) and len(loss_samples) == len(dataset):
        avg_predict_loss = np.mean(loss_samples)
    # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
    if is_verbose:
        # Set average prediction loss output format
        if avg_predict_loss:
            loss_str = (f'{avg_predict_loss:.8e} | {loss_type}')
            if is_normalized_loss:
                loss_str += ', normalized'
        else:
            loss_str = 'Ground-truth not available'  
        # Display average loss
        print('\n> Avg. prediction loss per sample: '
              + loss_str)
    # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
    # Compute total prediction time and average prediction time per sample
    total_time_sec = time.time() - start_time_sec
    if len(dataset) > 0:
        avg_time_sample = total_time_sec/len(dataset)
    else:
        avg_time_sample = float('nan')
    # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
    if is_verbose:
        print(f'\n> Prediction results directory: {predict_subdir}')
        print(f'\n> Total prediction time: '
              f'{str(datetime.timedelta(seconds=int(total_time_sec)))} | '
              f'Avg. prediction time per sample: '
              f'{str(datetime.timedelta(seconds=int(avg_time_sample)))}\n')
    # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
    # Write summary data file for model prediction process
    if predict_directory is not None:
        write_prediction_summary_file(
            predict_subdir, device_type, seed, model_directory,
            model_load_state, loss_type, loss_kwargs, is_normalized_loss,
            dataset_file_path, dataset, avg_predict_loss, total_time_sec,
            avg_time_sample)
    # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
    return predict_subdir, avg_predict_loss
# =============================================================================
def compute_sample_prediction_loss(model, loss_function, features_out, targets,
                                   is_normalized_loss=False):
    """Compute loss of sample output features prediction.
    
    Assumes that provided output features and targets are denormalized.

    Parameters
    ----------
    model : torch.nn.Module
        Recurrent neural network model.
    loss_function : torch.nn._Loss
        PyTorch loss function.
    features_out : torch.Tensor
        Predicted output features stored as a torch.Tensor(2d).
    targets : {torch.Tensor, None}
        Output features ground-truth stored as a torch.Tensor(2d).
    is_normalized_loss : bool, default=False
        If True, then samples prediction loss are computed from normalized
        output data, False otherwise. Normalization of output data requires
        that model data scalers are available.
    
    Returns
    -------
    loss : {float, None}
        Loss of sample output features prediction. Set to None if output
        features ground-truth is not available.
    """
    # Check if output features ground-truth is available
    is_ground_truth_available = targets is not None
    # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
    # Compute sample loss if ground-truth is available
    if is_ground_truth_available:
        # Normalize output features
        if is_normalized_loss:
            # Normalize output features predictions
            features_out = \
                data_scaler_transform(model, tensor=features_out,
                                      features_type='features_out',
                                      mode='normalize')
            # Normalize output features ground-truth
            targets = \
                data_scaler_transform(model, tensor=targets,
                                      features_type='features_out',
                                      mode='normalize')
        # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
        # Compute sample loss
        loss = loss_function(features_out, targets)
    else:
        # Set sample loss to None if ground-truth is not available
        loss = None
    # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
    return loss