Source code for runlmc.models.multigp

# Copyright (c) 2016, Vladimir Feinberg
# Licensed under the BSD 3-clause license (see LICENSE)

# This file was modified from the GPy project. Its file header is replicated
# below. Its LICENSE.txt is replicated in the LICENSE file for this directory.

# Copyright (c) 2012-2014, GPy authors (see AUTHORS.txt).
# Licensed under the BSD 3-clause license (see LICENSE.txt)

"""
This module houses the base model that the package centers around:
:class:`runlmc.models.multigp.MultiGP`, the parent class for all
multi-output GP models in this package.
"""

import logging

import numpy as np
import scipy.stats

from ..parameterization.model import Model
from ..util.normalizer import Norm

_LOG = logging.getLogger(__name__)


class MultiGP(Model):
    """
    The generic GP model for multi-output regression. This handles common
    functionality between all models regarding input validation and high
    level parameter optimization routines.

    This model assumes Gaussian noise.

    This class shouldn't be instantiated directly: subclasses must
    implement :meth:`parameters_changed`, :meth:`log_likelihood` and
    :meth:`_raw_predict`.

    .. note:: Currently, only one-dimensional input is supported.

    Upon construction, this class assumes ownership of its parameters and
    does not account for changes in their values.

    :param Xs: input observations, should be a list of numpy arrays,
               where each numpy array is a design matrix for the inputs to
               output :math:`i`. If the :math:`i`-th input has :math:`n_i`
               data points, then this matrix can be :math:`n_i` or
               :math:`n_i\\times P` shape for input dimension :math:`P`,
               with the former re-interpreted as :math:`P=1`.
    :param Ys: output observations, this must be a list of one-dimensional
               numpy arrays, matching up with the number of rows in `Xs`.
    :param normalize: optional normalization for outputs `Ys`.
                      Prediction will be un-normalized.
    :param str name: model name, forwarded to the parent constructor and
                     used as a prefix in log messages.
    :raises: :class:`ValueError` if `Xs` is empty, if `Xs` and `Ys` lengths
             do not match (overall or per output), if any array has an
             unsupported number of dimensions, or if the inputs do not all
             share the same input dimension.
    :raises: :class:`ValueError` if any of the `Ys` has zero standard
             deviation.
    """

    def __init__(self, Xs, Ys, normalize=True, name='multigp'):
        super().__init__(name)
        self.input_dim, self.output_dim = self._validate_io(Xs, Ys)

        # One normalizer per output; stays None when normalization is off so
        # that the prediction methods can skip the inverse transform.
        self.normalizer = None
        if normalize:
            _LOG.info('%s: normalizing outputs', name)
            self.normalizer = [Norm() for _ in Ys]
            for norm, Y in zip(self.normalizer, Ys):
                norm.scale_by(Y)
            Ys = [norm.normalize(Y) for norm, Y in zip(self.normalizer, Ys)]
        self.Ys = Ys
        # Inputs are always stored as 2-D (n_i x input_dim) arrays.
        self.Xs = self._pad_dims(Xs)

        _LOG.info('%s: MultiGP initialized', name)

    def parameters_changed(self):
        """
        This method is called automatically when linked parameters change,
        which they may during the optimization process.

        Classes should update their posterior information, log likelihood,
        and gradients when this happens, such that :meth:`_raw_predict`,
        :meth:`log_likelihood`, and :meth:`gradient`
        are consistent with the new parameters.

        .. note:: This method should not be called except by the internal
                  usage of `paramz`.

        :raises: :class:`NotImplementedError` always; subclasses override.
        """
        raise NotImplementedError

    def log_likelihood(self):
        """
        The log marginal likelihood of the model, :math:`p(\\mathbf{y})`,
        this is the objective function of the model being optimised.

        :raises: :class:`NotImplementedError` always; subclasses override.
        """
        raise NotImplementedError

    def _raw_predict(self, Xs):
        """
        Returns the raw predictive mean and variance, without
        incorporating normalization.

        See :meth:`predict` for more details.

        :raises: :class:`NotImplementedError` always; subclasses override.
        """
        raise NotImplementedError

    def _predict(self, Xs, normalize):
        """
        Shared prediction routine behind :meth:`predict` and
        :meth:`predict_quantiles`.

        :param Xs: list of two-dimensional input arrays, one per output
                   (callers pass the result of :meth:`_pad_dims`).
        :param normalize: if true and output normalization is enabled, map
                          the raw mean and variance back through each
                          output's normalizer.
        :returns: `(mean, var)` as produced by :meth:`_raw_predict`,
                  optionally un-normalized.
        """
        # Internal sanity checks on already-padded inputs.
        assert len(Xs) == self.output_dim, \
            'num inputs {} != output_dim {}'.format(len(Xs), self.output_dim)
        assert all(X.shape[1] == self.input_dim for X in Xs)
        mu, var = self._raw_predict(Xs)

        if self.normalizer and normalize:
            mu = [norm.inverse_mean(m) for norm, m in zip(self.normalizer, mu)]
            var = [norm.inverse_variance(v)
                   for norm, v in zip(self.normalizer, var)]

        return mu, var

    def predict(self, Xs):
        """
        Predict the functions at the new points `Xs`.

        :param Xs: The points at which to make a prediction for each output.
                   Should be empty if no output desired for a certain index.
                   This is a :class:`list` of :class:`numpy.ndarray` for each
                   output `d`, one-dimensional
                   of size `n_d` each. Length of `Xs` should be equal to the
                   number of outputs :py:attr:`output_dim`.
        :returns: `(mean, var)`:

            `mean`: posterior mean, a list of length :py:attr:`output_dim` with
                    one-dimensional numpy arrays of length `n_d` at index `d`.

            `var`: posterior variance, corresponding to each mean entry.
        :raises: :class:`ValueError` if an input's dimension differs from
                 :py:attr:`input_dim`.

        .. note::
            If you want the predictive quantiles (e.g. 95% confidence interval)
            use :func:`predict_quantiles`.
        """
        Xs = self._pad_dims(Xs)
        return self._predict(Xs, normalize=True)

    def predict_quantiles(self, Xs, quantiles=(2.5, 97.5)):
        """
        Identical to predict, but returns quantiles instead of mean and
        variance according to the Gaussian likelihood.

        :param Xs: prediction inputs, in the same format as for
                   :meth:`predict`.
        :param quantiles: tuple of quantiles, default is (2.5, 97.5),
                          which is the 95% interval; shouldn't be 0 or 100
        :type quantiles: tuple of doubles
        :returns: list of quantiles for each output's input, as a numpy
                  array, 2-D, the first axis corresponding to the
                  input index and the second to the quantile index.
        :raises: :class:`ValueError` if an input's dimension differs from
                 :py:attr:`input_dim`.
        """
        Xs = self._pad_dims(Xs)
        # Quantiles are formed from the raw (not un-normalized) mean and
        # variance, then passed through each normalizer's ``inverse_mean``.
        mu, var = self._predict(Xs, normalize=False)
        quantiles = np.fromiter(quantiles, dtype=float)
        quantiles = [
            np.outer(np.sqrt(v), scipy.stats.norm.ppf(quantiles / 100.))
            + m[:, np.newaxis]
            for m, v in zip(mu, var)]
        if self.normalizer:
            quantiles = [norm.inverse_mean(q)
                         for norm, q in zip(self.normalizer, quantiles)]
        return quantiles

    def optimize(self, **kwargs):
        """
        Optimize the model using :func:`log_likelihood` with a
        gradient descent method that involves the priors.

        `kwargs` are passed to the optimizer, overriding the defaults set
        in this method (`optimizer`, `start`, `messages`, `max_iters`,
        `ipython_notebook`, `clear_after_finish`).

        :param optimizer: A :py:class:`paramz.optimization.Optimizer`.
                          Pre-built ones available in
                          :py:mod:`runlmc.models.optimization`.
        :raises: :class:`KeyboardInterrupt` re-raised after printing a
                 notice if the optimization is interrupted.
        """
        try:
            dfldict = {
                'optimizer': None,
                'start': None,
                'messages': False,
                'max_iters': 1,
                'ipython_notebook': True,
                'clear_after_finish': False
            }
            # Caller-supplied options take precedence over the defaults.
            dfldict.update(kwargs)
            _LOG.info('%s: about to start optimizing - options:\n%s',
                      self.name, dfldict)
            super().optimize(**dfldict)
            _LOG.info('%s: completed optimization', self.name)
        except KeyboardInterrupt:
            print('{}: KeyboardInterrupt caught, terminating optimization.'
                  .format(self.name))
            raise

    def _validate_io(self, Xs, Ys):
        """
        Check that the inputs `Xs` and outputs `Ys` are mutually consistent.

        :param Xs: list of one- or two-dimensional numpy arrays.
        :param Ys: list of one-dimensional numpy arrays.
        :returns: `(input_dim, output_dim)`, the shared input dimension
                  (1 for one-dimensional inputs) and the number of outputs.
        :raises: :class:`ValueError` if `Xs` is empty, the list lengths
                 differ, an array has the wrong number of dimensions, an
                 input/output pair differs in length, the inputs disagree
                 on their dimension, or an output has zero standard
                 deviation.
        """
        if not Xs:
            raise ValueError('Expecting at least 1 output')
        if len(Xs) != len(Ys):
            raise ValueError('Differing number of inputs {} and outputs {}'
                             .format(len(Xs), len(Ys)))
        for i, (X, Y) in enumerate(zip(Xs, Ys)):
            # Shape checks come first: len() on a 0-d array raises TypeError,
            # which would otherwise pre-empt the intended ValueError.
            if X.ndim not in [1, 2]:
                raise ValueError('Input {} mishapen, {} not 1D or 2D'
                                 .format(i, X.shape))
            if Y.ndim != 1:
                raise ValueError('Output {} mishapen, {} not 1D'
                                 .format(i, Y.shape))
            if len(X) != len(Y):
                raise ValueError('Ouput {} has {} inputs and {} observed vals'
                                 .format(i, len(X), len(Y)))

        # One-dimensional inputs count as dimension 1, so mixing them with
        # wider two-dimensional inputs is reported here.
        dims = {X.shape[1] if X.ndim > 1 else 1 for X in Xs}
        if len(dims) != 1:
            raise ValueError(
                'Found inputs of varying dimensions {}'.format(dims))

        for i, Y in enumerate(Ys):
            if np.std(Y) == 0:
                raise ValueError('Output {} has std dev 0'.format(i))

        return dims.pop(), len(Xs)

    def _pad_dims(self, Xs):
        """
        Reshape one-dimensional inputs into single-column matrices.

        :param Xs: list of one- or two-dimensional numpy arrays.
        :returns: list of two-dimensional arrays, each with
                  :py:attr:`input_dim` columns.
        :raises: :class:`ValueError` if any input's column count differs
                 from :py:attr:`input_dim`.
        """
        Xs = [X.reshape(-1, 1) if X.ndim == 1 else X for X in Xs]
        for i, X in enumerate(Xs):
            if X.shape[1] != self.input_dim:
                raise ValueError('input {} dim {} != expected dim {}'.format(
                    i, X.shape[1], self.input_dim))
        return Xs