bayesopt/html/gaussian__process__normal_8cpp_source.html

 /*
 -------------------------------------------------------------------------
    This file is part of BayesOpt, an efficient C++ library for
    Bayesian optimization.

    Copyright (C) 2011-2015 Ruben Martinez-Cantin <rmcantin@unizar.es>

    BayesOpt is free software: you can redistribute it and/or modify it
    under the terms of the GNU Affero General Public License as published by
    the Free Software Foundation, either version 3 of the License, or
    (at your option) any later version.

    BayesOpt is distributed in the hope that it will be useful, but
    WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
    GNU Affero General Public License for more details.

    You should have received a copy of the GNU Affero General Public License
    along with BayesOpt.  If not, see <http://www.gnu.org/licenses/>.
 ------------------------------------------------------------------------
 */

 #include <cstdlib>
 #include <boost/math/special_functions/fpclassify.hpp>
 #include <boost/numeric/ublas/banded.hpp>
 #include "ublas_trace.hpp"
 #include "ublas_elementwise.hpp"
 #include "gauss_distribution.hpp"
 #include "gaussian_process_normal.hpp"

 namespace bayesopt
 {

   namespace ublas = boost::numeric::ublas;

   // Builds a Gaussian process whose mean-function coefficients have a
   // normal prior.
   //
   // The prior mean of the coefficients is copied from params.mean.coef_mean
   // and the prior precision of each coefficient is stored in mInvVarW as
   // 1/std^2, with std taken from params.mean.coef_std. mSigma is set from
   // params.sigma_s. All constructor arguments are forwarded unchanged to
   // HierarchicalGaussianProcess; eng is also used to create the predictive
   // distribution object d_ (released in the destructor).
   //
   // Throws std::runtime_error if coef_mean and coef_std have different
   // sizes: mW0, mInvVarW and mD are all dimensioned from coef_mean, so a
   // longer coef_std would write past the end of mInvVarW and a shorter one
   // would leave some precisions unset.
   //
   // Note: a zero entry in coef_std is not rejected here; it yields an
   // infinite precision for that coefficient.
   GaussianProcessNormal::GaussianProcessNormal(size_t dim,
                            Parameters params,
                            const Dataset& data,
                            MeanModel& mean,
                            randEngine& eng):
     HierarchicalGaussianProcess(dim,params,data,mean,eng),
     mW0(params.mean.coef_mean.size()), mInvVarW(params.mean.coef_mean.size()),
     mD(params.mean.coef_mean.size(),params.mean.coef_mean.size())
   {
     const size_t nCoef = params.mean.coef_mean.size();
     if (params.mean.coef_std.size() != nCoef)
       {
     throw std::runtime_error("Error in GaussianProcessNormal. "
                  "coef_mean and coef_std must have the same size.");
       }

     mSigma = params.sigma_s;
     mW0 = params.mean.coef_mean;
     for (size_t ii = 0; ii < nCoef; ++ii)
       {
     // Store the precision (inverse variance) of the ii-th coefficient.
     const double varii = params.mean.coef_std[ii] * params.mean.coef_std[ii];
     mInvVarW(ii) = 1/varii;
       }
     // Done last so that nothing can throw after the allocation.
     d_ = new GaussianDistribution(eng);
   }  // Constructor


   // Destructor: releases the predictive distribution object d_ that the
   // constructor allocated with new.
   GaussianProcessNormal::~GaussianProcessNormal()
   {
     delete d_;
   } // Default destructor


   // Predictive distribution of the process at a single query point.
   //
   // Relies on the quantities cached by precomputePrediction() (mKF, mD,
   // mWMap and mVf) together with the factor mL.
   //
   // Returns the member d_ after setting its mean and standard deviation, so
   // the result is overwritten by the next call and remains owned by this
   // object (it is deleted in the destructor).
   //
   // Throws std::runtime_error if either the mean or the standard deviation
   // evaluates to NaN.
   ProbabilityDistribution*
   GaussianProcessNormal::prediction(const vectord &query)
   {
     const double selfCorr = computeSelfCorrelation(query);
     const vectord features = mMean.getFeatures(query);

     // Cross-correlation with the data, solved against the lower factor mL.
     vectord crossCorr = computeCrossCorrelation(query);
     inplace_solve(mL,crossCorr,ublas::lower_tag());

     // Feature residual of the query, solved against the lower factor mD.
     vectord resid = features - prod(crossCorr,mKF);
     inplace_solve(mD,resid,ublas::lower_tag());

     // Mean: parametric part plus the correlation-based correction.
     const double meanPart = inner_prod(features,mWMap);
     const double corrPart = inner_prod(crossCorr,mVf);
     const double yPred = meanPart + corrPart;

     // Standard deviation: self correlation, minus what the data explains,
     // plus the term coming from the mean coefficients; scaled by mSigma.
     const double explained = inner_prod(crossCorr,crossCorr);
     const double coefTerm = inner_prod(resid,resid);
     const double sPred = sqrt( mSigma * (selfCorr - explained + coefTerm) );

     const bool meanIsNaN = boost::math::isnan(yPred);
     if (meanIsNaN || (boost::math::isnan(sPred)))
       {
     throw std::runtime_error("Error in prediction. NaN found.");
       }

     d_->setMeanAndStd(yPred,sPred);
     return d_;
   }


   double GaussianProcessNormal::negativeLogLikelihood()
   {
     matrixd KK = computeCorrMatrix();
     const size_t n = KK.size1();
     const size_t p = mMean.nFeatures();

     vectord v0 = mData.mY - prod(trans(mMean.mFeatM),mW0);
     matrixd WW = zmatrixd(p,p);  //TODO: diagonal matrix
     utils::add_to_diagonal(WW,mInvVarW);
     matrixd FW = prod(trans(mMean.mFeatM),WW);
     KK += prod(FW,mMean.mFeatM);
     matrixd BB(n,n);
     utils::cholesky_decompose(KK,BB);
     inplace_solve(BB,v0,ublas::lower_tag());
     double zz = inner_prod(v0,v0);

     double lik = 1/(2*mSigma) * zz;
     lik += utils::log_trace(BB);
     return lik;
   }


   // Caches every quantity used by prediction() that does not depend on the
   // query point. With F = mMean.mFeatM, y = mData.mY and mL the lower
   // Cholesky factor of the correlation matrix K (K = L L^T):
   //
   //   mKF   = L^{-1} F^T
   //   mD    = lower Cholesky factor of  mKF^T mKF + diag(mInvVarW)
   //           (i.e. F K^{-1} F^T plus the prior precision)
   //   mWMap = solution of  mD mD^T w = F K^{-1} y + mInvVarW .* mW0
   //   mVf   = L^{-1} (y - F^T mWMap)
   //
   // Throws std::runtime_error if the first entry of mWMap is NaN.
   void GaussianProcessNormal::precomputePrediction()
   {
     const size_t p = mMean.nFeatures();

     mKF = trans(mMean.mFeatM);
     inplace_solve(mL,mKF,ublas::lower_tag());
     //TODO: make one line
     matrixd DD(p,p);
     DD = prod(trans(mKF),mKF);
     utils::add_to_diagonal(DD,mInvVarW);
     utils::cholesky_decompose(DD,mD);

     // vn = L^{-1} y
     vectord vn = mData.mY;
     inplace_solve(mL,vn,ublas::lower_tag());

     // The data term of the right-hand side is F K^{-1} y, which equals
     // (L^{-1} F^T)^T (L^{-1} y) = mKF^T vn. Multiplying the raw feature
     // matrix by vn would only give F L^{-1} y and would be inconsistent
     // with the system matrix DD built above.
     mWMap = prod(trans(mKF),vn) + utils::ublas_elementwise_prod(mInvVarW,mW0);
     utils::cholesky_solve(mD,mWMap,ublas::lower());

     // Whitened residual of the data around the fitted mean function.
     mVf = mData.mY - prod(trans(mMean.mFeatM),mWMap);
     inplace_solve(mL,mVf,ublas::lower_tag());

     if (boost::math::isnan(mWMap(0)))
       {
     throw std::runtime_error("Error in precomputed prediction. NaN found.");
       }
   }

 } //namespace bayesopt
bayesopt::GaussianProcessNormal::prediction
ProbabilityDistribution * prediction(const vectord &query)
Function that returns the prediction of the GP for a query point in the hypercube [0...
Definition: gaussian_process_normal.cpp:64

bayesopt::KernelRegressor::computeCorrMatrix
matrixd computeCorrMatrix()
Computes the Correlation (Kernel or Gram) matrix.
Definition: kernelregressor.hpp:192

bayesopt::GaussianDistribution::setMeanAndStd
void setMeanAndStd(double mean, double std)
Sets the mean and std of the distribution.
Definition: gauss_distribution.hpp:44

bayesopt::GaussianProcessNormal::precomputePrediction
void precomputePrediction()
Precompute some values of the prediction that do not depend on the query.
Definition: gaussian_process_normal.cpp:116

bayesopt
Namespace of the library interface.
Definition: using.dox:1

ublas_elementwise.hpp
Elementwise operations for ublas vector/matrix.

bayesopt::KernelRegressor::mL
matrixd mL
Cholesky decomposition of the Correlation matrix.
Definition: kernelregressor.hpp:104

bayesopt::GaussianProcessML::d_
GaussianDistribution * d_
Predictive distributions.
Definition: gaussian_process_ml.hpp:81

gauss_distribution.hpp
Gaussian probability distribution.

bayesopt::utils::ublas_elementwise_prod
v1 ublas_elementwise_prod(const v1 &a, const v2 &b)
Computes the elementwise product of two vectors or matrices.
Definition: ublas_elementwise.hpp:40

bayesopt::GaussianProcessNormal::negativeLogLikelihood
double negativeLogLikelihood()
Computes the negative log likelihood and its gradient of the data.
Definition: gaussian_process_normal.cpp:93

bayesopt::NonParametricProcess::mSigma
double mSigma
Signal variance.
Definition: nonparametricprocess.hpp:102

bayesopt::utils::cholesky_decompose
size_t cholesky_decompose(const MATRIX &A, TRIA &L)
Decompose the symmetric positive definite matrix A into the product L L^T.
Definition: ublas_cholesky.hpp:57

bayesopt::utils::cholesky_solve
void cholesky_solve(const TRIA &L, MATRIX &x, ublas::lower)
solve system L L^T x = b inplace
Definition: ublas_cholesky.hpp:222

bayesopt::MeanModel::mFeatM
matrixd mFeatM
Value of the mean features at the input points.
Definition: mean_functors.hpp:153

bayesopt::Dataset::mY
vectord mY
Data values.
Definition: dataset.hpp:64

gaussian_process_normal.hpp
Gaussian process with normal prior on the parameters.