bayesopt/html/student__t__process__nig_8cpp_source.html

 /*
 -------------------------------------------------------------------------
    This file is part of BayesOpt, an efficient C++ library for
    Bayesian optimization.

    Copyright (C) 2011-2015 Ruben Martinez-Cantin <rmcantin@unizar.es>

    BayesOpt is free software: you can redistribute it and/or modify it
    under the terms of the GNU Affero General Public License as published by
    the Free Software Foundation, either version 3 of the License, or
    (at your option) any later version.

    BayesOpt is distributed in the hope that it will be useful, but
    WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
    GNU Affero General Public License for more details.

    You should have received a copy of the GNU Affero General Public License
    along with BayesOpt.  If not, see <http://www.gnu.org/licenses/>.
 ------------------------------------------------------------------------
 */

 #include <cstdlib>
 #include <boost/math/special_functions/fpclassify.hpp>
 #include <boost/numeric/ublas/banded.hpp>
 #include "log.hpp"
 #include "student_t_process_nig.hpp"
 #include "ublas_trace.hpp"
 #include "ublas_elementwise.hpp"
 #include "student_t_distribution.hpp"

 namespace bayesopt
 {

   namespace ublas = boost::numeric::ublas;

   // Builds the process on top of HierarchicalGaussianProcess and caches the
   // settings read from `params`:
   //   - mAlpha / mBeta   <- params.alpha / params.beta
   //   - mW0              <- params.mean.coef_mean
   //   - mInvVarW(k)      <- 1 / coef_std[k]^2
   // It also allocates the StudentTDistribution that prediction() returns.
   StudentTProcessNIG::StudentTProcessNIG(size_t dim, Parameters params,
                      const Dataset& data,
                      MeanModel& mean, randEngine& eng):
     HierarchicalGaussianProcess(dim,params,data, mean, eng),
     mAlpha(params.alpha), mBeta (params.beta),
     mW0(params.mean.coef_mean.size()), mInvVarW(params.mean.coef_mean.size()),
     mD(params.mean.coef_mean.size(),params.mean.coef_mean.size())
   {
     const size_t nCoef = params.mean.coef_mean.size();

     mW0 = params.mean.coef_mean;

     // Store the inverse variance of each coefficient.
     // NOTE(review): a zero entry in coef_std yields an infinite value here.
     for (size_t k = 0; k < nCoef; ++k)
       {
         const double variance = params.mean.coef_std[k] * params.mean.coef_std[k];
         mInvVarW(k) = 1/variance;
       }

     // Owned by this object; released in the destructor.
     d_ = new StudentTDistribution(eng);
   }


   // Destructor: frees the distribution object pointed to by d_.
   StudentTProcessNIG::~StudentTProcessNIG()
   {
     delete d_;
   } // Destructor


   // Evaluates the predictive distribution at `query`.
   //
   // Uses the quantities cached by precomputePrediction() (mL, mKF, mD,
   // mWMap, mVf, mSigma) to compute a mean and a standard deviation, stores
   // them in the member distribution d_ and returns a pointer to it. The
   // returned object is the same one on every call, so its contents are
   // overwritten by the next prediction.
   //
   // Throws std::runtime_error if either the mean or the standard deviation
   // evaluates to NaN.
   ProbabilityDistribution* StudentTProcessNIG::prediction(const vectord &query)
   {
     const double selfCorr = computeSelfCorrelation(query);
     const vectord crossCorr = computeCrossCorrelation(query);
     const vectord features = mMean.getFeatures(query);

     // v <- mL^{-1} * crossCorr (forward substitution on the lower factor).
     vectord v(crossCorr);
     inplace_solve(mL,v,ublas::lower_tag());

     // rho <- mD^{-1} * (features - v * mKF)
     vectord rho = features - prod(v,mKF);
     inplace_solve(mD,rho,ublas::lower_tag());

     const double yPred = inner_prod(features,mWMap) + inner_prod(v,mVf);

     const double scaledVariance =
       mSigma * (selfCorr - inner_prod(v,v) + inner_prod(rho,rho));
     // A negative variance produces NaN here and is caught just below.
     const double sPred = sqrt(scaledVariance);

     const bool foundNaN =
       boost::math::isnan(yPred) || boost::math::isnan(sPred);
     if (foundNaN)
       {
         throw std::runtime_error("Error in prediction. NaN found.");
       }

     d_->setMeanAndStd(yPred,sPred);
     return d_;
   }


   // Computes the negative log likelihood of the current data.
   //
   // Steps:
   //   1. Build KK = computeCorrMatrix() + F' * diag(mInvVarW) * F, where
   //      F = mMean.mFeatM.
   //   2. Decompose KK into its lower Cholesky factor BB.
   //   3. Solve BB * x = (mY - F' * mW0) in place and take zz = x' * x.
   //   4. Combine zz, mAlpha, mBeta and utils::log_trace(BB) into the
   //      returned value.
   //
   // The factors (n + 2*alpha)/2 and n/2 are evaluated in floating point.
   // Declaring n + 2*alpha as an integer truncates any fractional alpha, and
   // dividing integers by 2 drops 0.5 whenever the value is odd; both also
   // disagree with precomputePrediction(), which keeps n + 2*alpha in
   // floating point when computing mSigma.
   // NOTE(review): assumes mAlpha is a floating-point member - confirm in
   // the header.
   //
   // Returns the negative log likelihood as a double.
   double StudentTProcessNIG::negativeLogLikelihood()
   {
     matrixd KK = computeCorrMatrix();
     const size_t n = KK.size1();
     const size_t p = mMean.nFeatures();
     const double nalpha = n + 2*mAlpha;

     vectord v0 = mData.mY - prod(trans(mMean.mFeatM),mW0);
     matrixd WW = zmatrixd(p,p);  //TODO: diagonal matrix
     utils::add_to_diagonal(WW,mInvVarW);
     matrixd FW = prod(trans(mMean.mFeatM),WW);
     KK += prod(FW,mMean.mFeatM);
     matrixd BB(n,n);
     utils::cholesky_decompose(KK,BB);
     inplace_solve(BB,v0,ublas::lower_tag());
     const double zz = inner_prod(v0,v0);
     const double sigmaMap = (mBeta/mAlpha + zz)/nalpha;

     double lik = nalpha/2.0 * std::log(1+zz/(2*mBeta*sigmaMap));
     lik += utils::log_trace(BB);
     lik += n/2.0 * std::log(sigmaMap);
     return lik;
   }


   void StudentTProcessNIG::precomputePrediction()
   {
     size_t n = mData.getNSamples();
     size_t p = mMean.nFeatures();

     mKF = trans(mMean.mFeatM);
     inplace_solve(mL,mKF,ublas::lower_tag());
     //TODO: make one line
     matrixd DD(p,p);
     DD = prod(trans(mKF),mKF);
     utils::add_to_diagonal(DD,mInvVarW);
     utils::cholesky_decompose(DD,mD);

     vectord vn = mData.mY;
     inplace_solve(mL,vn,ublas::lower_tag());
     mWMap = prod(mMean.mFeatM,vn) + utils::ublas_elementwise_prod(mInvVarW,mW0);
     utils::cholesky_solve(mD,mWMap,ublas::lower());

     mVf = mData.mY - prod(trans(mMean.mFeatM),mWMap);
     inplace_solve(mL,mVf,ublas::lower_tag());

     vectord v0 = mData.mY - prod(trans(mMean.mFeatM),mW0);
     //TODO: check for "cheaper" version
     //matrixd KK = prod(mL,trans(mL));
     matrixd KK = computeCorrMatrix();
     matrixd WW = zmatrixd(p,p);  //TODO: diagonal matrix
     utils::add_to_diagonal(WW,mInvVarW);
     const matrixd FW = prod(trans(mMean.mFeatM),WW);
     KK += prod(FW,mMean.mFeatM);
     matrixd BB(n,n);
     utils::cholesky_decompose(KK,BB);
     inplace_solve(BB,v0,ublas::lower_tag());
     mSigma = (mBeta/mAlpha + inner_prod(v0,v0))/(n+2*mAlpha);

     int dof = static_cast<int>(n+2*mAlpha);

     if ((boost::math::isnan(mWMap(0))) || (boost::math::isnan(mSigma)))
       {
     throw std::runtime_error("Error in precomputed prediction. NaN found.");
       }


     if (dof <= 0)
       {
     dof = n;
     FILE_LOG(logERROR) << "ERROR: Incorrect alpha. Dof invalid."
                << "Forcing Dof <= num of points.";
       }

     d_->setDof(dof);
   }

 } //namespace bayesopt
bayesopt::KernelRegressor::computeCorrMatrix
matrixd computeCorrMatrix()
Computes the Correlation (Kernel or Gram) matrix.
Definition: kernelregressor.hpp:192

bayesopt
Namespace of the library interface.
Definition: using.dox:1

student_t_process_nig.hpp
Student's t process with Normal-Inverse-Gamma hyperprior on mean and signal variance parameters...

bayesopt::StudentTProcessJeffreys::d_
StudentTDistribution * d_
Predictive distributions.
Definition: student_t_process_jef.hpp:80

bayesopt::StudentTProcessNIG::prediction
ProbabilityDistribution * prediction(const vectord &query)
Function that returns the prediction of the GP for a query point in the hypercube [0...
Definition: student_t_process_nig.cpp:62

bayesopt::StudentTProcessNIG::precomputePrediction
void precomputePrediction()
Precompute some values of the prediction that do not depend on the query.
Definition: student_t_process_nig.cpp:117

ublas_elementwise.hpp
Elementwise operations for ublas vector/matrix.

bayesopt::StudentTDistribution::setMeanAndStd
void setMeanAndStd(double mean, double std)
Sets the mean and std of the distribution.
Definition: student_t_distribution.hpp:45

bayesopt::StudentTDistribution::setDof
void setDof(size_t dof)
Sets the degrees of freedom (dof) of the distribution.
Definition: student_t_distribution.hpp:51

bayesopt::KernelRegressor::mL
matrixd mL
Cholesky decomposition of the Correlation matrix.
Definition: kernelregressor.hpp:104

bayesopt::utils::ublas_elementwise_prod
v1 ublas_elementwise_prod(const v1 &a, const v2 &b)
Computes the elementwise product of two vectors or matrices.
Definition: ublas_elementwise.hpp:40

bayesopt::NonParametricProcess::mSigma
double mSigma
Signal variance.
Definition: nonparametricprocess.hpp:102

bayesopt::utils::cholesky_decompose
size_t cholesky_decompose(const MATRIX &A, TRIA &L)
Decompose the symmetric positive definite matrix A into the product L L^T.
Definition: ublas_cholesky.hpp:57

bayesopt::utils::cholesky_solve
void cholesky_solve(const TRIA &L, MATRIX &x, ublas::lower)
solve system L L^T x = b inplace
Definition: ublas_cholesky.hpp:222

log.hpp
Modules and helper macros for logging.

bayesopt::MeanModel::mFeatM
matrixd mFeatM
Value of the mean features at the input points.
Definition: mean_functors.hpp:153

bayesopt::StudentTProcessNIG::negativeLogLikelihood
double negativeLogLikelihood()
Computes the negative log likelihood and its gradient of the data.
Definition: student_t_process_nig.cpp:91

bayesopt::Dataset::mY
vectord mY
Data values.
Definition: dataset.hpp:64

student_t_distribution.hpp
Student's t probability distribution.

bayesopt::ProbabilityDistribution
Definition: prob_distribution.hpp:35