developer-doc/html/_kernel_functions_8cpp_source.html

 /* +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++

    Copyright (c) 2013 The plumed team

    (see the PEOPLE file at the root of the distribution for a list of names)


    See http://www.plumed-code.org for more information.


    This file is part of plumed, version 2.0.


    plumed is free software: you can redistribute it and/or modify

    it under the terms of the GNU Lesser General Public License as published by

    the Free Software Foundation, either version 3 of the License, or

    (at your option) any later version.


    plumed is distributed in the hope that it will be useful,

    but WITHOUT ANY WARRANTY; without even the implied warranty of

    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

    GNU Lesser General Public License for more details.


    You should have received a copy of the GNU Lesser General Public License

    along with plumed.  If not, see <http://www.gnu.org/licenses/>.

 +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ */

 #include "KernelFunctions.h"

 #include "IFile.h"

 #include <iostream>

 #include <cmath>


 namespace PLMD {


 //+PLUMEDOC INTERNAL kernelfunctions

 /*

 Functions that are used to construct histograms


 Constructing histograms is something you learnt to do relatively early in life. You perform an experiment a number of times,

 count the number of times each result comes up and then draw a bar graph that describes how often each of the results came up.

 This only works when there are a finite number of possible results.  If the result is a number between 0 and 1 the bar chart is

 less easy to draw as there are as many possible results as there are numbers between zero and one - an infinite number.

 To resolve this problem we replace probability, \f$P\f$ with probability density, \f$\pi\f$, and write the probability of getting

 a number between \f$a\f$ and \f$b\f$ as:


 \f[

 P = \int_{a}^b \textrm{d}x \pi(x)

 \f]


 To calculate probability densities from a set of results we use a process called kernel density estimation.

 Histograms are accumulated by adding up kernel functions, \f$K\f$, with finite spatial extent, that integrate to one.

 These functions are centered on each of the \f$n\f$-dimensional data points, \f$\mathbf{x}_i\f$. The overall effect of this

 is that each result we obtain in our experiments contributes to the probability density in a finite sized region of the space.


 Expressing all this mathematically in kernel density estimation we write the probability density as:


 \f[

 \pi(\mathbf{x}) =  \sum_i K\left[ (\mathbf{x} - \mathbf{x}_i)^T \Sigma (\mathbf{x} - \mathbf{x}_i) \right]

 \f]


 where \f$\Sigma\f$ is an \f$n \times n\f$ matrix called the bandwidth that controls the spatial extent of

 the kernel. Whenever we accumulate a histogram (e.g. in \ref HISTOGRAM or in \ref METAD) we use this

 technique.


 There is thus some flexibility in the particular function we use for \f$K[\mathbf{r}]\f$ in the above.

 The following variants are available.


 <table align=center frame=void width=95%% cellpadding=5%%>

 <tr>

 <td> TYPE </td> <td> FUNCTION </td>

 </tr> <tr>

 <td> gaussian </td> <td> \f$f(r) = \frac{1}{(2 \pi)^{n/2} \sqrt{|\Sigma^{-1}|}} \exp\left(-0.5 r^2 \right)\f$ </td>

 </tr> <tr>

 <td> triangular </td> <td> \f$f(r) = \frac{3}{V} ( 1 - | r | )H(1-|r|) \f$ </td>

 </tr> <tr>

 <td> uniform </td> <td> \f$f(r) = \frac{1}{V}H(1-|r|)\f$ </td>

 </tr>

 </table>


 In the above \f$H(y)\f$ is a function that is equal to one when \f$y>0\f$ and zero when \f$y \le 0\f$. \f$n\f$ is

 the dimensionality of the vector \f$\mathbf{x}\f$ and \f$V\f$ is the volume of an ellipse in an \f$n\f$ dimensional

 space which is given by:


 \f{eqnarray*}{

 V &=& | \Sigma^{-1} | \frac{ \pi^{\frac{n}{2}} }{\left( \frac{n}{2} \right)! } \qquad \textrm{for even} \quad n \\

 V &=& | \Sigma^{-1} | \frac{ 2^{\frac{n+1}{2}} \pi^{\frac{n-1}{2}} }{ n!! } \qquad \textrm{for odd} \quad n

 \f}


 In \ref METAD the normalization constants are ignored so that the value of the function at \f$r=0\f$ is equal

 to one.  In addition in \ref METAD we must be able to differentiate the bias in order to get forces.  This limits

 the kernels we can use in this method.

 */

 //+ENDPLUMEDOC


 // Construct a kernel function.
 //   at           : stored as the center of the kernel
 //   sig          : stored as the width; read element-wise when the kernel is diagonal and
 //                  through getMatrix() when it is multivariate
 //   type         : "GAUSSIAN"/"gaussian", "UNIFORM"/"uniform" or "TRIANGULAR"/"triangular";
 //                  anything else triggers plumed_merror
 //   multivariate : true selects the non-diagonal (full matrix) treatment of the width
 //   w            : the weight of the kernel; it is used directly as the height when norm is false
 //   norm         : when true the height is set to w divided by the kernel's normalisation volume
 KernelFunctions::KernelFunctions( const std::vector<double>& at, const std::vector<double>& sig, const std::string& type, const bool multivariate, const double& w, const bool norm ):
 center(at),
 width(sig)
 {
   diagonal=!multivariate;

   // Setup the kernel type
   if(type=="GAUSSIAN" || type=="gaussian"){
       ktype=gaussian;
   } else if(type=="UNIFORM" || type=="uniform"){
       ktype=uniform;
   } else if(type=="TRIANGULAR" || type=="triangular"){
       ktype=triangular;
   } else {
       plumed_merror(type+" is an invalid kernel type\n");
   }

   if( !norm ){
     height=w;
     return;
   }

   const unsigned ncv=ndim();

   // det is the product of the widths for a diagonal kernel and the determinant of the
   // inverse of the matrix returned by getMatrix() for a multivariate one.
   double det;
   if(diagonal){
      det=1; for(unsigned i=0;i<width.size();++i) det*=width[i];
   } else {
      Matrix<double> mymatrix( getMatrix() ), myinv( ncv, ncv );
      Invert(mymatrix,myinv); double logd;
      logdet( myinv, logd );
      det=std::exp(logd);
   }

   double volume;
   if( ktype==gaussian ){
      // For a diagonal kernel det is squared here so that the square root below recovers the
      // product of the widths.  This extra multiplication must NOT be applied to a multivariate
      // kernel: there width holds matrix elements, and det is already the determinant whose
      // square root is required.
      if(diagonal){
         for(unsigned i=0;i<width.size();++i) det*=width[i];
      }
      volume=pow( 2*pi, 0.5*ncv ) * pow( det, 0.5 );
   } else if( ktype==uniform || ktype==triangular ){
      // Volume of the unit ball in ncv dimensions.
      if( ncv%2==1 ){
         // Double factorial ncv!! = 1*3*5*...*ncv (the upper bound is inclusive).
         double dfact=1;
         for(unsigned i=1;i<=ncv;i+=2) dfact*=static_cast<double>(i);
         volume=( pow( pi, (ncv-1)/2 ) ) * ( pow( 2., (ncv+1)/2 ) ) / dfact;
      } else {
         // Factorial (ncv/2)! = 1*2*...*(ncv/2) (the upper bound is inclusive).
         double fact=1.;
         for(unsigned i=1;i<=ncv/2;++i) fact*=static_cast<double>(i);
         volume=pow( pi,ncv/2 ) / fact;
      }
      if(ktype==uniform) volume*=det;
      // NOTE(review): the factor 3 follows the documented 3/V prefactor; the integral of
      // (1-|r|) over a unit n-ball is V/(n+1), so this looks exact only for n=2 -- confirm.
      else if(ktype==triangular) volume*=det / 3.;
   } else {
      plumed_merror("not a valid kernel type");
   }
   height=w / volume;
 }


 // Return the cutoff distance associated with a single width value.
 // Triangular and uniform kernels return the width itself; a gaussian returns
 // sqrt(2*6.25) times the width.  Any other kernel type raises plumed_merror.
 double KernelFunctions::getCutoff( const double& width ) const {
   if( ktype==triangular || ktype==uniform ) return width;

   if( ktype==gaussian ){
      const double dp2cutoff=6.25;
      return sqrt(2.0*dp2cutoff)*width;
   }

   plumed_merror("No valid kernel type");
   return 0.0;
 }


 // Return, for each of the ndim() directions, the cutoff distance of the kernel.
 // Diagonal kernels apply getCutoff() to each width in turn.  Multivariate kernels invert the
 // matrix from getMatrix(), diagonalise the inverse, and use the largest eigenvalue together
 // with the matching entries of the eigenvector matrix to obtain an extent per direction.
 std::vector<double> KernelFunctions::getContinuousSupport( ) const {
   unsigned ncv=ndim();
   std::vector<double> support( ncv );
   if(diagonal){
      for(unsigned i=0;i<ncv;++i) support[i]=getCutoff(width[i]);
   } else {
      Matrix<double> mymatrix( getMatrix() ), myinv( ncv,ncv );
      Invert(mymatrix,myinv);
      Matrix<double> myautovec(ncv,ncv); std::vector<double> myautoval(ncv);
      diagMat(myinv,myautoval,myautovec);

      // Locate the largest eigenvalue.  The index starts at 0 so that it is well defined even
      // when no eigenvalue is strictly positive (previously it was left uninitialised and then
      // used to index myautovec).
      double maxautoval=0.;
      unsigned ind_maxautoval=0;
      for (unsigned i=0;i<ncv;i++){
          if(myautoval[i]>maxautoval){maxautoval=myautoval[i];ind_maxautoval=i;}
      }

      // NOTE(review): myautovec(i,ind_maxautoval) is taken to be component i of the eigenvector
      // belonging to the largest eigenvalue -- confirm against the layout used by diagMat.
      for(unsigned i=0;i<ncv;++i){
          double extent=fabs(sqrt(maxautoval)*myautovec(i,ind_maxautoval));
          support[i]=getCutoff( extent );
      }
   }
   return support;
 }


 // Express the continuous support as a count of intervals of size dx[i] in each direction,
 // rounding up.  dx must contain exactly ndim() entries.
 std::vector<unsigned> KernelFunctions::getSupport( const std::vector<double>& dx ) const {
   plumed_assert( ndim()==dx.size() );
   std::vector<unsigned> nsteps( dx.size() );
   std::vector<double> extent=getContinuousSupport( );
   for(unsigned k=0;k<dx.size();++k){
       const double ratio=extent[k]/dx[k];
       nsteps[k]=static_cast<unsigned>( ceil( ratio ) );
   }
   return nsteps;
 }


 // Evaluate the kernel at the position given by pos and return its value.
 //   pos         : one Value per dimension; must have ndim() entries
 //   derivatives : output, must have ndim() entries; overwritten with the derivative of the
 //                 kernel with respect to each coordinate
 //   usederiv    : only consulted by the debug-build check that a uniform kernel is not
 //                 being differentiated
 double KernelFunctions::evaluate( const std::vector<Value*>& pos, std::vector<double>& derivatives, bool usederiv ) const {
   plumed_dbg_assert( pos.size()==ndim() && derivatives.size()==ndim() );
 #ifndef NDEBUG
   if( usederiv ) plumed_massert( ktype!=uniform, "step function can not be differentiated" );
 #endif

   // r2 accumulates the squared scaled distance from the center; derivatives temporarily
   // holds the metric applied to the displacement, i.e. half the gradient of r2.
   double r2=0;
   if(diagonal){
      for(unsigned i=0;i<ndim();++i){
          derivatives[i]=-pos[i]->difference( center[i] ) / width[i];
          r2+=derivatives[i]*derivatives[i];
          derivatives[i] /= width[i];
      }
   } else {
      Matrix<double> mymatrix( getMatrix() );
      // Displacements are computed once per dimension rather than once per matrix element.
      // The sign matches the diagonal branch above; without the negation the two branches
      // returned derivatives of opposite sign for an equivalent diagonal metric.
      // NOTE(review): assumes the matrix is ndim() x ndim(), as the other members of this
      // class do when they invert it -- confirm.
      std::vector<double> dp( ndim() );
      for(unsigned i=0;i<ndim();++i) dp[i]=-pos[i]->difference( center[i] );
      for(unsigned i=0;i<mymatrix.nrows();++i){
         derivatives[i]=0;
         for(unsigned j=0;j<mymatrix.ncols();++j){
           derivatives[i]+=mymatrix(i,j)*dp[j];
           r2+=dp[i]*dp[j]*mymatrix(i,j);
         }
      }
   }

   // kval is the kernel value; kderiv is the factor that turns the half-gradient of r2 stored
   // in derivatives into the gradient of the kernel.
   double kderiv=0., kval=0.;
   if(ktype==gaussian){
      kval=height*std::exp(-0.5*r2); kderiv=-kval;
   } else {
      const double r=sqrt(r2);
      if(ktype==triangular){
         if( r<1.0 ){
             kval=height*( 1. - r );
             // d(1-r)/dx = -(1/r) * (half-gradient of r2).  At r==0 the half-gradient is zero,
             // so the derivative is set to zero instead of dividing by zero (which gave NaN).
             kderiv=( r>0. ) ? -height / r : 0.;
         } else {
             kval=0.; kderiv=0.;
         }
      } else if(ktype==uniform){
         // A step function: flat everywhere, so the derivative factor is exactly zero
         // (previously 0*height/r, which is NaN at r==0).
         kderiv=0.;
         if(r<1.0) kval=height;
         else kval=0;
      } else {
          plumed_merror("Not a valid kernel type");
      }
   }
   for(unsigned i=0;i<ndim();++i) derivatives[i]*=kderiv;
   return kval;
 }


 // Read one kernel from ifile and return it as a newly allocated, un-normalised gaussian
 // KernelFunctions object (the caller receives the raw pointer).
 // The "multivariate" field selects the layout that follows:
 //   "false" : for every name in valnames, the center field <name> and the width field sigma_<name>
 //   "true"  : for every name, the center field <name> followed by the sigma_<a>_<b> fields of one
 //             diagonal of a lower-triangular matrix; that matrix is multiplied by its mirror
 //             image, the product is inverted, and the upper triangle of the inverse is stored
 //             row by row as the width
 // Any other value of the flag raises plumed_merror.  The "height" field is read last.
 KernelFunctions* KernelFunctions::read( IFile* ifile, const std::vector<std::string>& valnames ){
   std::string flag;
   ifile->scanField("multivariate",flag);

   std::vector<double> centre( valnames.size() );
   std::vector<double> sigma;
   bool multivariate;

   if( flag=="true" ){
      multivariate=true;
      const unsigned ncv=valnames.size();
      sigma.resize( (ncv*(ncv+1))/2 );
      Matrix<double> upper(ncv,ncv), lower(ncv,ncv);
      for(unsigned shift=0;shift<ncv;++shift){
          ifile->scanField(valnames[shift],centre[shift]);
          // Walk along the diagonal that sits `shift` places below the main one.
          for(unsigned row=shift;row<ncv;++row){
              const unsigned col=row-shift;
              ifile->scanField("sigma_" +valnames[row] + "_" + valnames[col], lower(row,col) );
              upper(col,row)=lower(row,col);
          }
      }
      Matrix<double> product( ncv, ncv ), inverse(ncv,ncv);
      mult(lower,upper,product);
      Invert( product, inverse );
      // Pack the upper triangle of the inverse, row by row.
      unsigned slot=0;
      for(unsigned row=0;row<ncv;++row){
          for(unsigned col=row;col<ncv;++col) sigma[slot++]=inverse(row,col);
      }
   } else if( flag=="false" ){
      multivariate=false;
      sigma.resize( valnames.size() );
      for(unsigned n=0;n<valnames.size();++n){
          ifile->scanField(valnames[n],centre[n]);
          ifile->scanField("sigma_"+valnames[n],sigma[n]);
      }
   } else {
       plumed_merror("multivariate flag should equal true or false");
   }

   double hh;
   ifile->scanField("height",hh);
   return new KernelFunctions( centre, sigma, "gaussian", multivariate ,hh, false);
 }


 }

PLMD::KernelFunctions::uniform
Definition: KernelFunctions.h:37

PLMD::KernelFunctions::getSupport
std::vector< unsigned > getSupport(const std::vector< double > &dx) const
Get the support.
Definition: KernelFunctions.cpp:176

PLMD::KernelFunctions::read
static KernelFunctions * read(IFile *ifile, const std::vector< std::string > &valnames)
Read a kernel function from a file.
Definition: KernelFunctions.cpp:236

PLMD::Invert
int Invert(const Matrix< T > &A, Matrix< double > &inverse)
Definition: Matrix.h:246

PLMD::KernelFunctions::evaluate
double evaluate(const std::vector< Value * > &pos, std::vector< double > &derivatives, bool usederiv=true) const
Evaluate the kernel function.
Definition: KernelFunctions.cpp:184

PLMD::KernelFunctions::height
double height
The height of the kernel.
Definition: KernelFunctions.h:43

IFile.h

PLMD::KernelFunctions::getMatrix
Matrix< double > getMatrix() const
Convert the width into matrix form.
Definition: KernelFunctions.h:65

PLMD::Matrix::ncols
unsigned ncols() const
Return the number of columns.
Definition: Matrix.h:110

PLMD::KernelFunctions::getCutoff
double getCutoff(const double &width) const
Get the cutoff for a kernel.
Definition: KernelFunctions.cpp:144

DP2CUTOFF
#define DP2CUTOFF
Definition: MetaD.cpp:37

PLMD::KernelFunctions::getContinuousSupport
std::vector< double > getContinuousSupport() const
get it in continuous form
Definition: KernelFunctions.cpp:153

PLMD::KernelFunctions
Definition: KernelFunctions.h:32

PLMD::KernelFunctions::triangular
Definition: KernelFunctions.h:37

PLMD::KernelFunctions::ndim
unsigned ndim() const
Get the dimensionality of the kernel.
Definition: KernelFunctions.h:77

PLMD::KernelFunctions::center
std::vector< double > center
The center of the kernel function.
Definition: KernelFunctions.h:39

PLMD::mult
void mult(const Matrix< T > &A, const Matrix< T > &B, Matrix< T > &C)
Definition: Matrix.h:165

KernelFunctions.h

PLMD::KernelFunctions::ktype
enum PLMD::KernelFunctions::@4 ktype
What type of kernel are we using.

PLMD::Matrix::nrows
unsigned nrows() const
Return the number of rows.
Definition: Matrix.h:108

PLMD::KernelFunctions::width
std::vector< double > width
The width of the kernel.
Definition: KernelFunctions.h:41

PLMD::IFile
Class for input files.
Definition: IFile.h:40

w
void const char const char int double int double double int int double int double * w
Definition: Matrix.h:42

PLMD::KernelFunctions::diagonal
bool diagonal
Is the metric matrix diagonal.
Definition: KernelFunctions.h:35

PLMD::logdet
int logdet(const Matrix< T > &M, double &ldet)
Definition: Matrix.h:314

PLMD::diagMat
int diagMat(const Matrix< T > &A, std::vector< double > &eigenvals, Matrix< double > &eigenvecs)
Definition: Matrix.h:203

PLMD::pi
const double pi(3.141592653589793238462643383279502884197169399375105820974944592307)
PI.

PLMD::KernelFunctions::gaussian
Definition: KernelFunctions.h:37

PLMD::IFile::scanField
IFile & scanField(const std::string &, double &)
Read a double field.
Definition: IFile.cpp:121

PLMD::KernelFunctions::KernelFunctions
KernelFunctions(const std::vector< double > &at, const std::vector< double > &sig, const std::string &type, const bool multivariate, const double &w, const bool norm)
Definition: KernelFunctions.cpp:89

PLMD
Definition: Analysis.cpp:30

PLMD::Matrix< double >

PLMD::norm
T norm(const std::vector< T > &A)
Calculate the dot product between a vector and itself.
Definition: Matrix.h:61