hmc__functions_8cpp_source.html

 // Added these from Johnoel's code for the RNG below. Hopefully they play
 // nicely with everything else.

 #include <iostream>

 #include <vector>

 #include <cstdlib>

 #include <cmath>

 #include <fstream>

 #include <sstream>

 #include <stack>

 #include <queue>


 #ifndef __OPENCC__

 #include <random>

 #endif


 //#include "nuts_da.h"


 using std::cout;

 using std::endl;

 using std::vector;

 using std::ifstream;

 using std::istringstream;

 using std::pow;

 using std::stack;

 using std::queue;


 #include "admodel.h"

 #ifndef OPT_LIB

 #include <cassert>

 #endif


 /**
  * Compute the iteration at which the adaptation window starting at i ends.
  *
  * The window normally ends at i+aws. If the window after that (taken here
  * as ending 2*aws later) would reach or pass warmup-w3, the current window
  * is stretched to end exactly at warmup-w3 instead.
  *
  * @param i      Iteration at which the current window starts.
  * @param warmup Number of warmup iterations.
  * @param w1     Not used by this function.
  * @param aws    Current adaptation window size.
  * @param w3     Offset subtracted from warmup to get the last allowed window end.
  * @return The iteration at which the current window should end.
  */
 int function_minimizer::compute_next_window(int i, int warmup, int w1, int aws, int w3){
   const int last_end = warmup-w3;
   const int window_end = i+aws;
   // Already lands exactly on the final boundary: nothing to adjust.
   if(window_end == last_end)
     return(window_end);
   // Would the following window run into (or past) the final boundary?
   const int following_end = window_end+2*aws;
   return (following_end >= last_end) ? last_end : window_end;
 }


 /**
  * Tell whether iteration i lies in the slow adaptation phase.
  *
  * @param i      Iteration being tested.
  * @param warmup Number of warmup iterations.
  * @param w1     First iteration that counts as slow phase.
  * @param w3     Offset from the end of warmup; the slow phase ends at warmup-w3.
  * @return true when w1 <= i <= warmup-w3 and i < warmup.
  */
 bool function_minimizer::slow_phase(int i, int warmup, int w1, int w3)
 {
   // Still inside the initial fast window
   if(i < w1) return false;
   // Already inside the final fast window
   if(i > (warmup-w3)) return false;
   // Never during sampling
   return i < warmup;
 }


 // Strip out the model name given full path

 /**
  * Return the file name of a path without its directory and extension.
  *
  * Everything up to and including the last '/' or '\\' is dropped, then
  * everything from the last '.' of the remaining name onwards is dropped.
  * A '.' that only appears in the directory part is ignored.
  *
  * @param f NUL-terminated path; must not be a null pointer.
  * @return The bare file name, e.g. "model" for "/a/b/model.exe".
  */
 std::string function_minimizer::get_filename(const char* f) {
   const std::string path(f);
   const size_t sep = path.find_last_of("/\\");
   const std::string base =
     (sep == std::string::npos) ? path : path.substr(sep + 1);
   // Search for the extension dot in the base name only, so the result does
   // not depend on unsigned wrap-around when the last dot is in a directory.
   const size_t dot = base.find_last_of('.');
   // substr(0, npos) yields the whole base name when there is no dot.
   return base.substr(0, dot);
 }


 // This function is the heart of NUTS. It builds a single trajectory whose

 // length depends on input j. It keeps doubling in  direction v until

 // finished or a U-turn occurs.

 /**
  * Recursively build one subtree of depth j in direction v.
  *
  * For j==0 a single leapfrog step of size eps*v is taken from (y, p), which
  * leapfrog overwrites in place. For j>0 the function calls itself twice with
  * depth j-1: first from (y, p) and then, only if the first half is still
  * valid, from the outermost point in direction v (_thetaminus/_rminus when
  * v==-1, otherwise _thetaplus/_rplus). All results are returned through the
  * underscore-prefixed reference arguments.
  *
  * @param nvar  Length of the work vectors (local copies are sized 1..nvar).
  * @param gr    Passed to leapfrog; copied into _grprime at a valid leaf.
  * @param chd   Passed to leapfrog unchanged.
  * @param eps   Step size; multiplied by v before being handed to leapfrog.
  * @param p     Momentum of the starting point; overwritten by leapfrog.
  * @param y     Position of the starting point; overwritten by leapfrog.
  * @param gr2   Passed to leapfrog; copied into gr2_end and _gr2prime.
  * @param logu  Threshold compared against the new Hamiltonian value Ham.
  * @param v     Direction; the code takes the "left" branch when v == -1.
  * @param j     Remaining tree depth; 0 means take one leapfrog step.
  * @param H0    Reference Hamiltonian used in min(1, exp(Ham-H0)).
  * @param _thetaprime  Position of the current proposal.
  * @param _thetaplus   Position of the rightmost point of the tree.
  * @param _thetaminus  Position of the leftmost point of the tree.
  * @param _rplus       Momentum at the rightmost point.
  * @param _rminus      Momentum at the leftmost point.
  * @param _alphaprime  Sum of min(1, exp(Ham-H0)) over the leaves visited.
  * @param _nalphaprime Number of leaves contributing to _alphaprime.
  * @param _sprime      false once a divergence or the stop criterion is hit.
  * @param _nprime      Number of leaves with logu < Ham.
  * @param _nfevals     Incremented once per leapfrog step.
  * @param _divergent   Set at each leaf: Ham is NaN or logu > 1000+Ham.
  * @param rng          Random number generator used to pick the proposal.
  * @param gr2_end      Receives gr2 after the most recent leapfrog step.
  * @param _grprime     gr at the current proposal.
  * @param _gr2prime    gr2 at the current proposal.
  * @param _nllprime    Value returned by leapfrog at the current proposal.
  * @param _Hprime      Ham at the current proposal.
  * @param _parsaveprime Filled by initial_params::copy_all_values at a valid
  *                     leaf (presumably the model parameter values at the
  *                     proposal; confirm against copy_all_values).
  */
 void function_minimizer::build_tree(int nvar, dvector& gr, dmatrix& chd, double eps, dvector& p,
             dvector& y, dvector& gr2, double logu, int v, int j, double H0,
             dvector& _thetaprime, dvector& _thetaplus, dvector& _thetaminus,
             dvector& _rplus, dvector& _rminus,
             double& _alphaprime, int& _nalphaprime, bool& _sprime,
             int& _nprime, int& _nfevals, bool& _divergent,
             const random_number_generator& rng,
             dvector& gr2_end, dvector& _grprime, dvector& _gr2prime, double& _nllprime,
             double& _Hprime, independent_variables& _parsaveprime) {

   if (j==0) {
     // Take a single step in direction v from points p,y, which are updated
     // internally by reference and thus represent the new point.
     double nll= leapfrog(nvar, gr, chd, eps*v, p, y, gr2);
     // These are the NLL and gradients at the last point
     // evaluated, saved via reference, so I don't have to
     // recalculate them when starting a new trajectory.
     gr2_end=gr2;
     // The new Hamiltonian value. ADMB returns negative log density so
     // correct it
     double Ham=-(nll+0.5*norm2(p));

     // Check for divergence. Either numerical (nll is nan) or a big
     // difference in H. Screws up all the calculations so catch it here.
     _divergent = (std::isnan(Ham) || logu > 1000+Ham);
     if(_divergent){
       // Mark the subtree invalid and contribute nothing to the counters.
       _sprime=0;
       _alphaprime=0; // these will be NaN otherwise
       _nprime=0;
     } else {
       // No divergence
       // bool -> int: 1 when this leaf satisfies logu < Ham, else 0.
       _nprime = logu < Ham;
       _sprime=1;
       _alphaprime = min(1.0, exp(Ham-H0));
       // Update the tree elements, which are returned by reference in
       // leapfrog. A one-leaf tree has the same point as proposal, leftmost
       // and rightmost point.
       _thetaprime = y;
       _thetaminus = y;
       _rminus = p;
       _thetaplus = y;
       _rplus = p;
       _grprime=gr; _gr2prime=gr2; _nllprime=nll; _Hprime=Ham;
       initial_params::copy_all_values(_parsaveprime,1.0);
     }
     // One leaf, one function evaluation, whether or not it diverged.
     _nalphaprime=1;
     _nfevals++;
   } else { // j > 0
     // Build first half of tree.
     build_tree(nvar, gr, chd, eps, p, y, gr2, logu, v, j-1,
          H0, _thetaprime,  _thetaplus, _thetaminus, _rplus, _rminus,
          _alphaprime, _nalphaprime, _sprime,
          _nprime, _nfevals, _divergent, rng,
          gr2_end, _grprime, _gr2prime, _nllprime, _Hprime, _parsaveprime);
     // If valid trajectory, build second half.
     if (_sprime == 1) {
       // Save copies of the global ones due to rerunning build_tree below
       // which will overwrite some of the global variables we need to
       // save. These are the ' versions of the paper, e.g., sprime'.
       // The vectors are allocated first and then assigned.
       dvector thetaprime0(1,nvar);
       independent_variables parsaveprime0(1,nvar);
       dvector gr2prime0(1,nvar); dvector grprime0(1,nvar);
       double nllprime0, Hprime0;
       dvector thetaplus0(1,nvar);
       dvector thetaminus0(1,nvar);
       dvector rplus0(1,nvar);
       dvector rminus0(1,nvar);
       thetaprime0=_thetaprime;
       parsaveprime0=_parsaveprime;
       grprime0=_grprime;
       gr2prime0=_gr2prime;
       nllprime0=_nllprime;
       Hprime0=_Hprime;
       thetaplus0=_thetaplus;
       thetaminus0=_thetaminus;
       rplus0=_rplus;
       rminus0=_rminus;
       int nprime0 = _nprime;
       double alphaprime0 = _alphaprime;
       int nalphaprime0 = _nalphaprime;

       // Make subtree to the left
       if (v == -1) {
   // Note that _rminus/_thetaminus are passed both as the starting point
   // (p, y) and as output references, so they are advanced in place.
   build_tree(nvar, gr, chd, eps, _rminus, _thetaminus, gr2, logu, v, j-1,
        H0, _thetaprime,  _thetaplus, _thetaminus, _rplus, _rminus,
        _alphaprime, _nalphaprime, _sprime,
        _nprime, _nfevals, _divergent, rng,
        gr2_end, _grprime, _gr2prime, _nllprime, _Hprime, _parsaveprime);
   // Update the leftmost point
   rminus0=_rminus;
   thetaminus0=_thetaminus;
   // Reset rightmost tree
   _thetaplus=thetaplus0;
   _rplus=rplus0;
       } else {
   // Make subtree to the right
   // Same aliasing as above, with _rplus/_thetaplus as the starting point.
   build_tree(nvar, gr, chd, eps, _rplus, _thetaplus, gr2, logu, v, j-1,
        H0, _thetaprime,  _thetaplus, _thetaminus, _rplus, _rminus,
        _alphaprime, _nalphaprime, _sprime,
        _nprime, _nfevals, _divergent, rng,
        gr2_end, _grprime, _gr2prime, _nllprime, _Hprime, _parsaveprime);
   // Update the rightmost point
   rplus0=_rplus;
   thetaplus0=_thetaplus;
   // Reset leftmost tree
   _thetaminus=thetaminus0;
   _rminus=rminus0;
       }

       // This is (n'+n''). Can be zero so need to be careful??
       int nprime_temp = nprime0 + _nprime;
       // NOTE(review): nprime_temp is an int, so the value cast to double is
       // never NaN and this check can never fire.
       if(std::isnan(static_cast<double>(nprime_temp))) nprime_temp=0;
       // Choose whether to keep the proposal thetaprime.
       // The random draw happens even when nprime_temp is zero.
       double rr=randu(rng); // runif(1)
       if (nprime_temp != 0 && rr < double(_nprime)/double(nprime_temp)) {
   // Update theta prime to be the new proposal for this tree so far.
   // _thetaprime already updated globally above so do nothing
       } else {
   // Reject it for the proposal from the last doubling.
   _thetaprime = thetaprime0;
   _parsaveprime=parsaveprime0;
   _grprime=grprime0;
   _gr2prime=gr2prime0;
   _nllprime=nllprime0;
   _Hprime=Hprime0;
       }

       // Update the global reference variables
       _alphaprime = alphaprime0 + _alphaprime;
       _nalphaprime = nalphaprime0 + _nalphaprime;
       // s' from the first execution above is 1 by definition (inside this
       // if statement), while _sprime is s''. So need to reset s':
       bool b = stop_criterion(nvar, thetaminus0, thetaplus0, rminus0, rplus0);
       _sprime = _sprime && b;
       _nprime = nprime_temp;
     } // end building second trajectory
   }   // end recursion branch (j>0)
 }     // end function


 bool function_minimizer::stop_criterion(int nvar, dvector& thetaminus, dvector& thetaplus,

           dvector& rminus, dvector& rplus)

 {

   dvector thetavec(1, nvar);

   thetavec=thetaplus-thetaminus;

   // Manual implementation of inner_product, equivalent to this

   // criterion = (thetavec*rminus+thetavec*rminus>=0) *

   //            (thetavec*rplus+thetavec*rplus>=0);

   double x1=0;

   double x2=0;

   for(int i=1; i<=nvar; i++){

     x1+=thetavec(i)*rminus(i);

     x2+=thetavec(i)*rplus(i);

   }

   // TRUE if both are TRUE, FALSE if at least one.

   bool criterion = (x1 >=0) && (x2 >=0);

   return criterion;

 }


 /**
  * One dual-averaging update of the step size.
  *
  * Writes element ii+1 of Hbar, epsvec and epsbar from element ii of Hbar and
  * epsbar, and returns the new epsvec entry.
  *
  * @param ii          Index of the previous entry; entry ii+1 is written.
  * @param iseps       Adaptation iteration counter used in the weights.
  * @param eps         Not used by this function.
  * @param alpha       Acceptance statistic; NaN is treated as 0.
  * @param adapt_delta Target value that alpha is compared against.
  * @param mu          Value the log step size is shrunk towards.
  * @param epsvec      Step sizes; entry ii+1 is written.
  * @param epsbar      Averaged step sizes; entry ii is read, ii+1 written.
  * @param Hbar        Running statistic; entry ii is read, ii+1 written.
  * @return epsvec(ii+1), the step size to use next.
  */
 double function_minimizer::adapt_eps(int ii, int iseps, double eps, double alpha,
              double& adapt_delta, double& mu,
              dvector& epsvec, dvector& epsbar,
              dvector& Hbar){
   // Tuning constants of the scheme
   const double gamma=0.05;
   const double t0=20;
   const double kappa=0.75;
   const int prev=ii;
   const int cur=ii+1;
   // If divergence, there is 0 acceptance probability so alpha=0.
   if(std::isnan(alpha)) alpha=0;
   const double denom=iseps+t0;
   Hbar(cur)= (1-1/denom)*Hbar(prev) + (adapt_delta-alpha)/denom;
   const double log_eps=mu-sqrt(iseps)*Hbar(cur)/gamma;
   epsvec(cur)=exp(log_eps);
   // Weight given to the newest log step size in the running average
   const double weight=pow(iseps, -kappa);
   const double log_eps_bar= weight*log_eps+(1-weight)*log(epsbar(prev));
   epsbar(cur)=exp(log_eps_bar);
   return(epsvec(cur));
 }


 double function_minimizer::get_hybrid_monte_carlo_value(int nvar, const independent_variables& y,dvector& g)

 {

   //initial_params::xinit(x);

   double f=0.0;

   if (mcmc2_flag==0 && lapprox)

     {

       cerr << "HMC not implemented for random effects models" << endl;

       ad_exit(1);

     }

   else

     {

       dvariable vf=0.0;

       dvar_vector vx=dvar_vector(y);

       vf=initial_params::reset(vx);

       *objective_function_value::pobjfun=0.0;

       userfunction();

       dvar_vector d(1,nvar);

       initial_params::stddev_vscale(d,vx);

       vf-=sum(log(d));

       vf+=*objective_function_value::pobjfun;

       f=value(vf);

       gradcalc(nvar,g);

     }

   return f;

 }


 /**
  * Print one progress line for the chain when one is due.
  *
  * A line is printed on the first iteration, the last iteration and every
  * refresh-th iteration. Nothing is printed when refresh <= 0.
  *
  * @param is      Current iteration.
  * @param nmcmc   Total number of iterations.
  * @param nwarmup Iterations up to and including this one are labelled Warmup.
  * @param chain   Chain number shown in the line prefix.
  * @param refresh Reporting interval; values <= 0 disable output.
  */
 void function_minimizer::print_mcmc_progress(int is, int nmcmc, int nwarmup, int chain, int refresh)
 {
   // Modified from Stan: sample::progress.hpp; 9/9/2016
   if(refresh<=0) return;
   const bool due = (is==1) || (is == nmcmc) || (is % refresh ==0);
   if(!due) return;
   // Field width: one more than the rounded-up base-10 log of nmcmc
   const int width=1+(int)std::ceil(std::log10(static_cast<double>(nmcmc)));
   const int percent=int(100.0 * (double(is) / double(nmcmc) ));
   const char* phase=(is <= nwarmup ? " (Warmup)" : " (Sampling)");
   cout << "Chain " << chain << ": " << "Iteration: " << std::setw(width) << is
        << "/" << nmcmc << " [" << std::setw(3)
        << percent
        << "%]" << phase << endl;
 }


 /**
  * Print the elapsed warmup, sampling and total time of a chain.
  *
  * Times are given in seconds and converted to the largest unit that the
  * total exceeds: seconds up to 60 s, minutes up to 1 h, hours up to 24 h,
  * days beyond that. Each line also shows the share of the total.
  *
  * @param time_warmup Seconds spent in warmup.
  * @param time_total  Seconds spent in total.
  * @param chain       Chain number shown in the line prefix.
  */
 void function_minimizer::print_mcmc_timing(double time_warmup, double time_total, int chain) {
   const double minute=60;
   const double hour=60*60;
   const double day=24*60*60;
   double time_sampling=time_total-time_warmup;
   std::string title= "Elapsed Time: ";
   std::string title2="Chain " + std::to_string(chain) + ": ";
   std::string u; // units
   // Depending on how long it ran convert to sec/min/hour/days so
   // the outputs are interpretable
   if(time_total<=minute){
     u=" seconds";
   } else if(time_total<=hour){
     time_total/=minute; time_sampling/=minute; time_warmup/=minute;
     u=" minutes";
   } else if(time_total<=day){
     // The upper bound used to be 360*24 s (2.4 hours), which sent runs of
     // 2.4 to 24 hours to the "days" branch.
     time_total/=hour; time_sampling/=hour; time_warmup/=hour;
     u=" hours";
   } else {
     time_total/=day; time_sampling/=day; time_warmup/=day;
     u=" days";
   }
   cout << title2 << title; printf("%5.2f", time_warmup); cout << u << " (Warmup   | ";
   printf("%.0f", 100*(time_warmup/time_total)); cout << "%)" << endl;
   cout << title2 << std::string(title.size(), ' '); printf("%5.2f", time_sampling);
   cout  << u << " (Sampling | " ;
   printf("%.0f", 100*(time_sampling/time_total)); cout <<"%)" << endl;
   cout << title2 << std::string(title.size(), ' '); printf("%5.2f", time_total);
   cout  << u << " (Total    | 100%)";
   cout << endl;
 }


 // This function holds the position (y) and momentum (p) vectors fixed and

 // takes a single step of size eps. This process repeats until a reasonable

 // eps is found. Thus need to make sure y and p are constant and only eps

 // changes.

 double function_minimizer::find_reasonable_stepsize(int nvar, dvector y, dvector p, dmatrix& chd,

                 bool verbose_adapt_mass, bool verbose_find_epsilon,

                 int chain)

 {

   double eps=1;        // initial eps

   independent_variables z(1,nvar); // rotated bounded parameters

   dvector p2(1,nvar);   // updated momentum

   dvector y2(1,nvar);   // updated position

   dvector gr(1,nvar);      // gradients

   dvector gr2(1,nvar);    // updated rotated gradient


   // Calculate initial Hamiltonian value

   double pprob1=0.5*norm2(p);

   z=rotate_pars(chd,y);

   double nllbegin=get_hybrid_monte_carlo_value(nvar,z,gr);

   dvector gr2begin=rotate_gradient(gr,chd); // rotated gradient

   double H1=nllbegin+pprob1;


   // Calculate H after a single step of size eps

   double nll2=leapfrog(nvar, gr, chd, eps, p2, y2, gr2);

   double pprob2=0.5*norm2(p2);

   double H2=nll2+pprob2;

   double alpha=exp(H1-H2);

   // Determine whether eps=1 is too big or too small, i.e. whether to halve

   // or double. If a=1, then eps keeps doubling until alpha passes 0.5;

   // otherwise it halves until that happens.

   double a;

   if(alpha < 0.5 || std::isnan(alpha)){

     // If divergence occurs or eps too big, halve it

     a=-1;

   } else {

     // If stepsize too small, double it

     a=1;

   }


   for(int k=2; k<50; k++){

     if(verbose_find_epsilon){

       cout << "Chain " << chain <<  ": Find epsilson: iteration=" << k-1 << "; eps=" << eps << "; NLL1=" << nllbegin << "; p1=" << pprob1 << "; H1=" << H1 <<

   "; NLL2=" << nll2 << "; p2=" << pprob2 <<"; H2=" << H2<< "; alpha=" << alpha << endl;

     }

     // Reinitialize position and momentum at each step.

     p2=p;

     y2=y;

     gr2=gr2begin;


     // Make one leapfrog step and check acceptance ratio

     nll2=leapfrog(nvar, gr, chd, eps, p2, y2, gr2);

     pprob2=0.5*norm2(p2);

     H2=nll2+pprob2;

     alpha=exp(H1-H2);


     // Check if the 1/2 threshold has been crossed

     if(!std::isnan(alpha) && pow(alpha,a) < pow(2,-a)){

       if(verbose_find_epsilon){

   cout << "Chain " << chain <<  ": Final epsilson: iteration=" << k << "; eps=" << eps << "; NLL1=" << nllbegin << "; p1=" << pprob1 << "; H1=" << H1 <<

     "; NLL2=" << nll2 << "; p2=" << pprob2 <<"; H2=" << H2<< "; alpha=" << alpha << endl;

       }

       if(verbose_adapt_mass) {cout << "Chain " << chain << ": Found reasonable step size of " << eps << endl;}

       return(eps);

     } else {

       // Otherwise either halve or double eps and do another iteration

       eps=pow(2,a)*eps;

     }

   }

   cerr << "Chain " << chain <<": Final epsilson: iteration=" << 50 << "; eps=" << eps << "; NLL1=" << nllbegin << "; p1=" << pprob1 << "; H1=" << H1 <<

     "; NLL2=" << nll2 << "; p2=" << pprob2 <<"; H2=" << H2<< "; alpha=" << alpha << endl;

   cerr << "Chain " << chain << ": Could not find reasonable initial step size. Is something wrong with model/initial value?" << endl;

   ad_exit(1);

   return(eps); // dummy to avoid compile warnings

 } // end of function


 double function_minimizer::leapfrog(int nvar, dvector& gr, dmatrix& chd, double eps, dvector& p, dvector& x,

             dvector& gr2)

 {

   independent_variables y(1,nvar); // bounded parameters

   dvector phalf;

   // Update momentum by half step

   phalf=p-eps/2*gr2;

   // Update parameters by full step

   x+=eps*phalf;

   // Transform parameters via mass matrix to get new gradient

   y=rotate_pars(chd,x);

   // Get NLL and set updated gradient in gr by reference

   double nll=get_hybrid_monte_carlo_value(nvar,y,gr);

   // Update gradient via mass matrix

   gr2=rotate_gradient(gr, chd);

   // Last half step for momentum

   p=phalf-eps/2*gr2;

   return(nll);

 }


 // This function reads in the hessian file to get the MLE values at the

 // end. This is needed when the user doesn't pass an initial vector with

 // -mcpin b/c the model is not necessarily run with -est. With adnuts it is

 // not by default so need a default starting value.

 void function_minimizer::read_mle_hmc(int nvar, dvector& mle) {

   int debug = 0;//flag to print debugging info to terminal

   adstring tmpstring = "admodel.hes";

   uistream cif((char*)tmpstring);

   if (!cif) {

     cerr << "Error reading admodel.hes file to get MLE values. Try re-optimizing model." << endl;

     ad_exit(1);

   }

   int tmp_nvar = 0;

   cif >> tmp_nvar;

   if (nvar !=tmp_nvar) {

 //    cerr << "The number of variables in admodel.hes " << tmp_nvar << " does not match " << nvar <<

 //   ". Try re-optimizing model." << endl;

 //    ad_exit(1);

       cout<<"NOTE: the number of active parameters ("<<nvar<<") does not equal the dimension in admodel.hes ("<<tmp_nvar<<")."<<endl;

       cout<<"      This could mean admodel.hes is old or random effects are in use."<<endl;

   }

   dmatrix hess(1,tmp_nvar,1,tmp_nvar);

   cif >> hess;

   if (!cif) {

     cerr << "Error reading the Hessian matrix from admodel.hes. Try re-optimizing model." << endl;

     ad_exit(1);

   } else {

       if (debug) cout<<"the hessian matrix"<<endl<<hess<<endl;

   }

   int oldHbf;

   cif >> oldHbf;

   if (!cif) {

     cerr << "Error reading the hybrid flag from admodel.hes. Try re-optimizing model." << endl;

     ad_exit(1);

   }

   dvector sscale(1,tmp_nvar);

   cif >> sscale;

   if (!cif) {

     cerr << "Error reading the transformation scales from admodel.hes. Try re-optimizing model." << endl;

     ad_exit(1);

   } else {

       if (debug) cout<<"sscale = "<<sscale<<endl;

   }

   // Read in the MLEs finally

   int temp=0;

   cif >> temp;

   if (debug) cout<<"flag = "<<temp<<endl;

   // temp is a unique flag to make sure the mle values were written (that

   // admodel.hes is not too old)

   if(temp != -987 || !cif){

     cerr << "Error reading the check value from admodel.hes. Try re-optimizing model." << endl;

     ad_exit(1);

   }

   cif >> mle;

   if (debug) cout<<"mle = "<<mle<<endl;

   if(!cif){

     cerr << "Error reading the bounded MLE values from admodel.hes. Try re-optimizing model." << endl;

     ad_exit(1);

   }

 }


 // Function written by Dave to help speed up some of the MCMC

 // calculations. The code has chd*x which rotates the space but

 // this is often a vector or at least a lower triangular

 // matrix. Thus we can make it more efficient. Can go from x to

 // y, or y to x, depending on if you pass m=chd or m=inverse(chd)

 /*

 @param


  */

 /**
  * Multiply the vector x by the matrix m, skipping known-zero entries.
  *
  * With diagonal_metric_flag==0 only columns up to and including the
  * diagonal are used for each row; with diagonal_metric_flag==1 only the
  * diagonal is used. Any other flag value is an error.
  *
  * @param m Matrix whose column bounds must match the bounds of x.
  * @param x Vector to rotate.
  * @return The product, indexed like the rows of m.
  */
 dvector function_minimizer::rotate_pars(const dmatrix& m, const dvector& x)
 {
   if (x.indexmin() != m.colmin() || x.indexmax() != m.colmax())
     {
       cerr << " Incompatible array bounds in "
   "dvector rotate_pars(const dmaxtrix& m, const dvector& x)\n";
       ad_exit(21);
     }

   const int row_lo=m.rowmin();
   const int row_hi=m.rowmax();
   const int col_lo=x.indexmin();
   dvector rotated(row_lo,row_hi);

   switch(diagonal_metric_flag){
   case 0:
     // Dense metric: walk each row from its first column up to the diagonal
     // with raw pointers.
     for (int r=row_lo; r<=row_hi; r++)
       {
   const double* mrow= &(m(r,col_lo));
   const double* xval= &(x(col_lo));
   double acc=0.0;
   for (int c=col_lo; c<=r; c++)
     {
       acc+= *mrow++ * *xval++;
     }
   rotated[r]=acc;
       }
     break;
   case 1:
     // Diagonal metric: off-diagonals are zero, so skip them completely
     for (int r=row_lo; r<=row_hi; r++)
       {
   rotated[r]= m(r,r) * x(r);
       }
     break;
   default:
     cerr << "Invalid value for diagonal_metric_flag in rotate_pars" << endl;
     ad_exit(21);
   }
   return(rotated);
 }


 // See help for rotate_pars above, it's the same except rotating a gradient

 // vector rather than a par vector (although math is different)

 /**
  * Multiply the gradient x by the transpose of the matrix m, skipping
  * known-zero entries.
  *
  * With diagonal_metric_flag==0 element j of the result is the sum of
  * x(i)*m(i,j) over i from j to the last index, i.e. only entries on or
  * below the diagonal are used. With diagonal_metric_flag==1 only the
  * diagonal is used. Any other flag value is an error.
  *
  * @param x Gradient vector; its bounds must match the column bounds of m.
  * @param m Matrix to rotate with. The dense branch also indexes rows with
  *          the column range, so m is assumed square with matching bounds.
  * @return The rotated gradient, indexed like the columns of m.
  */
 dvector function_minimizer::rotate_gradient(const dvector& x, const dmatrix& m)
 {
   if (x.indexmin() != m.colmin() || x.indexmax() != m.colmax())
     {
       cerr << " Incompatible array bounds in "
   "dvector rotate_gradient(const dvector& x, const dmatrix& m)\n";
       ad_exit(21);
     }
   const int lo=m.colmin();
   const int hi=m.colmax();
   dvector rotated(lo,hi);
   if(diagonal_metric_flag==0){
     // Read the column entries straight from m instead of copying the whole
     // column into a temporary vector on every iteration. The terms are
     // added in the same order as before, starting at the diagonal.
     for (int j = lo; j <= hi; ++j)
       {
   double acc = x(j) * m(j,j);
   for (int i = j+1; i <= hi; ++i)
     {
       acc += x(i) * m(i,j);
     }
   rotated[j] = acc;
       }
   } else if(diagonal_metric_flag==1)
     {
       // Only the diagonal is nonzero
       for (int i=lo; i<=hi; i++)
   {
     rotated[i] = m(i,i) * x(i);
   }
     }else {
     cerr << "Invalid value for diagonal_metric_flag in rotate_gradient" << endl;
     ad_exit(21);
   }
   return(rotated);
 }


 void function_minimizer::add_sample_diag(const int nvar, int& n, dvector& m, dvector& m2,

             const independent_variables& q) {

   n++;

   //convert q to dvector ( better way to do this?)

   dvector aq(1,nvar);

   aq=q;

   dvector delta=aq - m;

   m += delta / n;

   m2 += elem_prod(aq-m, delta);

 }


 void function_minimizer::add_sample_dense(const int nvar, int& n, dvector& m, dmatrix& m2,

             const independent_variables& q) {

   n++;

   //convert q to dvector ( better way to do this?)

   dvector aq(1,nvar);

   aq=q;

   dvector delta=aq - m;

   m += delta / n;

   m2 += outer_prod(aq-m, delta);

 }


 /**
  * Compute the Cholesky factor of a mass matrix and the inverse of that
  * factor.
  *
  * Dense metric (diagonal_metric_flag==0): chd is obtained from
  * choleski_decomp_hmc and chdinv from inv(chd). If the decomposition fails,
  * chd is restored to its value on entry and chdinv is left untouched.
  *
  * Diagonal metric: chd gets the square roots of the diagonal of metric and
  * chdinv their reciprocals; all other entries are set to zero. A diagonal
  * entry that is not strictly positive is replaced by 1 with a warning, so
  * that neither a zero factor nor a division by zero can occur.
  *
  * @param nvar   Dimension of the matrices (indexed 1..nvar).
  * @param metric Mass matrix.
  * @param chd    Receives the Cholesky factor.
  * @param chdinv Receives the inverse of chd.
  * @return false only when the dense decomposition failed.
  */
 bool function_minimizer::calculate_chd_and_inverse(int nvar, const dmatrix& metric,
                dmatrix& chd, dmatrix& chdinv){

   if(diagonal_metric_flag==0){
     // Save copy before modifying it; only this branch can fail.
     dmatrix chd0(1,nvar,1,nvar);
     chd0=chd;
     // will fail if not positive definite
     const bool success = choleski_decomp_hmc(metric, chd); // cholesky decomp of mass matrix
     if(success){
       chdinv=inv(chd);
     } else {
       // wasn't positive definite so don't update it (better to
       // do diagonal?)), reset to original
       chd=chd0;
     }
     return(success);
   }

   // If diagonal, chd is just sqrt of diagonals and inverse the reciprocal
   chd.initialize(); chdinv.initialize();
   for(int i=1;i<=nvar;i++){
     // <=0 rather than <0: a zero entry would give chd=0 and chdinv=1/0.
     if(metric(i,i)<=0){
   cerr << "Element " << i << " of diagonal mass matrix was <=0... setting to 1 instead" << endl;
   chd(i,i)=1;
     } else{
   chd(i,i)=sqrt(metric(i,i));
     }
     chdinv(i,i)=1/chd(i,i);
   }
   return(true);
 }


 /* This function is a copy of choleski_decomp from dmat15.cpp,

  except tweaked for use with adaptive dense stepsize in HMC.  The

  main difference is that instead of exiting on error it gives a

  more informative error, also it returns a flag for whether it

  succeeded, and updates L by reference.  -Cole 3/2020


  @param metric A covariance matrix as estimated from warmup samples

  @param L A cholesky decomposed matrix

  @return A boolean whether algorithm succeeded, and L by reference


  */

 bool function_minimizer::choleski_decomp_hmc(const dmatrix& metric, dmatrix& L) {

   // kludge to deal with constantness

   dmatrix & M= * (dmatrix *) &metric;

   if (M.colsize() != M.rowsize())

   {

     cerr << "Error in choleski_decomp_hmc. Mass matrix not square" << endl;

     ad_exit(1);

   }

   int rowsave=M.rowmin();

   int colsave=M.colmin();

   M.rowshift(1);

   M.colshift(1);

   int n=M.rowmax();

   //   dmatrix L(1,n,1,n);

   // #ifndef SAFE_INITIALIZE

   L.initialize();

   // #endif


   int i,j,k;

   double tmp;

   bool success=true;

   adstring tmpstring = "Mass matrix not positive definite when updating dense mass matrix adaptation.";

   if (M(1,1)<=0) {success=false; return success;}

   // I didn't touch the actual algorithm

   L(1,1)=sqrt(M(1,1));

   for (i=2;i<=n;i++) {

     L(i,1)=M(i,1)/L(1,1);

   }

   for (i=2;i<=n;i++) {

     for (j=2;j<=i-1;j++) {

       tmp=M(i,j);

       for (k=1;k<=j-1;k++) {

         tmp-=L(i,k)*L(j,k);

       }

       L(i,j)=tmp/L(j,j);

     }

     tmp=M(i,i);

     for (k=1;k<=i-1;k++) {

       tmp-=L(i,k)*L(i,k);

     }

     if (tmp<=0) {success=false; return success;}

     L(i,i)=sqrt(tmp);

   }

   L.rowshift(rowsave);

   L.colshift(colsave);

   return success;

 }

adstring
Definition: adstring.hpp:70

function_minimizer::lapprox
laplace_approximation_calculator * lapprox
Definition: admodel.h:1862

log10
dvector log10(const dvector &vec)
Returns dvector with the common (base-10) logarithm of vec.
Definition: dvect6.cpp:273

elem_prod
d3_array elem_prod(const d3_array &a, const d3_array &b)
Returns d3_array results with computed elements product of a(i, j, k) * b(i, j, k).
Definition: d3arr2a.cpp:92

function_minimizer::rotate_pars
dvector rotate_pars(const dvector &m, const dvector &x)

function_minimizer::read_mle_hmc
void read_mle_hmc(int nvar, dvector &mle)
Definition: hmc_functions.cpp:432

x
#define x

dvector
Vector of double precision numbers.
Definition: dvector.h:50

function_minimizer::stop_criterion
bool stop_criterion(int nvar, dvector &thetaminus, dvector &thetaplus, dvector &rminus, dvector &rplus)
Definition: hmc_functions.cpp:214

dvector::indexmin
int indexmin() const
Get minimum valid index.
Definition: dvector.h:199

sum
double sum(const d3_array &darray)
Author: David Fournier Copyright (c) 2008-2012 Regents of the University of California.
Definition: d3arr.cpp:21

function_minimizer::compute_next_window
int compute_next_window(int i, int warmup, int w1, int aws, int w3)
Definition: hmc_functions.cpp:34

function_minimizer::print_mcmc_progress
void print_mcmc_progress(int is, int nmcmc, int nwarmup, int chain, int refresh)
Definition: hmc_functions.cpp:284

ad_exit
exitptr ad_exit
Definition: gradstrc.cpp:53

function_minimizer::choleski_decomp_hmc
bool choleski_decomp_hmc(const dmatrix &metric, dmatrix &L)
Definition: hmc_functions.cpp:686

initial_params::reset
static dvariable reset(const dvar_vector &x)
Definition: model.cpp:345

dvar_vector
ADMB variable vector.
Definition: fvar.hpp:2172

function_minimizer::leapfrog
double leapfrog(int nvar, dvector &gr, dmatrix &chd, double eps, dvector &p, dvector &x, dvector &gr2)
Function to take a single HMC leapfrog step, given current position and momentum variables.
Definition: hmc_functions.cpp:408

dmatrix::colsize
unsigned int colsize() const
Definition: fvar.hpp:2948

function_minimizer::rotate_gradient
dvector rotate_gradient(const dvector &x, const dmatrix &m)
Definition: hmc_functions.cpp:547

gradcalc
void gradcalc(int nvar, const dvector &g)
Definition: sgradclc.cpp:77

debug
static int debug
Definition: output_checks.cpp:234

function_minimizer::find_reasonable_stepsize
double find_reasonable_stepsize(int nvar, dvector y, dvector p, dmatrix &chd, bool verbose_adapt_mass, bool verbose_find_epsilon, int chain)
Definition: hmc_functions.cpp:331

extract_column
dvector extract_column(const dmatrix &matrix, int j)
Extract copy of jth column vector from matrix m.
Definition: dmat6.cpp:34

initial_params::stddev_vscale
static int stddev_vscale(const dvar_vector &d, const dvar_vector &x)
Definition: model.cpp:191

function_minimizer::calculate_chd_and_inverse
bool calculate_chd_and_inverse(int nvar, const dmatrix &metric, dmatrix &chd, dmatrix &chdinv)
Calculate the Cholesky decomposition and its inverse given a mass matrix.
Definition: hmc_functions.cpp:641

randu
double randu(const random_number_generator &rng)
Uniform random number generator.
Definition: rngen.cpp:198

random_number_generator
Description not yet available.
Definition: fvar.hpp:7951

endl
prnstream & endl(prnstream &)

independent_variables
Description not yet available.
Definition: fvar.hpp:1937

dmatrix::rowmax
int rowmax() const
Definition: fvar.hpp:2929

sqrt
d3_array sqrt(const d3_array &arr3)
Author: David Fournier Copyright (c) 2008-2012 Regents of the University of California.
Definition: d3arr2c.cpp:11

function_minimizer::get_hybrid_monte_carlo_value
double get_hybrid_monte_carlo_value(int nvar, const independent_variables &y, dvector &g)
Written by Dave, commented by Cole starting 8/31/2016 Description not yet available.
Definition: hmc_functions.cpp:258

min
#define min(a, b)
Definition: cbivnorm.cpp:188

dvector::indexmax
int indexmax() const
Get maximum valid index.
Definition: dvector.h:204

objective_function_value::pobjfun
static objective_function_value * pobjfun
Definition: admodel.h:2394

admodel.h
Description not yet available.

exp
d3_array exp(const d3_array &arr3)
Returns d3_array results with computed exp from elements in arr3.
Definition: d3arr2a.cpp:28

M
#define M
Definition: rngen.cpp:57

dmatrix::colmin
int colmin(void) const
Definition: fvar.hpp:2939

outer_prod
dmatrix outer_prod(const dvector &v1, const dvector &v2)
Description not yet available.
Definition: dmat23.cpp:17

dmatrix
Description not yet available.
Definition: fvar.hpp:2819

norm2
double norm2(const d3_array &a)
Return sum of squared elements in a.
Definition: d3arr2a.cpp:167

initial_params::copy_all_values
static void copy_all_values(const dvector &x, const int &ii)
Definition: model3.cpp:9

function_minimizer::adapt_eps
double adapt_eps(int ii, int iseps, double eps, double alpha, double &adapt_delta, double &mu, dvector &epsvec, dvector &epsbar, dvector &Hbar)
Definition: hmc_functions.cpp:234

function_minimizer::print_mcmc_timing
void print_mcmc_timing(double time_warmup, double time_total, int chain)
Definition: hmc_functions.cpp:298

function_minimizer::slow_phase
bool slow_phase(int is, int warmup, int w1, int w3)
Definition: hmc_functions.cpp:53

function_minimizer::mcmc2_flag
int mcmc2_flag
Definition: admodel.h:1885

dmatrix::rowshift
void rowshift(int min)
Changes the range of valid indices for the rows.
Definition: dmat9.cpp:48

pos
size_t pos(const adstring &substr, const adstring &s)
Definition: string3.cpp:56

eps
double eps
Definition: ftweak.cpp:13

dmatrix::colshift
void colshift(int min)
Description not yet available.
Definition: dmat9.cpp:68

dmatrix::rowsize
unsigned int rowsize() const
Definition: fvar.hpp:2934

uistream
Description not yet available.
Definition: fvar.hpp:3516

function_minimizer::diagonal_metric_flag
int diagonal_metric_flag
Definition: admodel.h:1887

column
dvector column(const dmatrix &matrix, int j)
Author: David Fournier Copyright (c) 2008-2012 Regents of the University of California.
Definition: dmat6.cpp:13

value
dvector value(const df1_one_vector &v)
Definition: df11fun.cpp:69

function_minimizer::userfunction
virtual void userfunction(void)=0

function_minimizer::get_filename
std::string get_filename(const char *f)
Definition: hmc_functions.cpp:63

function_minimizer::add_sample_dense
void add_sample_dense(const int nvar, int &is2, dvector &m, dmatrix &m2, const independent_variables &q)
Calculate running covariance using Welford's "online" algorithm.
Definition: hmc_functions.cpp:621

dmatrix::initialize
void initialize(void)
Author: David Fournier Copyright (c) 2008-2012 Regents of the University of California.
Definition: dmat7.cpp:12

dmatrix::rowmin
int rowmin() const
Definition: fvar.hpp:2925

function_minimizer::build_tree
void build_tree(int nvar, dvector &gr, dmatrix &chd, double eps, dvector &p, dvector &y, dvector &gr2, double logu, int v, int j, double H0, dvector &_thetaprime, dvector &_thetaplus, dvector &_thetaminus, dvector &_rplus, dvector &_rminus, double &_alphaprime, int &_nalphaprime, bool &_sprime, int &_nprime, int &_nfevals, bool &_divergent, const random_number_generator &rng, dvector &gr2_end, dvector &_grprime, dvector &_gr2prime, double &_nllprime, double &_Hprime, independent_variables &_parsaveprime)
Definition: hmc_functions.cpp:75

dvariable
Fundamental data type for reverse mode automatic differentiation.
Definition: fvar.hpp:1518

inv
df1_one_variable inv(const df1_one_variable &x)
Definition: df11fun.cpp:384

log
d3_array log(const d3_array &arr3)
Author: David Fournier Copyright (c) 2008-2012 Regents of the University of California.
Definition: d3arr2a.cpp:13

function_minimizer::add_sample_diag
void add_sample_diag(const int nvar, int &n, dvector &m, dvector &m2, const independent_variables &q)
Calculate running covariance using Welford's "online" algorithm.
Definition: hmc_functions.cpp:598

pow
d3_array pow(const d3_array &m, int e)
Description not yet available.
Definition: d3arr6.cpp:17

dmatrix::colmax
int colmax(void) const
Definition: fvar.hpp:2943