stan-dev · syclik · Nov 26, 2013 · Nov 1, 2013 · Nov 2, 2013 · Nov 11, 2013
diff --git a/src/docs/stan-reference/commands.tex b/src/docs/stan-reference/commands.tex
@@ -2147,8 +2147,9 @@ \section{Running the Print Command}
    accept_stat__   0.88  5.6e-03  1.8e-01  0.51  0.95   1.0   1000    16881   1.00
    stepsize__      0.30  1.3e-15  8.9e-16  0.30  0.30  0.30   0.50      8.5   1.00
    treedepth__      1.4  2.6e-02  8.0e-01  0.00   1.0   2.0    946    15978   1.00
+   n_divergence__  0.00  0.0e+00  0.0e+00  0.00   0.0   0.0   1000    16949   1.00
    alpha             17  1.8e+00  2.5e+01   1.9   9.5    50    181     3054   1.00
-   beta              10  1.1e+00  1.4e+01   1.2   6.2    31    181     3057    1.0
+   beta              10  1.1e+00  1.4e+01   1.2   6.2    31    181     3057   1.00
 
    Samples were drawn using hmc with nuts.
    For each parameter, N_Eff is a crude measure of effective sample size,
@@ -2168,7 +2169,10 @@ \section{Running the Print Command}
   step size used by NUTS in its Hamiltonian simulation, and
   \code{treedepth\_\_} is the depth of tree used by NUTS, which is the
   log (base 2) of the number of leapfrog steps taken during the
-  Hamiltonian simulation.  }\label{bin-print-eg.figure}
+  Hamiltonian simulation.  \code{n\_divergence\_\_} gives the number
+  of leapfrog iterations with diverging error; because NUTS terminates
+  at the first divergent iteration, this should always be either 0 or 1.}
+\label{bin-print-eg.figure}
 \end{figure}
 %\end{quote}
 %

diff --git a/src/docs/stan-reference/introduction.tex b/src/docs/stan-reference/introduction.tex
@@ -603,7 +603,7 @@ \subsubsection{Sampler Output}
 \begin{quote}
 \begin{Verbatim}[fontsize=\small]
 ...
-lp__,accept_stat__,stepsize__,treedepth__,theta
+lp__,accept_stat__,stepsize__,treedepth__,n_divergence__,theta
 ...
 \end{Verbatim}
 \end{quote}
@@ -630,6 +630,8 @@ \subsubsection{Sampler Output}
 \\
 \NUTS & \Verb| treedepth__  | & Tree depth
 \\
+\NUTS & \Verb| n_divergence__  | & Number of divergent iterations
+\\
 \end{tabular}
 \end{center}
 
@@ -661,27 +663,27 @@ \subsubsection{Sampler Output}
 \begin{quote}
 \begin{Verbatim}[fontsize=\small]
 ...
--6.85935,1,1.81311,0,0.194323
--6.85935,0.0001295,1.81311,0,0.194323
--6.79366,1,1.81311,0,0.288971
--6.77936,1,1.81311,0,0.282131
--6.77936,0.886654,1.81311,0,0.282131
--6.74812,1,1.81311,0,0.248232
--6.74812,0.0793306,1.81311,0,0.248232
--7.04438,0.777304,1.81311,0,0.353339
--7.04438,0.480879,1.81311,0,0.353339
--7.07619,0.849599,1.81311,0,0.158857
+-6.85935,1,1.81311,0,0,0.194323
+-6.85935,0.0001295,1.81311,0,0,0.194323
+-6.79366,1,1.81311,0,0,0.288971
+-6.77936,1,1.81311,0,0,0.282131
+-6.77936,0.886654,1.81311,0,0,0.282131
+-6.74812,1,1.81311,0,0,0.248232
+-6.74812,0.0793306,1.81311,0,0,0.248232
+-7.04438,0.777304,1.81311,0,0,0.353339
+-7.04438,0.480879,1.81311,0,0,0.353339
+-7.07619,0.849599,1.81311,0,0,0.158857
 ...
--6.74838,0.540129,1.81311,0,0.253368
--6.74838,0.638693,1.81311,0,0.253368
--6.74838,0.546,1.81311,0,0.253368
--7.01801,0.794591,1.81311,0,0.348376
--7.01801,0.0564743,1.81311,0,0.348376
--7.17267,0.863864,1.81311,0,0.375023
--6.86632,1,1.81311,0,0.192719
--6.86632,0.0077144,1.81311,0,0.192719
--8.21853,0.512368,1.81311,0,0.084075
--8.7342,0.862726,1.81311,0,0.0669754
+-6.74838,0.540129,1.81311,0,0,0.253368
+-6.74838,0.638693,1.81311,0,0,0.253368
+-6.74838,0.546,1.81311,0,0,0.253368
+-7.01801,0.794591,1.81311,0,0,0.348376
+-7.01801,0.0564743,1.81311,0,0,0.348376
+-7.17267,0.863864,1.81311,0,0,0.375023
+-6.86632,1,1.81311,0,0,0.192719
+-6.86632,0.0077144,1.81311,0,0,0.192719
+-8.21853,0.512368,1.81311,0,0,0.084075
+-8.7342,0.862726,1.81311,0,0,0.0669754
 ...
 \end{Verbatim}
 \end{quote}
@@ -735,6 +737,7 @@ \subsubsection{Summarizing Sampler Output}
 accept_stat__    0.64  1.2e-02  3.6e-01   5.1e-03  0.74   1.0    882    76898   1.00
 stepsize__        1.8  7.8e-15  5.6e-15   1.8e+00   1.8   1.8   0.50       44   1.00
 treedepth__     0.076  8.6e-03  2.7e-01   0.0e+00  0.00   1.0    942    82167   1.00
+n_divergence__   0.00  0.0e+00  0.0e+00   0.0e+00  0.00  0.00   1000    90909   1.00
 theta            0.25  4.2e-03  1.2e-01   9.0e-02  0.23  0.47    827    72146   1.00
 
 Samples were drawn using hmc with nuts.

diff --git a/src/stan/mcmc/hmc/nuts/base_nuts.hpp b/src/stan/mcmc/hmc/nuts/base_nuts.hpp
@@ -36,7 +36,7 @@ namespace stan {
 
       base_nuts(M &m, BaseRNG& rng, std::ostream* o, std::ostream* e):
       base_hmc<M, P, H, I, BaseRNG>(m, rng, o, e),
-      _depth(0), _max_depth(5), _max_delta(1000)
+      _depth(0), _max_depth(5), _max_delta(1000), _n_divergence(0)
       {};
 
       ~base_nuts() {};
@@ -88,12 +88,13 @@ namespace stan {
         int n_valid = 0;
 
         this->_depth = 0;
+        this->_n_divergence = 0;
+
+        util.n_tree = 0;
+        util.sum_prob = 0;
 
         while (util.criterion && (this->_depth <= this->_max_depth) ) {
 
-          util.n_tree = 0;
-          util.sum_prob = 0;
-
           // Randomly sample a direction in time
           ps_point* z = 0;
           Eigen::VectorXd* rho = 0;
@@ -156,21 +157,23 @@ namespace stan {
       }
 
       void write_sampler_param_names(std::ostream& o) {
-        o << "stepsize__,treedepth__,";
+        o << "stepsize__,treedepth__,n_divergence__,";
       }
 
       void write_sampler_params(std::ostream& o) {
-        o << this->_epsilon << "," << this->_depth << ",";
+        o << this->_epsilon << "," << this->_depth << "," << this->_n_divergence << ",";
       }
 
       void get_sampler_param_names(std::vector<std::string>& names) {
         names.push_back("stepsize__");
         names.push_back("treedepth__");
+        names.push_back("n_divergence__");
       }
 
       void get_sampler_params(std::vector<double>& values) {
         values.push_back(this->_epsilon);
         values.push_back(this->_depth);
+        values.push_back(this->_n_divergence);
       }
 
       virtual bool compute_criterion(ps_point& start, P& finish, Eigen::VectorXd& rho) = 0;
@@ -197,7 +200,8 @@ namespace stan {
           if (boost::math::isnan(h)) h = std::numeric_limits<double>::infinity();
 
           util.criterion = util.log_u + (h - util.H0) < this->_max_delta;
-
+          if (!util.criterion) ++(this->_n_divergence);
+
           util.sum_prob += stan::math::min(1, std::exp(util.H0 - h));
           util.n_tree += 1;
 
@@ -244,6 +248,8 @@ namespace stan {
       int _depth;
       int _max_depth;
       double _max_delta;
+
+      int _n_divergence;
 
     };
 

diff --git a/src/test/io/mcmc_writer_test.cpp b/src/test/io/mcmc_writer_test.cpp
@@ -52,7 +52,7 @@ TEST(StanIoMcmcWriter, print_sample_names) {
   std::string line;
   std::getline(sample_stream, line);
 
-  EXPECT_EQ("lp__,accept_stat__,stepsize__,treedepth__,mu1,mu2", line);
+  EXPECT_EQ("lp__,accept_stat__,stepsize__,treedepth__,n_divergence__,mu1,mu2", line);
 
 }
 
@@ -100,6 +100,7 @@ TEST(StanIoMcmcWriter, print_sample_params) {
   expected_stream << accept_stat << ",";
   expected_stream << sampler.get_current_stepsize() << ",";
   expected_stream << 0 << ",";
+  expected_stream << 0 << ",";
   expected_stream << real.at(0) << ",";
   expected_stream << real.at(1);
 
@@ -233,7 +234,7 @@ TEST(StanIoMcmcWriter, print_diagnostic_names) {
   std::getline(diagnostic_stream, line);
 
   // FIXME: make this work, too
-  EXPECT_EQ("lp__,accept_stat__,stepsize__,treedepth__,mu1,mu2,p_mu1,p_mu2,g_mu1,g_mu2", line);
+  EXPECT_EQ("lp__,accept_stat__,stepsize__,treedepth__,n_divergence__,mu1,mu2,p_mu1,p_mu2,g_mu1,g_mu2", line);
 
 }
 
@@ -285,6 +286,7 @@ TEST(StanIoMcmcWriter, print_diagnostic_params) {
   expected_stream << accept_stat << ",";
   expected_stream << sampler.get_current_stepsize() << ",";
   expected_stream << 0 << ",";
+  expected_stream << 0 << ",";
   expected_stream << real.at(0) << ",";
   expected_stream << real.at(1) << ",";
   expected_stream << 0 << ",";