Merge pull request stan-dev#510 from stan-dev/feature/issue-38-univariate-normal-distribution-on-sufficient-statistics

Bob Carpenter · web-flow · commit 52d5635c9d9d · 2017-03-21T12:40:43.000-04:00
Feature/issue 38 univariate normal distribution on sufficient statistics
diff --git a/stan/math/prim/scal.hpp b/stan/math/prim/scal.hpp
@@ -333,6 +333,8 @@
 #include <stan/math/prim/scal/prob/normal_log.hpp>
 #include <stan/math/prim/scal/prob/normal_lpdf.hpp>
 #include <stan/math/prim/scal/prob/normal_rng.hpp>
+#include <stan/math/prim/scal/prob/normal_sufficient_log.hpp>
+#include <stan/math/prim/scal/prob/normal_sufficient_lpdf.hpp>
 #include <stan/math/prim/scal/prob/pareto_ccdf_log.hpp>
 #include <stan/math/prim/scal/prob/pareto_cdf.hpp>
 #include <stan/math/prim/scal/prob/pareto_cdf_log.hpp>
diff --git a/stan/math/prim/scal/meta/max_size.hpp b/stan/math/prim/scal/meta/max_size.hpp
@@ -21,14 +21,26 @@ namespace stan {
   }
 
   template <typename T1, typename T2, typename T3, typename T4>
-  size_t max_size(const T1& x1, const T2& x2, const T3& x3, const T4& x4) {
+  size_t max_size(const T1& x1, const T2& x2, const T3& x3,
+                  const T4& x4) {  // returns the largest length() of x1..x4
     size_t result = length(x1);
     result = result > length(x2) ? result : length(x2);
     result = result > length(x3) ? result : length(x3);
     result = result > length(x4) ? result : length(x4);
     return result;
   }
 
+  /**
+   * Return the largest of the values that <code>length()</code>
+   * reports for the five arguments.
+   *
+   * @tparam T1 Type of first argument.
+   * @tparam T2 Type of second argument.
+   * @tparam T3 Type of third argument.
+   * @tparam T4 Type of fourth argument.
+   * @tparam T5 Type of fifth argument.
+   * @param x1 First argument.
+   * @param x2 Second argument.
+   * @param x3 Third argument.
+   * @param x4 Fourth argument.
+   * @param x5 Fifth argument.
+   * @return Maximum of the five lengths.
+   */
+  template <typename T1, typename T2, typename T3, typename T4,
+            typename T5>
+  size_t max_size(const T1& x1, const T2& x2, const T3& x3,
+                  const T4& x4, const T5& x5) {
+    size_t largest = length(x1);
+
+    const size_t size2 = length(x2);
+    if (size2 > largest)
+      largest = size2;
+
+    const size_t size3 = length(x3);
+    if (size3 > largest)
+      largest = size3;
+
+    const size_t size4 = length(x4);
+    if (size4 > largest)
+      largest = size4;
+
+    const size_t size5 = length(x5);
+    if (size5 > largest)
+      largest = size5;
+
+    return largest;
+  }
+
 }
 #endif
-
diff --git a/stan/math/prim/scal/prob/normal_lpdf.hpp b/stan/math/prim/scal/prob/normal_lpdf.hpp
@@ -29,15 +29,16 @@ namespace stan {
      *
      * <p>The result log probability is defined to be the sum of the
      * log probabilities for each observation/mean/deviation triple.
+     * @tparam T_y Underlying type of scalar in sequence.
+     * @tparam T_loc Type of location parameter.
+     * @tparam T_scale Type of scale parameter.
      * @param y (Sequence of) scalar(s).
      * @param mu (Sequence of) location parameter(s)
      * for the normal distribution.
      * @param sigma (Sequence of) scale parameters for the normal
      * distribution.
      * @return The log of the product of the densities.
      * @throw std::domain_error if the scale is not positive.
-     * @tparam T_y Underlying type of scalar in sequence.
-     * @tparam T_loc Type of location parameter.
      */
     template <bool propto,
               typename T_y, typename T_loc, typename T_scale>
diff --git a/stan/math/prim/scal/prob/normal_sufficient_log.hpp b/stan/math/prim/scal/prob/normal_sufficient_log.hpp
@@ -0,0 +1,43 @@
+#ifndef STAN_MATH_PRIM_SCAL_PROB_NORMAL_SUFFICIENT_LOG_HPP
+#define STAN_MATH_PRIM_SCAL_PROB_NORMAL_SUFFICIENT_LOG_HPP
+
+#include <stan/math/prim/scal/meta/return_type.hpp>
+#include <stan/math/prim/scal/prob/normal_sufficient_lpdf.hpp>
+
+namespace stan {
+  namespace math {
+
+    /**
+     * Forwards all arguments, together with the <code>propto</code>
+     * template argument, unchanged to
+     * <code>normal_sufficient_lpdf</code> and returns its result.
+     *
+     * @deprecated use <code>normal_sufficient_lpdf</code>
+     *
+     * @tparam propto Passed through as the <code>propto</code>
+     * template argument of <code>normal_sufficient_lpdf</code>.
+     * @tparam T_y Type of sample average parameter.
+     * @tparam T_s Type of sample squared errors parameter.
+     * @tparam T_n Type of sample size parameter.
+     * @tparam T_loc Type of location parameter.
+     * @tparam T_scale Type of scale parameter.
+     * @param y_bar (Sequence of) sample average(s).
+     * @param s_squared (Sequence of) sum(s) of sample squared errors.
+     * @param n_obs (Sequence of) sample size(s).
+     * @param mu (Sequence of) location parameter(s).
+     * @param sigma (Sequence of) scale parameter(s).
+     * @return The value returned by
+     * <code>normal_sufficient_lpdf</code>.
+     */
+    template <bool propto,
+              typename T_y, typename T_s, typename T_n,
+              typename T_loc, typename T_scale>
+    inline
+    typename return_type<T_y, T_s, T_loc, T_scale>::type
+    normal_sufficient_log(const T_y& y_bar, const T_s& s_squared,
+                          const T_n& n_obs, const T_loc& mu,
+                          const T_scale& sigma) {
+      return normal_sufficient_lpdf<propto, T_y, T_s, T_n,
+                                    T_loc, T_scale>(y_bar, s_squared,
+                                                    n_obs, mu, sigma);
+    }
+
+    /**
+     * Forwards all arguments unchanged to the overload of
+     * <code>normal_sufficient_lpdf</code> that takes no
+     * <code>propto</code> template argument and returns its result.
+     *
+     * @deprecated use <code>normal_sufficient_lpdf</code>
+     *
+     * @tparam T_y Type of sample average parameter.
+     * @tparam T_s Type of sample squared errors parameter.
+     * @tparam T_n Type of sample size parameter.
+     * @tparam T_loc Type of location parameter.
+     * @tparam T_scale Type of scale parameter.
+     * @param y_bar (Sequence of) sample average(s).
+     * @param s_squared (Sequence of) sum(s) of sample squared errors.
+     * @param n_obs (Sequence of) sample size(s).
+     * @param mu (Sequence of) location parameter(s).
+     * @param sigma (Sequence of) scale parameter(s).
+     * @return The value returned by
+     * <code>normal_sufficient_lpdf</code>.
+     */
+    template <typename T_y, typename T_s, typename T_n,
+              typename T_loc, typename T_scale>
+    inline
+    typename return_type<T_y, T_s, T_loc, T_scale>::type
+    normal_sufficient_log(const T_y& y_bar, const T_s& s_squared,
+                          const T_n& n_obs, const T_loc& mu,
+                          const T_scale& sigma) {
+      return normal_sufficient_lpdf<T_y, T_s, T_n,
+                                    T_loc, T_scale>(y_bar, s_squared,
+                                                    n_obs, mu, sigma);
+    }
+
+  }
+}
+#endif
diff --git a/stan/math/prim/scal/prob/normal_sufficient_lpdf.hpp b/stan/math/prim/scal/prob/normal_sufficient_lpdf.hpp
@@ -0,0 +1,176 @@
+#ifndef STAN_MATH_PRIM_SCAL_PROB_NORMAL_SUFFICIENT_LPDF_HPP
+#define STAN_MATH_PRIM_SCAL_PROB_NORMAL_SUFFICIENT_LPDF_HPP
+
+#include <stan/math/prim/scal/meta/return_type.hpp>
+#include <stan/math/prim/scal/prob/normal_lpdf.hpp>
+
+#include <stan/math/prim/scal/meta/OperandsAndPartials.hpp>
+#include <stan/math/prim/scal/meta/scalar_seq_view.hpp>
+#include <stan/math/prim/scal/err/check_consistent_sizes.hpp>
+#include <stan/math/prim/scal/err/check_finite.hpp>
+#include <stan/math/prim/scal/err/check_positive.hpp>
+#include <stan/math/prim/scal/err/check_nonnegative.hpp>
+#include <stan/math/prim/scal/fun/constants.hpp>
+#include <stan/math/prim/scal/fun/value_of.hpp>
+#include <stan/math/prim/scal/meta/include_summand.hpp>
+#include <stan/math/prim/scal/meta/VectorBuilder.hpp>
+#include <stan/math/prim/scal/meta/max_size.hpp>
+
+namespace stan {
+
+  namespace math {
+
+    /**
+     * The log of the normal density for the specified sufficient
+     * statistics (sample average(s), sum(s) of sample squared errors
+     * and sample size(s)) given the specified mean(s) and
+     * deviation(s).
+     * y_bar, s_squared, mu, or sigma can each be either
+     * a scalar, a std vector or Eigen vector.
+     * n_obs can be either a single int or an std vector of ints.
+     * Any vector inputs must be the same length.
+     *
+     * <p>The result log probability is defined to be the sum, over
+     * each y_bar/s_squared/n_obs/mean/deviation tuple, of
+     * <code>-n_obs * log(sqrt(2 * pi)) - n_obs * log(sigma)
+     * - (s_squared + n_obs * (y_bar - mu)^2) / (2 * sigma^2)</code>.
+     * If any argument has length zero the result is zero and no
+     * argument validation is performed.
+     *
+     * @tparam propto Forwarded to <code>include_summand</code> to
+     * decide which summands are accumulated.
+     * @tparam T_y Type of sample average parameter.
+     * @tparam T_s Type of sample squared errors parameter.
+     * @tparam T_n Type of sample size parameter.
+     * @tparam T_loc Type of location parameter.
+     * @tparam T_scale Type of scale parameter.
+     * @param y_bar (Sequence of) scalar(s) (sample average(s)).
+     * @param s_squared (Sequence of) sum(s) of sample squared errors
+     * @param n_obs (Sequence of) sample size(s)
+     * @param mu (Sequence of) location parameter(s)
+     * for the normal distribution.
+     * @param sigma (Sequence of) scale parameters for the normal
+     * distribution.
+     * @return The log of the product of the densities.
+     * @throw std::domain_error if either n_obs or sigma are not
+     * positive, if s_squared is negative or if any parameter is not
+     * finite.
+     */
+    template <bool propto,
+              typename T_y, typename T_s, typename T_n, typename T_loc,
+              typename T_scale>
+    typename return_type<T_y, T_s, T_loc, T_scale>::type
+    normal_sufficient_lpdf(const T_y& y_bar, const T_s& s_squared,
+                           const T_n& n_obs, const T_loc& mu,
+                           const T_scale& sigma) {
+      static const char*
+        function = "stan::math::normal_sufficient_lpdf(%1%)";
+      typedef typename
+        stan::partials_return_type<T_y, T_s, T_n, T_loc, T_scale>::type
+        T_partials_return;
+
+      using std::log;
+      using stan::is_constant_struct;
+      using stan::math::check_positive;
+      using stan::math::check_finite;
+      using stan::math::check_nonnegative;
+      using stan::math::check_consistent_sizes;
+      using stan::math::value_of;
+      using stan::math::include_summand;
+
+      // check if any vectors are zero length
+      if (!(stan::length(y_bar)
+            && stan::length(s_squared)
+            && stan::length(n_obs)
+            && stan::length(mu)
+            && stan::length(sigma)))
+        return 0.0;
+
+      // set up return value accumulator
+      T_partials_return logp(0.0);
+
+      // validate args (here done over var, which should be OK)
+      check_finite(function,
+                   "Location parameter sufficient statistic", y_bar);
+      check_finite(function,
+                   "Scale parameter sufficient statistic", s_squared);
+      check_nonnegative(function,
+                        "Scale parameter sufficient statistic", s_squared);
+      check_finite(function, "Number of observations", n_obs);
+      check_positive(function, "Number of observations", n_obs);
+      check_finite(function, "Location parameter", mu);
+      check_finite(function, "Scale parameter", sigma);
+      check_positive(function, "Scale parameter", sigma);
+      check_consistent_sizes(function,
+                             "Location parameter sufficient statistic",
+                             y_bar,
+                             "Scale parameter sufficient statistic",
+                             s_squared,
+                             "Number of observations", n_obs,
+                             "Location parameter", mu,
+                             "Scale parameter", sigma);
+      // check if no variables are involved and prop-to
+      if (!include_summand<propto, T_y, T_s, T_loc, T_scale>::value)
+        return 0.0;
+
+      // set up template expressions wrapping scalars into vector views;
+      // n_obs is not an operand, so the partials are numbered
+      // d_x1 = y_bar, d_x2 = s_squared, d_x3 = mu, d_x4 = sigma
+      OperandsAndPartials<T_y, T_s, T_loc, T_scale>
+        operands_and_partials(y_bar, s_squared, mu, sigma);
+
+      scalar_seq_view<const T_y> y_bar_vec(y_bar);
+      scalar_seq_view<const T_s> s_squared_vec(s_squared);
+      scalar_seq_view<const T_n> n_obs_vec(n_obs);
+      scalar_seq_view<const T_loc> mu_vec(mu);
+      scalar_seq_view<const T_scale> sigma_vec(sigma);
+      size_t N = max_size(y_bar, s_squared, n_obs, mu, sigma);
+
+      for (size_t i = 0; i < N; i++) {
+        const T_partials_return y_bar_dbl = value_of(y_bar_vec[i]);
+        const T_partials_return s_squared_dbl =
+          value_of(s_squared_vec[i]);
+        const T_partials_return n_obs_dbl = n_obs_vec[i];
+        const T_partials_return mu_dbl = value_of(mu_vec[i]);
+        const T_partials_return sigma_dbl = value_of(sigma_vec[i]);
+        // plain products instead of pow(): no dependence on an
+        // unqualified pow being in scope
+        const T_partials_return sigma_squared = sigma_dbl * sigma_dbl;
+        const T_partials_return y_bar_minus_mu = y_bar_dbl - mu_dbl;
+
+        if (include_summand<propto>::value)
+          logp += NEG_LOG_SQRT_TWO_PI * n_obs_dbl;
+
+        if (include_summand<propto, T_scale>::value)
+          logp -= n_obs_dbl * log(sigma_dbl);
+
+        // s_squared + n_obs * (y_bar - mu)^2, shared by the value and
+        // the sigma partial
+        const T_partials_return cons_expr =
+          (s_squared_dbl
+           + n_obs_dbl * (y_bar_minus_mu * y_bar_minus_mu));
+
+        logp -= cons_expr / (2 * sigma_squared);
+
+        // gradients
+        if (!is_constant_struct<T_y>::value
+            || !is_constant_struct<T_loc>::value) {
+          // partial w.r.t. y_bar; the partial w.r.t. mu is its negation
+          const T_partials_return common_derivative =
+            n_obs_dbl * (mu_dbl - y_bar_dbl) / sigma_squared;
+          if (!is_constant_struct<T_y>::value)
+            operands_and_partials.d_x1[i] += common_derivative;
+          if (!is_constant_struct<T_loc>::value)
+            operands_and_partials.d_x3[i] -= common_derivative;
+        }
+        if (!is_constant_struct<T_s>::value)
+          operands_and_partials.d_x2[i] -=
+            0.5 / sigma_squared;
+        if (!is_constant_struct<T_scale>::value)
+          operands_and_partials.d_x4[i]
+            += cons_expr / (sigma_squared * sigma_dbl)
+               - n_obs_dbl / sigma_dbl;
+      }
+      return operands_and_partials.value(logp);
+    }
+
+    /**
+     * Overload of <code>normal_sufficient_lpdf</code> that fixes the
+     * <code>propto</code> template argument to <code>false</code> and
+     * forwards every argument unchanged.
+     *
+     * @tparam T_y Type of sample average parameter.
+     * @tparam T_s Type of sample squared errors parameter.
+     * @tparam T_n Type of sample size parameter.
+     * @tparam T_loc Type of location parameter.
+     * @tparam T_scale Type of scale parameter.
+     * @param y_bar (Sequence of) sample average(s).
+     * @param s_squared (Sequence of) sum(s) of sample squared errors.
+     * @param n_obs (Sequence of) sample size(s).
+     * @param mu (Sequence of) location parameter(s).
+     * @param sigma (Sequence of) scale parameter(s).
+     * @return The value returned by
+     * <code>normal_sufficient_lpdf&lt;false&gt;</code>.
+     */
+    template <typename T_y, typename T_s, typename T_n,
+              typename T_loc, typename T_scale>
+    inline
+    typename return_type<T_y, T_s, T_loc, T_scale>::type
+    normal_sufficient_lpdf(const T_y& y_bar, const T_s& s_squared,
+                           const T_n& n_obs, const T_loc& mu,
+                           const T_scale& sigma) {
+      return normal_sufficient_lpdf<false, T_y, T_s, T_n,
+                                    T_loc, T_scale>(y_bar, s_squared,
+                                                    n_obs, mu, sigma);
+    }
+
+  }
+}
+#endif
diff --git a/test/prob/normal_sufficient/normal_sufficient_test.hpp b/test/prob/normal_sufficient/normal_sufficient_test.hpp
@@ -0,0 +1,114 @@
+// Arguments: Doubles, Doubles, Ints, Doubles, Doubles
+#include <stan/math/prim/scal.hpp>
+
+using std::vector;
+using std::numeric_limits;
+using stan::math::var;
+
+/**
+ * Distribution test fixture for
+ * <code>stan::math::normal_sufficient_lpdf</code>.
+ *
+ * Each parameter vector is ordered as
+ * (y_bar, s_squared, n_obs, mu, sigma).
+ */
+class AgradDistributionNormalSufficient : public AgradDistributionTest {
+public:
+  /**
+   * Append valid parameter vectors and the matching expected log
+   * probabilities.
+   *
+   * @param parameters Receives one 5-element vector per test case.
+   * @param log_prob Receives the expected log probability per case.
+   */
+  void valid_values(vector<vector<double> >& parameters,
+                    vector<double>& log_prob) {
+    vector<double> param(5);
+
+    // observed values: -0.1, 0.1
+    param[0] = 0;     // y_bar
+    param[1] = 0.02;  // s_squared
+    param[2] = 2;     // n_obs
+    param[3] = -2.3;  // mu
+    param[4] = 2.1;   // sigma
+    parameters.push_back(param);
+    log_prob.push_back(-4.52356581482502);  // expected log_prob
+
+    // observed values: 0, 1
+    param[0] = 0.5;  // y_bar
+    param[1] = 0.5;  // s_squared
+    param[2] = 2;    // n_obs
+    param[3] = 0;    // mu
+    param[4] = 1;    // sigma
+    parameters.push_back(param);
+    log_prob.push_back(-2.33787706640935);  // expected log_prob
+
+    // observed values: 0, 2
+    param[0] = 1;  // y_bar
+    param[1] = 2;  // s_squared
+    param[2] = 2;  // n_obs
+    param[3] = 1;  // mu
+    param[4] = 1;  // sigma
+    parameters.push_back(param);
+    log_prob.push_back(-2.83787706640935);  // expected log_prob
+
+    // observed values: 1, 2
+    param[0] = 1.5;  // y_bar
+    param[1] = 0.5;  // s_squared
+    param[2] = 2;    // n_obs
+    param[3] = -1;   // mu
+    param[4] = 3;    // sigma
+    parameters.push_back(param);
+    log_prob.push_back(-4.75732386596779);  // expected log_prob
+  }
+
+  /**
+   * Append (parameter index, invalid value) pairs.
+   *
+   * @param index Receives the position of the parameter to replace.
+   * @param value Receives the invalid value for that position.
+   */
+  void invalid_values(vector<size_t>& index,
+                      vector<double>& value) {
+    // y_bar, s_squared, n_obs: no entries are listed here
+
+    // mu
+    index.push_back(3U);
+    value.push_back(numeric_limits<double>::infinity());
+
+    index.push_back(3U);
+    value.push_back(-numeric_limits<double>::infinity());
+
+    // sigma
+    index.push_back(4U);
+    value.push_back(0.0);
+
+    index.push_back(4U);
+    value.push_back(-1.0);
+
+    index.push_back(4U);
+    value.push_back(-numeric_limits<double>::infinity());
+  }
+
+  /**
+   * Evaluate <code>normal_sufficient_lpdf</code> without a
+   * <code>propto</code> template argument; the sixth argument is
+   * ignored.
+   */
+  template <typename T_y, typename T_s, typename T_n,
+            typename T_loc, typename T_scale, typename T5>
+  typename stan::return_type<T_y, T_s, T_n, T_loc, T_scale>::type
+  log_prob(const T_y& y_bar, const T_s& s_squared, const T_n& n_obs,
+           const T_loc& mu, const T_scale& sigma,
+           const T5&) {
+    return stan::math::normal_sufficient_lpdf(y_bar, s_squared, n_obs,
+                                              mu, sigma);
+  }
+
+  /**
+   * Evaluate <code>normal_sufficient_lpdf</code> with the given
+   * <code>propto</code> template argument; the sixth argument is
+   * ignored.
+   */
+  template <bool propto,
+            typename T_y, typename T_s, typename T_n,
+            typename T_loc, typename T_scale, typename T5>
+  typename stan::return_type<T_y, T_s, T_n, T_loc, T_scale>::type
+  log_prob(const T_y& y_bar, const T_s& s_squared, const T_n& n_obs,
+           const T_loc& mu, const T_scale& sigma,
+           const T5&) {
+    return stan::math::normal_sufficient_lpdf<propto>(y_bar, s_squared,
+                                                      n_obs, mu, sigma);
+  }
+
+  /**
+   * Reference formula for the log density, written out directly:
+   * -n_obs * log(sigma)
+   * - (s_squared + n_obs * (y_bar - mu)^2) / (2 * sigma^2),
+   * with each normalizing summand guarded by
+   * <code>include_summand&lt;true, ...&gt;</code>. The sixth
+   * argument is ignored.
+   */
+  template <typename T_y, typename T_s, typename T_n,
+            typename T_loc, typename T_scale, typename T5>
+  typename stan::return_type<T_y, T_s, T_n, T_loc, T_scale>::type
+  log_prob_function(const T_y& y_bar, const T_s& s_squared,
+                    const T_n& n_obs,
+                    const T_loc& mu, const T_scale& sigma,
+                    const T5&) {
+    using stan::math::include_summand;
+    using stan::math::pi;
+    typename stan::return_type<T_y, T_s, T_n, T_loc, T_scale>::type lp(0.0);
+    if (include_summand<true, T_scale>::value)
+      lp -= n_obs * log(sigma);
+
+    // always included, independent of the guards above and below
+    lp -= (s_squared + n_obs * pow(y_bar - mu, 2)) / (2 * pow(sigma, 2));
+
+    // the constant is contributed once per observation, matching
+    // NEG_LOG_SQRT_TWO_PI * n_obs in normal_sufficient_lpdf
+    if (include_summand<true>::value)
+      lp -= n_obs * log(sqrt(2.0 * pi()));
+    return lp;
+  }
+};
+