complete the implementation of LaplacianInferenceMethodWithLBFGS
yorkerlin committed Mar 12, 2014
1 parent e8262c7 commit f2a43b5
Showing 2 changed files with 138 additions and 2 deletions.
133 changes: 133 additions & 0 deletions src/shogun/machine/gp/LaplacianInferenceMethodWithLBFGS.cpp
@@ -19,6 +19,7 @@
#ifdef HAVE_EIGEN3
#include <shogun/mathematics/Math.h>
#include <shogun/optimization/lbfgs/lbfgs.h>
#include <cstdio>

namespace shogun {

@@ -38,7 +39,139 @@ CLaplacianInferenceMethodWithLBFGS::CLaplacianInferenceMethodWithLBFGS(
CLaplacianInferenceMethodWithLBFGS::~CLaplacianInferenceMethodWithLBFGS() {
}

float64_t CLaplacianInferenceMethodWithLBFGS::evaluate(void *obj,
const float64_t *alpha,
float64_t *gradient,
const int dim,
const float64_t step) {
// Note that alpha = alpha_pre_iter - step * gradient_pre_iter
/* Unfortunately we cannot use dynamic_cast to cast the void* pointer to an
* object pointer; static_cast is used instead. Therefore, make sure this
* method stays private.
*/
CLaplacianInferenceMethodWithLBFGS * obj_prt
= static_cast<CLaplacianInferenceMethodWithLBFGS *>(obj);
float64_t * alpha_cast = const_cast<float64_t *>(alpha);
Eigen::Map<Eigen::VectorXd> eigen_alpha(alpha_cast, dim);
float64_t psi = 0.0;
obj_prt->get_psi_wrt_alpha(&eigen_alpha, &psi);
Eigen::Map<Eigen::VectorXd> eigen_gradient(gradient, dim);
obj_prt->get_gradient_wrt_alpha(&eigen_alpha, &eigen_gradient);
return psi;
}
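
As an aside (not part of this commit): the signature above is the evaluate callback contract of the bundled liblbfgs. A minimal self-contained sketch of that contract on a toy quadratic, assuming shogun's lbfgs.h exposes the float64_t-based API in namespace shogun that update_alpha below calls; toy_evaluate and toy_lbfgs_demo are made-up names:

#include <shogun/optimization/lbfgs/lbfgs.h>
#include <cstdio>

using namespace shogun;

// Toy objective f(x) = sum_i (x_i - 1)^2, gradient g_i = 2 * (x_i - 1).
static float64_t toy_evaluate(void* /*instance*/, const float64_t* x,
    float64_t* g, const int n, const float64_t /*step*/) {
  float64_t fx = 0.0;
  for (int i = 0; i < n; i++) {
    fx += (x[i] - 1.0) * (x[i] - 1.0);
    g[i] = 2.0 * (x[i] - 1.0);  // gradient is written in place
  }
  return fx;  // objective value at the current iterate
}

void toy_lbfgs_demo() {
  float64_t x[3] = {0.0, 0.0, 0.0};  // starting point, updated in place
  float64_t fx = 0.0;
  lbfgs_parameter_t param;
  lbfgs_parameter_init(&param);
  // ret == 0 on clean convergence; x should end up near (1, 1, 1).
  int ret = lbfgs(3, x, &fx, toy_evaluate, NULL, NULL, &param);
  printf("ret=%d fx=%g x=(%g, %g, %g)\n", ret, fx, x[0], x[1], x[2]);
}

The callback receives the current iterate as a read-only pointer and must write the gradient into g and return the objective value; the const_cast in evaluate above exists because Eigen::Map<Eigen::VectorXd> needs a mutable pointer to wrap alpha.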

void CLaplacianInferenceMethodWithLBFGS::update_alpha() {
float64_t psi_new;
float64_t psi_def;

// get mean vector and create eigen representation of it
SGVector<float64_t> mean_f = m_mean->get_mean_vector(m_features);
Eigen::Map<Eigen::VectorXd> eigen_mean_f(mean_f.vector, mean_f.vlen);

// create eigen representation of kernel matrix
Eigen::Map<Eigen::MatrixXd> eigen_ktrtr(m_ktrtr.matrix,
m_ktrtr.num_rows,
m_ktrtr.num_cols);

// create shogun and eigen representation of function vector
m_mu = SGVector<float64_t>(mean_f.vlen); // f
Eigen::Map<Eigen::VectorXd> eigen_mu(m_mu.vector, m_mu.vlen);

if (m_alpha.vlen != m_labels->get_num_labels()) {
// initialize alpha as a zero vector
m_alpha = SGVector<float64_t>(m_labels->get_num_labels());
m_alpha.zero();

// f = mean, if the lengths of alpha and y don't match
eigen_mu = eigen_mean_f;
psi_new = -SGVector<float64_t>::sum(m_model->get_log_probability_f(
m_labels, m_mu));
} else {
// compute f = K * alpha + m
Eigen::Map<Eigen::VectorXd> eigen_alpha(m_alpha.vector, m_alpha.vlen);
eigen_mu = eigen_ktrtr * (eigen_alpha * CMath::sq(m_scale)) + eigen_mean_f;

psi_new = eigen_alpha.dot(eigen_mu - eigen_mean_f) / 2.0 -
SGVector<float64_t>::sum(
m_model->get_log_probability_f(m_labels, m_mu)); // f

psi_def = -SGVector<float64_t>::sum(
m_model->get_log_probability_f(m_labels, mean_f)); // mean_f

// if the default (alpha = 0) is better, then use it
if (psi_def < psi_new) {
m_alpha.zero();
eigen_mu = eigen_mean_f; // f=mean_f
psi_new = psi_def;
}
}
Eigen::Map<Eigen::VectorXd> eigen_alpha(m_alpha.vector, m_alpha.vlen);
index_t dim = m_alpha.vlen;

// used for passing variables needed to compute the function value and gradient
m_shared.dim = dim;
m_shared.kernel = &eigen_ktrtr;
m_shared.mean_f = &eigen_mean_f;

lbfgs_parameter_t param;

/* Initialize the default parameters for the L-BFGS optimization. */
lbfgs_parameter_init(&param);
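/* The defaults can be tuned before the lbfgs() call below; for example
* (illustrative values only, not part of this commit):
*   param.m = 100;               // number of correction pairs kept
*   param.max_iterations = 1000; // hard cap on iterations
*   param.epsilon = 1e-5;        // gradient-norm convergence tolerance
*/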

/* In order to use the provided lbfgs function, we have to pass the object
* via a void* pointer, which the evaluate method casts back to an object
* pointer using static_cast.
* Therefore, make sure the evaluate method is a private method of the class.
* Because the evaluate method is defined in a class, we have to pass it to
* the lbfgs function as a static method.
* If we also use the progress method, make sure that method is static and
* private as well.
*/
void * obj_prt = static_cast<void *>(this);

int ret = lbfgs(m_alpha.vlen, m_alpha.vector, &psi_new,
CLaplacianInferenceMethodWithLBFGS::evaluate,
NULL, obj_prt, &param);
// clean up
m_shared.dim = 0;
m_shared.kernel = NULL;
m_shared.mean_f = NULL;

/* Note that ret should be zero if the minimization
* process terminates without an error.
* A non-zero value indicates an error.
*/
if (ret != 0) {
/*
* If an error occurred during the L-BFGS optimization, we fall back to the
* original Newton method.
*/
CLaplacianInferenceMethod::update_alpha();
return;
}

// compute f = K * alpha + m
eigen_mu = eigen_ktrtr * (eigen_alpha * CMath::sq(m_scale)) + eigen_mean_f;

// get log probability derivatives
dlp = m_model->get_log_probability_derivative_f(m_labels, m_mu, 1);
d2lp = m_model->get_log_probability_derivative_f(m_labels, m_mu, 2);
d3lp = m_model->get_log_probability_derivative_f(m_labels, m_mu, 3);

// W = -d2lp
W = d2lp.clone();
W.scale(-1.0);

// compute sW
Eigen::Map<Eigen::VectorXd> eigen_W(W.vector, W.vlen);
// create shogun and eigen representation of sW
sW = SGVector<float64_t>(W.vlen);
Eigen::Map<Eigen::VectorXd> eigen_sW(sW.vector, sW.vlen);

if (eigen_W.minCoeff() > 0)
eigen_sW = eigen_W.cwiseSqrt();
else
eigen_sW.setZero(); // W has entries <= 0 (likelihood not log-concave)
}

void CLaplacianInferenceMethodWithLBFGS::get_psi_wrt_alpha(
Eigen::Map<Eigen::VectorXd>* alpha,
...
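
The bodies of get_psi_wrt_alpha and get_gradient_wrt_alpha are truncated above. For reference, the quantity psi that the L-BFGS iteration minimizes over alpha is the standard negative unnormalized log posterior of the Laplace approximation (cf. the psi_new expressions in update_alpha); a sketch in the usual notation, with K implicitly carrying the m_scale^2 factor, and with the gradient form taken from the standard derivation rather than read off this diff:

\psi(\alpha) = \tfrac{1}{2}\,\alpha^{\top}(f - m) - \sum_i \log p(y_i \mid f_i),
\qquad f = K\alpha + m,

\nabla_{\alpha}\,\psi = K\bigl(\alpha - \nabla_f \log p(y \mid f)\bigr).

For log-concave likelihoods, \psi is convex in alpha, so the L-BFGS solution and the Newton fallback agree at the posterior mode.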
7 changes: 5 additions & 2 deletions src/shogun/machine/gp/LaplacianInferenceMethodWithLBFGS.h
@@ -97,8 +97,11 @@ namespace shogun {
CSharedInfoForLBFGS m_shared;

private:
/** used only for dimension checking */
void check(int left, int right, int line);
static float64_t evaluate(void *obj,
const float64_t *alpha,
float64_t *gradient,
const int dim,
const float64_t step);
};

} /* namespace shogun */
...
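
For completeness, a hypothetical usage sketch; the constructor signature is assumed to be the one inherited from CLaplacianInferenceMethod, and train_feats / train_labels are placeholders created elsewhere, none of which is part of this commit:

// Assumed: train_feats is a CDenseFeatures<float64_t>* and train_labels
// a CBinaryLabels*, both created elsewhere.
CGaussianKernel* kernel = new CGaussianKernel(10, 2.0);
CZeroMean* mean = new CZeroMean();
CLogitLikelihood* lik = new CLogitLikelihood();

CLaplacianInferenceMethodWithLBFGS* inf =
    new CLaplacianInferenceMethodWithLBFGS(kernel, train_feats, mean,
                                           train_labels, lik);

// Fetching alpha triggers update_alpha(), i.e. the L-BFGS minimization
// (with the Newton fallback) shown in the .cpp diff above.
SGVector<float64_t> alpha = inf->get_alpha();
SG_UNREF(inf);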
