WIP: first cut at sparse LR-SDP solver

stephentu · Dec 22, 2014 · 186ffaa · rcurtin · Dec 22, 2014 · stephentu
1 parent d95a736
commit 186ffaa
Show file tree

Hide file tree

Showing 6 changed files with 234 additions and 175 deletions.
diff --git a/src/mlpack/core/optimizers/lrsdp/lrsdp.cpp b/src/mlpack/core/optimizers/lrsdp/lrsdp.cpp
@@ -11,9 +11,10 @@ using namespace mlpack;
 using namespace mlpack::optimization;
 using namespace std;
 
-LRSDP::LRSDP(const size_t numConstraints,
+LRSDP::LRSDP(const size_t numSparseConstraints,
+             const size_t numDenseConstraints,
              const arma::mat& initialPoint) :
-    function(numConstraints, initialPoint),
+    function(numSparseConstraints, numDenseConstraints, initialPoint),
     augLag(function)
 { }
 

diff --git a/src/mlpack/core/optimizers/lrsdp/lrsdp.hpp b/src/mlpack/core/optimizers/lrsdp/lrsdp.hpp
@@ -26,28 +26,15 @@ class LRSDP
  public:
   /**
    * Create an LRSDP to be optimized.  The solution will end up being a matrix
-   * of size (rank) x (rows).  To construct each constraint and the objective
+   * of size (rows) x (rank).  To construct each constraint and the objective
    * function, use the functions A(), B(), and C() to set them correctly.
    *
    * @param numConstraints Number of constraints in the problem.
-   * @param rank Rank of the solution (<= rows).
-   * @param rows Number of rows in the solution.
-   */
-  LRSDP(const size_t numConstraints,
-        const arma::mat& initialPoint);
-
-  /**
-   * Create an LRSDP to be optimized, passing in an already-created
-   * AugLagrangian object.  The given initial point should be set to the size
-   * (rows) x (rank), where (rank) is the reduced rank of the problem.
-   *
-   * @param numConstraints Number of constraints in the problem.
    * @param initialPoint Initial point of the optimization.
-   * @param auglag Pre-initialized AugLagrangian<LRSDP> object.
    */
-  LRSDP(const size_t numConstraints,
-        const arma::mat& initialPoint,
-        AugLagrangian<LRSDPFunction>& augLagrangian);
+  LRSDP(const size_t numSparseConstraints,
+        const size_t numDenseConstraints,
+        const arma::mat& initialPoint);
 
   /**
    * Optimize the LRSDP and return the final objective value.  The given
@@ -57,25 +44,43 @@ class LRSDP
    */
   double Optimize(arma::mat& coordinates);
 
-  //! Return the objective function matrix (C).
-  const arma::mat& C() const { return function.C(); }
-  //! Modify the objective function matrix (C).
-  arma::mat& C() { return function.C(); }
-
-  //! Return the vector of A matrices (which correspond to the constraints).
-  const std::vector<arma::mat>& A() const { return function.A(); }
-  //! Modify the veector of A matrices (which correspond to the constraints).
-  std::vector<arma::mat>& A() { return function.A(); }
-
-  //! Return the vector of modes for the A matrices.
-  const arma::uvec& AModes() const { return function.AModes(); }
-  //! Modify the vector of modes for the A matrices.
-  arma::uvec& AModes() { return function.AModes(); }
-
-  //! Return the vector of B values.
-  const arma::vec& B() const { return function.B(); }
-  //! Modify the vector of B values.
-  arma::vec& B() { return function.B(); }
+  //! Return the sparse objective function matrix (C_sparse).
+  inline const arma::sp_mat& C_sparse() const { return function.C_sparse(); }
+
+  //! Modify the sparse objective function matrix (C_sparse).
+  inline arma::sp_mat& C_sparse() { return function.C_sparse(); }
+
+  //! Return the dense objective function matrix (C_dense).
+  inline const arma::mat& C_dense() const { return function.C_dense(); }
+
+  //! Modify the dense objective function matrix (C_dense).
+  inline arma::mat& C_dense() { return function.C_dense(); }
+
+  //! Return the vector of sparse A matrices (which correspond to the sparse
+  // constraints).
+  inline const std::vector<arma::sp_mat>& A_sparse() const { return function.A_sparse(); }
+
+  //! Modify the veector of sparse A matrices (which correspond to the sparse
+  // constraints).
+  inline std::vector<arma::sp_mat>& A_sparse() { return function.A_sparse(); }
+
+  //! Return the vector of dense A matrices (which correspond to the dense
+  // constraints).
+  inline const std::vector<arma::mat>& A_dense() const { return function.A_dense(); }
+
+  //! Modify the veector of dense A matrices (which correspond to the dense
+  // constraints).
+  inline std::vector<arma::mat>& A_dense() { return function.A_dense(); }
+
+  //! Return the vector of sparse B values.
+  inline const arma::vec& B_sparse() const { return function.B_sparse(); }
+  //! Modify the vector of sparse B values.
+  inline arma::vec& B_sparse() { return function.B_sparse(); }
+
+  //! Return the vector of dense B values.
+  inline const arma::vec& B_dense() const { return function.B_dense(); }
+  //! Modify the vector of dense B values.
+  inline arma::vec& B_dense() { return function.B_dense(); }
 
   //! Return the function to be optimized.
   const LRSDPFunction& Function() const { return function; }

diff --git a/src/mlpack/core/optimizers/lrsdp/lrsdp_function.cpp b/src/mlpack/core/optimizers/lrsdp/lrsdp_function.cpp
@@ -10,14 +10,24 @@
 
 using namespace mlpack;
 using namespace mlpack::optimization;
+using namespace std;
 
-LRSDPFunction::LRSDPFunction(const size_t numConstraints,
+LRSDPFunction::LRSDPFunction(const size_t numSparseConstraints,
+                             const size_t numDenseConstraints,
                              const arma::mat& initialPoint):
-    a(numConstraints),
-    b(numConstraints),
-    initialPoint(initialPoint),
-    aModes(numConstraints)
-{ }
+    c_sparse(initialPoint.n_rows, initialPoint.n_rows),
+    c_dense(initialPoint.n_rows, initialPoint.n_rows, arma::fill::zeros),
+    hasModifiedSparseObjective(false),
+    hasModifiedDenseObjective(false),
+    a_sparse(numSparseConstraints),
+    b_sparse(numSparseConstraints),
+    a_dense(numDenseConstraints),
+    b_dense(numDenseConstraints),
+    initialPoint(initialPoint)
+{
+  if (initialPoint.n_rows < initialPoint.n_cols)
+    throw invalid_argument("initialPoint n_cols > n_rows");
+}
 
 double LRSDPFunction::Evaluate(const arma::mat& coordinates) const
 {
@@ -34,17 +44,11 @@ void LRSDPFunction::Gradient(const arma::mat& /* coordinates */,
 double LRSDPFunction::EvaluateConstraint(const size_t index,
                                  const arma::mat& coordinates) const
 {
-  arma::mat rrt = coordinates * trans(coordinates);
-  if (aModes[index] == 0)
-    return trace(a[index] * rrt) - b[index];
-  else
-  {
-    double value = -b[index];
-    for (size_t i = 0; i < a[index].n_cols; ++i)
-      value += a[index](2, i) * rrt(a[index](0, i), a[index](1, i));
-
-    return value;
-  }
+  const arma::mat rrt = coordinates * trans(coordinates);
+  if (index < NumSparseConstraints())
+    return trace(a_sparse[index] * rrt) - b_sparse[index];
+  const size_t index1 = index - NumSparseConstraints();
+  return trace(a_dense[index1] * rrt) - b_dense[index1];
 }
 
 void LRSDPFunction::GradientConstraint(const size_t /* index */,
@@ -58,18 +62,53 @@ void LRSDPFunction::GradientConstraint(const size_t /* index */,
 // Return a string representation of the object.
 std::string LRSDPFunction::ToString() const
 {
-  std::stringstream convert;
+  std::ostringstream convert;
   convert << "LRSDPFunction [" << this << "]" << std::endl;
-  convert << "  Number of constraints: " << a.size() << std::endl;
-  convert << "  Constraint matrix (A_i) size: " << initialPoint.n_rows << "x"
+  convert << "  Number of constraints: " << NumConstraints() << std::endl;
+  convert << "  Problem size: n=" << initialPoint.n_rows << ", r="
       << initialPoint.n_cols << std::endl;
-  convert << "  A_i modes: " << aModes.t();
-  convert << "  Constraint b_i values: " << b.t();
-  convert << "  Objective matrix (C) size: " << c.n_rows << "x" << c.n_cols
-      << std::endl;
+  convert << "  Sparse Constraint b_i values: " << b_sparse.t();
+  convert << "  Dense Constraint b_i values: " << b_dense.t();
   return convert.str();
 }
 
+template <typename MatrixType>
+static inline void
+updateObjective(double &objective,
+                const arma::mat &rrt,
+                const std::vector<MatrixType> &ais,
+                const arma::vec &bis,
+                const arma::vec &lambda,
+                size_t lambda_offset,
+                double sigma)
+{
+  for (size_t i = 0; i < ais.size(); ++i)
+  {
+    // Take the trace subtracted by the b_i.
+    double constraint = trace(ais[i] * rrt) - bis[i];
+    objective -= (lambda[lambda_offset + i] * constraint);
+    objective += (sigma / 2.) * constraint * constraint;
+  }
+}
+
+template <typename MatrixType>
+static inline void
+updateGradient(arma::mat &s,
+               const arma::mat &rrt,
+               const std::vector<MatrixType> &ais,
+               const arma::vec &bis,
+               const arma::vec &lambda,
+               size_t lambda_offset,
+               double sigma)
+{
+  for (size_t i = 0; i < ais.size(); ++i)
+  {
+    const double constraint = trace(ais[i] * rrt) - bis[i];
+    const double y = lambda[lambda_offset + i] - sigma * constraint;
+    s -= y * ais[i];
+  }
+}
+
 namespace mlpack {
 namespace optimization {
 
@@ -84,32 +123,27 @@ double AugLagrangianFunction<LRSDPFunction>::Evaluate(
   //     (sigma / 2) * sum_{i = 1}^{m} (Tr(A_i * (R R^T)) - b_i)^2
 
   // Let's start with the objective: Tr(C * (R R^T)).
-  // Simple, possibly slow solution.
-  arma::mat rrt = coordinates * trans(coordinates);
-  double objective = trace(function.C() * rrt);
+  // Simple, possibly slow solution-- see below for optimization opportunity
+  //
+  // TODO: Note that Tr(C^T * (R R^T)) = Tr( (CR)^T * R ), so
+  // multiplying C*R first, and then taking the trace dot should be more memory
+  // efficient
+  //
+  // Similarly for the constraints, taking A*R first should be more efficient
+  const arma::mat rrt = coordinates * trans(coordinates);
+  double objective = 0.;
+  if (function.hasSparseObjective())
+    objective += trace(function.C_sparse() * rrt);
+  if (function.hasDenseObjective())
+    objective += trace(function.C_dense() * rrt);
 
   // Now each constraint.
-  for (size_t i = 0; i < function.B().n_elem; ++i)
-  {
-    // Take the trace subtracted by the b_i.
-    double constraint = -function.B()[i];
-
-    if (function.AModes()[i] == 0)
-    {
-      constraint += trace(function.A()[i] * rrt);
-    }
-    else
-    {
-      for (size_t j = 0; j < function.A()[i].n_cols; ++j)
-      {
-        constraint += function.A()[i](2, j) *
-            rrt(function.A()[i](0, j), function.A()[i](1, j));
-      }
-    }
-
-    objective -= (lambda[i] * constraint);
-    objective += (sigma / 2) * std::pow(constraint, 2.0);
-  }
+  updateObjective(
+      objective, rrt, function.A_sparse(), function.B_sparse(),
+      lambda, 0, sigma);
+  updateObjective(
+      objective, rrt, function.A_dense(), function.B_dense(),
+      lambda, function.NumSparseConstraints(), sigma);
 
   return objective;
 }
@@ -125,45 +159,23 @@ void AugLagrangianFunction<LRSDPFunction>::Gradient(
   //   with
   // S' = C - sum_{i = 1}^{m} y'_i A_i
   // y'_i = y_i - sigma * (Trace(A_i * (R R^T)) - b_i)
-  arma::mat rrt = coordinates * trans(coordinates);
-  arma::mat s = function.C();
+  const arma::mat rrt = coordinates * trans(coordinates);
+  arma::mat s(function.n(), function.n(), arma::fill::zeros);
 
-  for (size_t i = 0; i < function.B().n_elem; ++i)
-  {
-    double constraint = -function.B()[i];
-
-    if (function.AModes()[i] == 0)
-    {
-      constraint += trace(function.A()[i] * rrt);
-    }
-    else
-    {
-      for (size_t j = 0; j < function.A()[i].n_cols; ++j)
-      {
-        constraint += function.A()[i](2, j) *
-            rrt(function.A()[i](0, j), function.A()[i](1, j));
-      }
-    }
-
-    double y = lambda[i] - sigma * constraint;
-
-    if (function.AModes()[i] == 0)
-    {
-      s -= (y * function.A()[i]);
-    }
-    else
-    {
-      // We only need to subtract the entries which could be modified.
-      for (size_t j = 0; j < function.A()[i].n_cols; ++j)
-      {
-        s(function.A()[i](0, j), function.A()[i](1, j)) -= y;
-      }
-    }
-  }
+  if (function.hasSparseObjective())
+    s += function.C_sparse();
+  if (function.hasDenseObjective())
+    s += function.C_dense();
+
+  updateGradient(
+      s, rrt, function.A_sparse(), function.B_sparse(),
+      lambda, 0, sigma);
+  updateGradient(
+      s, rrt, function.A_dense(), function.B_dense(),
+      lambda, function.NumSparseConstraints(), sigma);
 
   gradient = 2 * s * coordinates;
 }
 
 }; // namespace optimization
 }; // namespace mlpack
-