Sort singular values #46
Changes from 12 commits
@@ -2,7 +2,9 @@

extern crate rulinalg;
extern crate test;
extern crate rand;

mod linalg {
    mod matrix;
    mod svd;
}
@@ -0,0 +1,29 @@
use test::Bencher;
use rand;
use rand::{Rng, SeedableRng};
use rulinalg::matrix::Matrix;

fn reproducible_random_matrix(rows: usize, cols: usize) -> Matrix<f64> {
    const STANDARD_SEED: [usize; 4] = [12, 2049, 4000, 33];
    let mut rng = rand::StdRng::from_seed(&STANDARD_SEED);
    let elements: Vec<_> = rng.gen_iter::<f64>().take(rows * cols).collect();
    Matrix::new(rows, cols, elements)
}

#[bench]
fn svd_10_10(b: &mut Bencher) {
    let mat = reproducible_random_matrix(10, 10);

    b.iter(|| mat.clone().svd())
}

#[bench]
fn svd_100_100(b: &mut Bencher) {
    let mat = reproducible_random_matrix(100, 100);

    b.iter(|| mat.clone().svd())
}
@@ -0,0 +1,24 @@
use libnum::Float;
use std::f32;
use std::f64;

/// Expose the machine epsilon of floating point numbers.
/// This trait should only need to exist for a short time,
/// until the Float trait from the Num crate has the same
/// capabilities.
pub trait MachineEpsilon: Float {
    /// Returns the machine epsilon for the given Float type.
    fn epsilon() -> Self;
}

impl MachineEpsilon for f32 {
    fn epsilon() -> f32 {
        f32::EPSILON
    }
}

impl MachineEpsilon for f64 {
    fn epsilon() -> f64 {
        f64::EPSILON
    }
}
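Later in this PR, the convergence test in the SVD loop is changed from a `T::min_positive_value()` threshold to `eps * scale`, with `eps = 3 * T::epsilon()`. A standalone sketch (plain `std` Rust, not rulinalg code; the variable names are illustrative) of why the scaled-epsilon threshold is the right one:

```rust
fn main() {
    // A super-diagonal entry that is "numerically zero" relative to its
    // neighbouring diagonal entries.
    let b_sup_diag = 1e-20_f64;
    let diag_scale = 1.0_f64; // stands in for |b[i,i]| + |b[i+1,i+1]|

    // f64::MIN_POSITIVE (~2.2e-308) is only undercut by exact zeros and
    // subnormals, so the old threshold essentially never triggers.
    assert!(!(b_sup_diag <= f64::MIN_POSITIVE * diag_scale));

    // The PR's threshold scales machine epsilon (~2.2e-16) instead,
    // so the entry is correctly treated as converged.
    let eps = 3.0 * f64::EPSILON;
    assert!(b_sup_diag <= eps * diag_scale);
}
```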
@@ -23,6 +23,7 @@ use error::{Error, ErrorKind};

use libnum::{One, Zero, Float, Signed};
use libnum::{cast, abs};
use epsilon::MachineEpsilon;

impl<T: Any + Float> Matrix<T> {
    /// Cholesky decomposition

@@ -305,18 +306,119 @@ impl<T: Any + Float> Matrix<T> {
    }
}
impl<T: Any + Float + Signed> Matrix<T> {

/// Ensures that all singular values in the given singular value decomposition
/// are non-negative, making the necessary corrections to the singular vectors.
///
/// The SVD is represented by matrices `(b, u, v)`, where `b` is the diagonal matrix
/// containing the singular values, `u` is the matrix of left singular vectors
/// and `v` is the matrix of right singular vectors.
fn correct_svd_signs<T>(mut b: Matrix<T>, mut u: Matrix<T>, mut v: Matrix<T>)
    -> (Matrix<T>, Matrix<T>, Matrix<T>) where T: Any + Float + Signed {

    // When correcting the signs of the singular vectors, we can choose
    // to correct EITHER u or v. We make the choice depending on which matrix
    // has the fewest rows. Later we will need to multiply all elements in
    // columns by -1, which might be significantly faster in corner cases
    // if we pick the matrix with the fewest rows.
    {
        let shortest_matrix = if u.rows() <= v.rows() { &mut u } else { &mut v };
        let column_length = shortest_matrix.rows();
        let num_singular_values = cmp::min(b.rows(), b.cols());

        for i in 0 .. num_singular_values {
            if b[[i, i]] < T::zero() {
                // Swap sign of singular value and corresponding column
                b[[i, i]] = b[[i, i]].abs();

                // Access the column as a slice and flip its sign
                let mut column = shortest_matrix.sub_slice_mut([0, i], column_length, 1);
                column *= -T::one();
            }
        }
    }
    (b, u, v)
}

[Review thread]
- I believe […]
- You are right. I wrote this function when I thought […]
- I agree, it makes sense to keep it in whether we need it or not.

[Review thread]
- It's very minor but we can remove some bound checks here by using the […]
- I considered this, but I came to the conclusion that the effect here would presumably be completely negligible, in which case I think going […]
- That sounds sensible - let's keep it as the safe bound-checked version.
fn sort_svd<T>(mut b: Matrix<T>, mut u: Matrix<T>, mut v: Matrix<T>)
    -> (Matrix<T>, Matrix<T>, Matrix<T>) where T: Any + Float + Signed {

    assert!(u.cols() == b.cols() && b.cols() == v.cols());

    // This unfortunately incurs two allocations, since we have no (simple)
    // way to iterate over a matrix diagonal, only to copy it into a new Vector.
    let mut indexed_sorted_values: Vec<_> = b.diag().into_vec()
                                             .into_iter()
                                             .enumerate()
                                             .collect();

    // Sorting a vector of indices simultaneously with the singular values
    // gives us a mapping between old and new (final) column indices.
    indexed_sorted_values.sort_by(|&(_, ref x), &(_, ref y)|
        x.partial_cmp(y)
         .expect("All singular values should be finite, and thus sortable.")
         .reverse()
    );

    // Set the diagonal elements of the singular value matrix
    for (i, &(_, value)) in indexed_sorted_values.iter().enumerate() {
        b[[i, i]] = value;
    }

    // Assuming N columns, the simultaneous sorting of indices and singular values yields
    // a set of N (i, j) pairs which correspond to columns that must be swapped. However,
    // for any (i, j) in this set, there is also (j, i). Keeping both of these would make us
    // swap the columns back and forth, so we must remove the duplicates. We can avoid
    // any further sorting, hash sets or similar by noting that we can simply
    // remove any (i, j) for which j >= i. This also removes (i, i) pairs,
    // i.e. columns that don't need to be swapped.
    let swappable_pairs = indexed_sorted_values.into_iter()
        .enumerate()
        .map(|(new_index, (old_index, _))| (old_index, new_index))
        .filter(|&(old_index, new_index)| old_index < new_index);

    for (old_index, new_index) in swappable_pairs {
        u.swap_cols(old_index, new_index);
        v.swap_cols(old_index, new_index);
    }

    (b, u, v)
}

[Review thread]
- Would this panic be user error or an algorithmic failure? (Or both I guess...) I'm wondering whether it is better to propagate this by returning a […]
- My reasoning for a panic was this: We are using the successful result of […]
- Yes that does make sense, just wanted to check!
impl<T: Any + Float + Signed + MachineEpsilon> Matrix<T> {
    /// Singular Value Decomposition
    ///
    /// Computes the SVD using the Golub-Reinsch algorithm.
    ///
    /// Returns Σ, U, V, such that `self` = U Σ V<sup>T</sup>. Σ is a diagonal matrix whose elements
    /// correspond to the non-negative singular values of the matrix. The singular values are ordered in
    /// non-increasing order. U and V have orthonormal columns, and each column represents the
    /// left and right singular vectors for the corresponding singular value in Σ, respectively.
    ///
    /// Denoting the dimensions of `self` as M x N (rows x cols), the dimensions of the returned
    /// matrices are as follows:
    ///
    /// - `Σ`: N x N
    /// - `U`: M x N
    /// - `V`: N x N
    ///
    /// # Failures
    ///
    /// This function may fail in some cases. The current decomposition, whilst being
    /// efficient, is fairly basic. Hopefully the algorithm can be made not to fail in the near future.
    pub fn svd(self) -> Result<(Matrix<T>, Matrix<T>, Matrix<T>), Error> {
        let (b, u, v) = try!(self.svd_unordered());
        Ok(sort_svd(b, u, v))
    }

[Review thread]
- I think that there is a minor mistake here in the dimensions listed below. I think that […]
- Oh! Yeah, you're completely right. We transpose the matrix before applying […]
- Great, thanks! You may want to verify that I haven't got the dimensions I gave wrong. I only skimmed the source without checking the output (I'll have some time to check them properly later today if you can't).
- Yeah, I checked it by hand, as well as in the code. I think you are correct (easy to confuse). In the end I chose the verbose way of documenting it, as I found that to be clearer. Let me know if you want it differently phrased or so.
- I think the verbose way is much better - it is pretty complex so taking more space to explain is sensible. All looks good now so I'll merge. Thanks again for your work on this!
    fn svd_unordered(self) -> Result<(Matrix<T>, Matrix<T>, Matrix<T>), Error> {
        let (b, u, v) = try!(self.svd_golub_reinsch());

        // The Golub-Reinsch implementation sometimes spits out negative singular values,
        // so we need to correct these.
        Ok(correct_svd_signs(b, u, v))
    }

    fn svd_golub_reinsch(mut self) -> Result<(Matrix<T>, Matrix<T>, Matrix<T>), Error> {
        let mut flipped = false;

        // The algorithm assumes rows > cols. If this is not the case we transpose and fix later.

@@ -325,6 +427,7 @@ impl<T: Any + Float + Signed> Matrix<T> {
            flipped = true;
        }

        let eps = T::from(3.0).unwrap() * T::epsilon();
        let n = self.cols;

        // Get the bidiagonal decomposition

@@ -346,8 +449,7 @@ impl<T: Any + Float + Signed> Matrix<T> {
        unsafe {
            b_ii = *b.get_unchecked([i, i]);
            b_sup_diag = b.get_unchecked([i, i + 1]).abs();
            diag_abs_sum = eps * (b_ii.abs() + b.get_unchecked([i + 1, i + 1]).abs());
        }
        if b_sup_diag <= diag_abs_sum {
            // Adjust q or p to define boundaries of sup-diagonal box

@@ -382,7 +484,7 @@ impl<T: Any + Float + Signed> Matrix<T> {
            b_sup_diag = *b.get_unchecked([i, i + 1]);
        }

        if b_ii.abs() < eps {
            let (c, s) = Matrix::<T>::givens_rot(b_ii, b_sup_diag);
            let givens = Matrix::new(2, 2, vec![c, s, -s, c]);
            let b_i = MatrixSliceMut::from_matrix(&mut b, [i, i], 1, 2);
@@ -1063,6 +1165,7 @@ impl<T> Matrix<T> where T: Any + Copy + One + Zero + Neg<Output=T> +
mod tests {
    use matrix::{Matrix, BaseMatrix};
    use vector::Vector;
    use super::sort_svd;

    fn validate_bidiag(mat: &Matrix<f64>,
                       b: &Matrix<f64>,

@@ -1123,6 +1226,8 @@ mod tests {
        for (idx, row) in b.iter_rows().enumerate() {
            assert!(!row.iter().take(idx).any(|&x| x > 1e-10));
            assert!(!row.iter().skip(idx + 1).any(|&x| x > 1e-10));
            // Assert non-negativity of diagonal elements
            assert!(row[idx] >= 0.0);
        }

        let recovered = u * b * v.transpose();

@@ -1134,36 +1239,119 @@ mod tests {
            .iter()
            .zip(recovered.data().iter())
            .any(|(&x, &y)| (x - y).abs() > 1e-10));
        // The transposition is due to the fact that there do not exist
        // any column iterators at the moment, and we need to simultaneously iterate
        // over the columns. Once they exist, we should rewrite
        // the iterators below to use iter_cols() or similar instead.
        let ref u_transposed = u.transpose();
        let ref v_transposed = v.transpose();
        let ref mat_transposed = mat.transpose();

        let mut singular_triplets = u_transposed.iter_rows()
            .zip(b.diag().into_iter())
            .zip(v_transposed.iter_rows())
            // Chained zipping results in a nested tuple. Flatten it.
            .map(|((u_col, singular_value), v_col)|
                (Vector::new(u_col), singular_value, Vector::new(v_col)));

        assert!(singular_triplets.by_ref()
            // For a matrix M, each singular value σ and its left and right singular
            // vectors u and v satisfy M v = σ u, so we take the difference
            .map(|(ref u, sigma, ref v)| mat * v - u * sigma)
            .flat_map(|v| v.into_vec().into_iter())
            .all(|x| x.abs() < 1e-10));

        assert!(singular_triplets.by_ref()
            // For a matrix M, each singular value σ and its left and right singular
            // vectors u and v satisfy M^T u = σ v, so we take the difference
            .map(|(ref u, sigma, ref v)| mat_transposed * u - v * sigma)
            .flat_map(|v| v.into_vec().into_iter())
            .all(|x| x.abs() < 1e-10));
    }
    #[test]
    fn test_sort_svd() {
        let u = Matrix::new(2, 3, vec![1.0, 2.0, 3.0,
                                       4.0, 5.0, 6.0]);
        let b = Matrix::new(3, 3, vec![4.0, 0.0, 0.0,
                                       0.0, 8.0, 0.0,
                                       0.0, 0.0, 2.0]);
        let v = Matrix::new(3, 3, vec![21.0, 22.0, 23.0,
                                       24.0, 25.0, 26.0,
                                       27.0, 28.0, 29.0]);
        let (b, u, v) = sort_svd(b, u, v);

        assert_eq!(b.data(), &vec![8.0, 0.0, 0.0,
                                   0.0, 4.0, 0.0,
                                   0.0, 0.0, 2.0]);
        assert_eq!(u.data(), &vec![2.0, 1.0, 3.0,
                                   5.0, 4.0, 6.0]);
        assert_eq!(v.data(), &vec![22.0, 21.0, 23.0,
                                   25.0, 24.0, 26.0,
                                   28.0, 27.0, 29.0]);
    }
    #[test]
    fn test_svd_tall_matrix() {
        // Note: This matrix is not arbitrary. It has been constructed specifically so that
        // the "natural" order of the singular values is not sorted by default.
        let mat = Matrix::new(5, 4,
            vec![ 3.61833700244349288, -3.28382346228211697,  1.97968027781346501, -0.41869628192662156,
                  3.96046289599926427,  0.70730060716580723, -2.80552479438772817, -1.45283286109873933,
                  1.44435028724617442,  1.27749196276785826, -1.09858397535426366, -0.03159619816434689,
                  1.13455445826500667,  0.81521390274755756,  3.99123446373437263, -2.83025703359666192,
                 -3.30895752093770579, -0.04979044289857298,  3.03248594516832792,  3.85962479743330977]);
        let (b, u, v) = mat.clone().svd().unwrap();

        let expected_values = vec![8.0, 6.0, 4.0, 2.0];

        validate_svd(&mat, &b, &u, &v);

        // Assert the singular values are what we expect
        assert!(expected_values.iter()
            .zip(b.diag().data().iter())
            .all(|(expected, actual)| (expected - actual).abs() < 1e-14));
    }
    #[test]
    fn test_svd_short_matrix() {
        // Note: This matrix is not arbitrary. It has been constructed specifically so that
        // the "natural" order of the singular values is not sorted by default.
        let mat = Matrix::new(4, 5,
            vec![ 3.61833700244349288,  3.96046289599926427,  1.44435028724617442,  1.13455445826500645, -3.30895752093770579,
                 -3.28382346228211697,  0.70730060716580723,  1.27749196276785826,  0.81521390274755756, -0.04979044289857298,
                  1.97968027781346545, -2.80552479438772817, -1.09858397535426366,  3.99123446373437263,  3.03248594516832792,
                 -0.41869628192662156, -1.45283286109873933, -0.03159619816434689, -2.83025703359666192,  3.85962479743330977]);
        let (b, u, v) = mat.clone().svd().unwrap();

        let expected_values = vec![8.0, 6.0, 4.0, 2.0];

        validate_svd(&mat, &b, &u, &v);

        // Assert the singular values are what we expect
        assert!(expected_values.iter()
            .zip(b.diag().data().iter())
            .all(|(expected, actual)| (expected - actual).abs() < 1e-14));
    }
    #[test]
    fn test_svd_square_matrix() {
        let mat = Matrix::new(5, 5,
            vec![1.0, 2.0, 3.0,  4.0, 5.0,
                 2.0, 4.0, 1.0,  2.0, 1.0,
                 3.0, 1.0, 7.0,  1.0, 1.0,
                 4.0, 2.0, 1.0, -1.0, 3.0,
                 5.0, 1.0, 1.0,  3.0, 2.0]);

        let expected_values = vec![12.1739747429271112, 5.2681047320525831, 4.4942269799769843,
                                    2.9279675877385123, 2.8758200827412224];

        let (b, u, v) = mat.clone().svd().unwrap();
        validate_svd(&mat, &b, &u, &v);

        // Assert the singular values are what we expect
        assert!(expected_values.iter()
            .zip(b.diag().data().iter())
            .all(|(expected, actual)| (expected - actual).abs() < 1e-12));
    }

    #[test]
[Review thread]
- Maybe I'm just tired - but don't we want to multiply the rows of `v` by `-1` instead of the columns? `b * v` is basically scaling the rows of `v` by the respective singular values? If this is true then it becomes a little trickier to determine the faster approach. It will probably almost always be faster to flip the sign on the row due to cache access and vectorization.

  Actually I just realised that we transpose `v` at the end, so this is correct. I'm leaving this comment to highlight the fact that we may want to modify the algorithm so that we are operating on rows (not in this PR of course).
- It's also possible to collect the indices of all columns that need to be flipped, and then iterate over each row, flipping the sign of each element as we go. It's also possible to do the same for the sorting, which would likely be faster. However, the implementation would be slightly more complex, and since the overhead seems to be more or less negligible at this point, I opted for the simpler approach of just dealing with columns directly. As you say, we may want to revisit this in the future!
- Sounds good to me!
[Review thread]
- Although I just realized that a `100 x 100` matrix (which I used in my benchmarks) would still fit in L2 cache. Guess we should do some tests for matrices so big that they also don't fit in L3? Perhaps the results would be significantly different then...
- Let's try that too. In particular the case n x m where n >> m, e.g. 10000 x 10. This is a bit more representative of cases we may see in rusty-machine.
- Will do that next chance I get. Thinking a little about it though, I suspect that we have the following performance characteristics. First, consider that if `m >= n`, SVD is usually something like `O(m n^2)` flops or so, and I'm not sure about the memory accesses of Golub-Reinsch. The ordering of the singular vectors is roughly `O(n^2)` memory accesses in the worst case. Based on this and our current benchmarks, I would expect the following: […] Looking forward to trying the benchmarks out!

  By the way, you may find the following interesting. I spent Fall 2014 and Spring 2015 at UC Berkeley. Among other things, I took some courses under Prof. James Demmel. Prof. Demmel is a leading figure in the research of what they call "communication-avoiding algorithms". In essence, the goal of these algorithms is to minimize not just the number of flops required for an algorithm: they also use a simple mathematical model of cache behavior, so that you can develop algorithms that provably minimize (again in a big-O sense) the amount of communication, i.e. the number of expensive memory accesses. I mention this because I remember that at some point Prof. Demmel referred me to certain papers on these algorithms. Their publications can be found here. I think in particular this survey paper may be of interest. It's fairly up to date (published in 2014) and discusses the communication optimality of various algorithms in linear algebra.

  However, I want again to stress that we should ensure correctness of the algorithms in `rulinalg` (by extensive testing against expected error bounds etc.) before this should become a topic. Still, thought I'd mention it, because I think there's a lot of interesting stuff in there :)
- I must have missed this comment before. Thank you for pointing out those papers! They look like really interesting reads - though at a first glance pretty challenging. The survey paper looks like a really good start; it looks like I could learn a lot from it.