Merge 37fdc56 into dc8d5b0

QuantEcon · Oct 6, 2014 · a4c1e5d · a4c1e5d
2 parents dc8d5b0 + 37fdc56
commit a4c1e5d
Show file tree

Hide file tree

Showing 7 changed files with 1,076 additions and 181 deletions.
diff --git a/quantecon/__init__.py b/quantecon/__init__.py
@@ -7,18 +7,20 @@
 from .discrete_rv import DiscreteRV
 from .ecdf import ECDF
 from .estspec import smooth, periodogram, ar_periodogram
+from .graph_tools import DiGraph
+from .gth_solve import gth_solve
 from .kalman import Kalman
 from .lae import LAE
 from .arma import ARMA
 from .lqcontrol import LQ
 from .lss import LSS
 from .matrix_eqn import solve_discrete_lyapunov, solve_discrete_riccati
-from .mc_tools import DMarkov, mc_sample_path, mc_compute_stationary
+from .mc_tools import MarkovChain, mc_compute_stationary, mc_sample_path
 from .quadsums import var_quadratic_sum, m_quadratic_sum
 from .rank_nullspace import rank_est, nullspace
 from .robustlq import RBLQ
 from .tauchen import approx_markov
 from . import quad as quad
 
 #Add Version Attribute
-from .version import version as __version__
+from .version import version as __version__
diff --git a/quantecon/graph_tools.py b/quantecon/graph_tools.py
@@ -0,0 +1,275 @@
+"""
+Filename: graph_tools.py
+
+Author: Daisuke Oyama
+
+Tools for dealing with a directed graph.
+
+"""
+import numpy as np
+from scipy import sparse
+from scipy.sparse import csgraph
+from fractions import gcd
+
+
+class DiGraph:
+    r"""
+    Class for a directed graph. It stores useful information about the
+    graph structure such as strong connectivity [1]_ and periodicity
+    [2]_.
+
+    Parameters
+    ----------
+    adj_matrix : array_like(ndim=2)
+        Adjacency matrix representing a directed graph. Must be of shape
+        n x n.
+
+    weighted : bool, optional(default=False)
+        Whether to treat `adj_matrix` as a weighted adjacency matrix.
+
+    Attributes
+    ----------
+    csgraph : scipy.sparse.csr_matrix
+        Compressed sparse representation of the digraph.
+
+    is_strongly_connected : bool
+        Indicate whether the digraph is strongly connected.
+
+    num_strongly_connected_components : int
+        The number of the strongly connected components.
+
+    strongly_connected_components : list(ndarray(int))
+        List of numpy arrays containing the strongly connected
+        components.
+
+    num_sink_strongly_connected_components : int
+        The number of the sink strongly connected components.
+
+    sink_strongly_connected_components : list(ndarray(int))
+        List of numpy arrays containing the sink strongly connected
+        components.
+
+    is_aperiodic : bool
+        Indicate whether the digraph is aperiodic.
+
+    period : int
+        The period of the digraph. Defined only for a strongly connected
+        digraph.
+
+    cyclic_components : list(ndarray(int))
+        List of numpy arrays containing the cyclic components.
+
+    Notes
+    -----
+    For the definitions, see the Wikipedia entries [1]_, [2]_.
+
+    References
+    ----------
+    .. [1] `Strongly connected component
+       <http://en.wikipedia.org/wiki/Strongly_connected_component>`_,
+       Wikipedia.
+
+    .. [2] `Aperiodic graph
+       <http://en.wikipedia.org/wiki/Aperiodic_graph>`_, Wikipedia.
+
+    """
+
+    def __init__(self, adj_matrix, weighted=False):
+        if weighted:
+            dtype = None
+        else:
+            dtype = bool
+        self.csgraph = sparse.csr_matrix(adj_matrix, dtype=dtype)
+
+        m, n = self.csgraph.shape
+        if n != m:
+            raise ValueError('input matrix must be square')
+
+        self.n = n  # Number of nodes
+
+        self._num_scc = None
+        self._scc_proj = None
+        self._sink_scc_labels = None
+
+        self._period = None
+
+    def _find_scc(self):
+        """
+        Set ``self._num_scc`` and ``self._scc_proj``
+        by calling ``scipy.sparse.csgraph.connected_components``:
+        * docs.scipy.org/doc/scipy/reference/sparse.csgraph.html
+        * github.com/scipy/scipy/blob/master/scipy/sparse/csgraph/_traversal.pyx
+
+        ``self._scc_proj`` is a list of length `n` that assigns to each node
+        the label of the strongly connected component to which it belongs.
+
+        """
+        # Find the strongly connected components
+        self._num_scc, self._scc_proj = \
+            csgraph.connected_components(self.csgraph, connection='strong')
+
+    @property
+    def num_strongly_connected_components(self):
+        if self._num_scc is None:
+            self._find_scc()
+        return self._num_scc
+
+    @property
+    def scc_proj(self):
+        if self._scc_proj is None:
+            self._find_scc()
+        return self._scc_proj
+
+    @property
+    def is_strongly_connected(self):
+        return (self.num_strongly_connected_components == 1)
+
+    def _condensation_lil(self):
+        """
+        Return the sparse matrix representation of the condensation digraph
+        in lil format.
+
+        """
+        condensation_lil = sparse.lil_matrix(
+            (self.num_strongly_connected_components,
+             self.num_strongly_connected_components), dtype=bool
+        )
+
+        scc_proj = self.scc_proj
+        for node_from, node_to in _csr_matrix_indices(self.csgraph):
+            scc_from, scc_to = scc_proj[node_from], scc_proj[node_to]
+            if scc_from != scc_to:
+                condensation_lil[scc_from, scc_to] = True
+
+        return condensation_lil
+
+    def _find_sink_scc(self):
+        """
+        Set self._sink_scc_labels, which is a list containing the labels of
+        the strongly connected components.
+
+        """
+        condensation_lil = self._condensation_lil()
+
+        # A sink SCC is a SCC such that none of its members is strongly
+        # connected to nodes in other SCCs
+        # Those k's such that graph_condensed_lil.rows[k] == []
+        self._sink_scc_labels = \
+            np.where(np.logical_not(condensation_lil.rows))[0]
+
+    @property
+    def sink_scc_labels(self):
+        if self._sink_scc_labels is None:
+            self._find_sink_scc()
+        return self._sink_scc_labels
+
+    @property
+    def num_sink_strongly_connected_components(self):
+        return len(self.sink_scc_labels)
+
+    @property
+    def strongly_connected_components(self):
+        if self.is_strongly_connected:
+            return [np.arange(self.n)]
+        else:
+            return [np.where(self.scc_proj == k)[0]
+                    for k in range(self.num_strongly_connected_components)]
+
+    @property
+    def sink_strongly_connected_components(self):
+        if self.is_strongly_connected:
+            return [np.arange(self.n)]
+        else:
+            return [np.where(self.scc_proj == k)[0]
+                    for k in self.sink_scc_labels.tolist()]
+
+    def _compute_period(self):
+        """
+        Set ``self._period`` and ``self._cyclic_components_proj``.
+
+        Use the algorithm described in:
+        J. P. Jarvis and D. R. Shier,
+        "Graph-Theoretic Analysis of Finite Markov Chains," 1996.
+
+        """
+        # Degenerate graph with a single node (which is strongly connected)
+        # csgraph.reconstruct_path would raise an exception
+        # github.com/scipy/scipy/issues/4018
+        if self.n == 1:
+            if self.csgraph[0, 0] == 0:  # No edge: "trivial graph"
+                self._period = 1  # Any universally accepted definition?
+                self._cyclic_components_proj = np.zeros(self.n, dtype=int)
+                return None
+            else:  # Self loop
+                self._period = 1
+                self._cyclic_components_proj = np.zeros(self.n, dtype=int)
+                return None
+
+        if not self.is_strongly_connected:
+            raise NotImplementedError(
+                'Not defined for a non strongly-connected digraph'
+            )
+
+        if np.any(self.csgraph.diagonal() > 0):
+            self._period = 1
+            self._cyclic_components_proj = np.zeros(self.n, dtype=int)
+            return None
+
+        # Construct a breadth-first search tree rooted at 0
+        node_order, predecessors = \
+            csgraph.breadth_first_order(self.csgraph, i_start=0)
+        bfs_tree_csr = \
+            csgraph.reconstruct_path(self.csgraph, predecessors)
+
+        # Edges not belonging to tree_csr
+        non_bfs_tree_csr = self.csgraph - bfs_tree_csr
+        non_bfs_tree_csr.eliminate_zeros()
+
+        # Distance to 0
+        level = np.zeros(self.n, dtype=int)
+        for i in range(1, self.n):
+            level[node_order[i]] = level[predecessors[node_order[i]]] + 1
+
+        # Determine the period
+        d = 0
+        for node_from, node_to in _csr_matrix_indices(non_bfs_tree_csr):
+            value = level[node_from] - level[node_to] + 1
+            d = gcd(d, value)
+            if d == 1:
+                self._period = 1
+                self._cyclic_components_proj = np.zeros(self.n, dtype=int)
+                return None
+
+        self._period = d
+        self._cyclic_components_proj = level % d
+
+    @property
+    def period(self):
+        if self._period is None:
+            self._compute_period()
+        return self._period
+
+    @property
+    def is_aperiodic(self):
+        return (self.period == 1)
+
+    @property
+    def cyclic_components(self):
+        if self.is_aperiodic:
+            return [np.arange(self.n)]
+        else:
+            return [np.where(self._cyclic_components_proj == k)[0]
+                    for k in range(self.period)]
+
+
+def _csr_matrix_indices(S):
+    """
+    Generate the indices of nonzero entries of a csr_matrix S
+
+    """
+    m, n = S.shape
+
+    for i in range(m):
+        for j in range(S.indptr[i], S.indptr[i+1]):
+            row_index, col_index = i, S.indices[j]
+            yield row_index, col_index
diff --git a/quantecon/gth_solve.py b/quantecon/gth_solve.py
@@ -0,0 +1,93 @@
+"""
+Filename: gth_solve.py
+
+Author: Daisuke Oyama
+
+Routine to compute the stationary distribution of an irreducible Markov
+chain by the Grassmann-Taksar-Heyman (GTH) algorithm.
+
+"""
+import numpy as np
+
+try:
+    xrange
+except:  # python3
+    xrange = range
+
+
+def gth_solve(A, overwrite=False):
+    r"""
+    This routine computes the stationary distribution of an irreducible
+    Markov transition matrix (stochastic matrix) or transition rate
+    matrix (generator matrix) `A`.
+
+    More generally, given a Metzler matrix (square matrix whose
+    off-diagonal entries are all nonnegative) `A`, this routine solves
+    for a nonzero solution `x` to `x (A - D) = 0`, where `D` is the
+    diagonal matrix for which the rows of `A - D` sum to zero (i.e.,
+    :math:`D_{ii} = \sum_j A_{ij}` for all :math:`i`). One (and only
+    one, up to normalization) nonzero solution exists corresponding to
+    each reccurent class of `A`, and in particular, if `A` is
+    irreducible, there is a unique solution; when there are more than
+    one solution, the routine returns the solution that contains in its
+    support the first index `i` such that no path connects `i` to any
+    index larger than `i`. The solution is normalized so that its 1-norm
+    equals one. This routine implements the Grassmann-Taksar-Heyman
+    (GTH) algorithm [1]_, a numerically stable variant of Gaussian
+    elimination, where only the off-diagonal entries of `A` are used as
+    the input data. For a nice exposition of the algorithm, see Stewart
+    [2]_, Chapter 10.
+
+    Parameters
+    ----------
+    A : array_like(float, ndim=2)
+        Stochastic matrix or generator matrix. Must be of shape n x n.
+    overwrite : bool, optional(default=False)
+        Whether to overwrite `A`; may improve performance.
+
+    Returns
+    -------
+    x : numpy.ndarray(float, ndim=1)
+        Stationary distribution of `A`.
+
+    References
+    ----------
+    .. [1] W. K. Grassmann, M. I. Taksar and D. P. Heyman, "Regenerative
+       Analysis and Steady State Distributions for Markov Chains,"
+       Operations Research (1985), 1107-1116.
+
+    .. [2] W. J. Stewart, Probability, Markov Chains, Queues, and
+       Simulation, Princeton University Press, 2009.
+
+    """
+    A1 = np.array(A, copy=not overwrite)
+
+    if len(A1.shape) != 2 or A1.shape[0] != A1.shape[1]:
+        raise ValueError('matrix must be square')
+
+    n = A1.shape[0]
+
+    x = np.zeros(n)
+
+    # === Reduction === #
+    for i in xrange(n-1):
+        scale = np.sum(A1[i, i+1:n])
+        if scale <= 0:
+            # There is one (and only one) recurrent class contained in
+            # {0, ..., i};
+            # compute the solution associated with that recurrent class.
+            n = i+1
+            break
+        A1[i+1:n, i] /= scale
+
+        A1[i+1:n, i+1:n] += np.dot(A1[i+1:n, i:i+1], A1[i:i+1, i+1:n])
+
+    # === Backward substitution === #
+    x[n-1] = 1
+    for i in xrange(n-2, -1, -1):
+        x[i] = np.sum((x[j] * A1[j, i] for j in xrange(i+1, n)))
+
+    # === Normalization === #
+    x /= np.sum(x)
+
+    return x