Source code for pykov

# -*- coding: utf-8 -*-

# Pykov is a Python package for the creation, manipulation and study of Markov
# chains.
# Copyright (C) 2014  Riccardo Scalco
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program.  If not, see <http://www.gnu.org/licenses/>.

# Email: riccardo.scalco@gmail.com

"""Pykov documentation.

.. module:: pykov
    :synopsis: A Python module for finite Markov chains.
    :platform: Unix, Windows, Mac

.. moduleauthor::
    Riccardo Scalco <riccardo.scalco@gmail.com>

"""
from __future__ import division, print_function  # Python 2 compatibility

import random
import math
import six
import numpy
import sys

from collections import OrderedDict

import scipy.sparse as ss
import scipy.sparse.linalg as ssl

if sys.version_info < (2, 6):
    from sets import Set
else:
    Set = set

__date__ = 'March 2015'
__version__ = 1.1
__license__ = 'GNU General Public License Version 3'
__authors__ = 'Riccardo Scalco'
__many_thanks_to__ = 'Sandra Steiner, Nicky Van Foreest, Adel Qalieh'


def _del_cache(fn):
    """ Delete cache. """
    def wrapper(*args, **kwargs):
        self = args[0]
        for attr in ('_states', '_succ', '_pred', '_steady',
                     '_guess', '_fundamental_matrix'):
            try:
                delattr(self, attr)
            except AttributeError:
                pass
        return fn(*args, **kwargs)
    return wrapper
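
# Illustrative sketch (added example, not part of the original Pykov source):
# how _del_cache is meant to be used.  Any mutating method wrapped with it
# drops the cached attributes (_states, _succ, _pred, _steady, _guess,
# _fundamental_matrix) before the mutation runs, so lazily computed results
# are rebuilt on the next access.  The class below is hypothetical and only
# demonstrates the decorator; nothing runs at import time.
class _CacheInvalidationDemo(object):

    def states(self):
        try:
            return self._states
        except AttributeError:
            self._states = {'A', 'B'}  # pretend this is expensive to compute
            return self._states

    @_del_cache
    def mutate(self):
        # By the time this body runs, the decorator has already deleted
        # self._states, so the next states() call recomputes it.
        pass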
class PykovError(Exception):
    """
    Exception definition for Pykov errors.
    """
    def __init__(self, value):
        self.value = value

    def __str__(self):
        return repr(self.value)
class Vector(OrderedDict):
    """
    A mapping from states to real values, typically a probability
    distribution over the states of a chain.
    """
    def __init__(self, data=None, **kwargs):
        """
        >>> pykov.Vector({'A':.3, 'B':.7})
        {'A': 0.3, 'B': 0.7}
        >>> pykov.Vector(A=.3, B=.7)
        {'A': 0.3, 'B': 0.7}
        """
        OrderedDict.__init__(self)
        if data:
            self.update([item for item in six.iteritems(data)
                         if abs(item[1]) > numpy.finfo(float).eps])
        if len(kwargs):
            self.update([item for item in six.iteritems(kwargs)
                         if abs(item[1]) > numpy.finfo(float).eps])
    def __getitem__(self, key):
        """
        >>> q = pykov.Vector(C=.4, B=.6)
        >>> q['C']
        0.4
        >>> q['Z']
        0.0
        """
        try:
            return OrderedDict.__getitem__(self, key)
        except KeyError:
            return 0.0
    def __setitem__(self, key, value):
        """
        >>> q = pykov.Vector(C=.4, B=.6)
        >>> q['Z']=.2
        >>> q
        {'C': 0.4, 'B': 0.6, 'Z': 0.2}
        >>> q['Z']=0
        >>> q
        {'C': 0.4, 'B': 0.6}
        """
        if abs(value) > numpy.finfo(float).eps:
            OrderedDict.__setitem__(self, key, value)
        elif key in self:
            del self[key]
    def __mul__(self, M):
        """
        >>> p = pykov.Vector(A=.3, B=.7)
        >>> p * 3
        {'A': 0.9, 'B': 2.1}
        >>> q = pykov.Vector(C=.5, B=.5)
        >>> p * q
        0.35
        >>> T = pykov.Matrix({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> p * T
        {'A': 0.91, 'B': 0.09}
        >>> T * p
        {'A': 0.42, 'B': 0.3}
        """
        if isinstance(M, int) or isinstance(M, float):
            return self.__rmul__(M)
        if isinstance(M, Matrix):
            e2p, p2e = M._el2pos_()
            x = self._toarray(e2p)
            A = M._dok_(e2p).tocsr().transpose()
            y = A.dot(x)
            result = Vector()
            result._fromarray(y, e2p)
            return result
        elif isinstance(M, Vector):
            result = 0
            for state, value in six.iteritems(self):
                result += value * M[state]
            return result
        else:
            raise TypeError('unsupported operand type(s) for *:' +
                            ' \'Vector\' and ' + repr(type(M))[7:-1])
    def __rmul__(self, M):
        """
        >>> p = pykov.Vector(A=.3, B=.7)
        >>> 3 * p
        {'A': 0.9, 'B': 2.1}
        """
        if isinstance(M, int) or isinstance(M, float):
            result = Vector()
            for state, value in six.iteritems(self):
                result[state] = value * M
            return result
        else:
            raise TypeError('unsupported operand type(s) for *: ' +
                            repr(type(M))[7:-1] + ' and \'Vector\'')
    def __add__(self, v):
        """
        >>> p = pykov.Vector(A=.3, B=.7)
        >>> q = pykov.Vector(C=.5, B=.5)
        >>> p + q
        {'A': 0.3, 'C': 0.5, 'B': 1.2}
        """
        if isinstance(v, Vector):
            result = Vector()
            for state in set(six.iterkeys(self)) | set(v.keys()):
                result[state] = self[state] + v[state]
            return result
        else:
            raise TypeError('unsupported operand type(s) for +:' +
                            ' \'Vector\' and ' + repr(type(v))[7:-1])
    def __sub__(self, v):
        """
        >>> p = pykov.Vector(A=.3, B=.7)
        >>> q = pykov.Vector(C=.5, B=.5)
        >>> p - q
        {'A': 0.3, 'C': -0.5, 'B': 0.2}
        >>> q - p
        {'A': -0.3, 'C': 0.5, 'B': -0.2}
        """
        if isinstance(v, Vector):
            result = Vector()
            for state in set(six.iterkeys(self)) | set(v.keys()):
                result[state] = self[state] - v[state]
            return result
        else:
            raise TypeError('unsupported operand type(s) for -:' +
                            ' \'Vector\' and ' + repr(type(v))[7:-1])
    def _toarray(self, el2pos):
        """
        >>> p = pykov.Vector(A=.3, B=.7)
        >>> el2pos = {'A': 1, 'B': 0}
        >>> v = p._toarray(el2pos)
        >>> v
        array([ 0.7, 0.3])
        """
        p = numpy.zeros(len(el2pos))
        for key, value in six.iteritems(self):
            p[el2pos[key]] = value
        return p
    def _fromarray(self, arr, el2pos):
        """
        >>> p = pykov.Vector()
        >>> el2pos = {'A': 1, 'B': 0}
        >>> v = numpy.array([ 0.7, 0.3])
        >>> p._fromarray(v, el2pos)
        >>> p
        {'A': 0.3, 'B': 0.7}
        """
        for elem, pos in el2pos.items():
            self[elem] = arr[pos]
        return None
    def sort(self, reverse=False):
        """
        Return the list of (state, probability) pairs sorted according to
        the probability.

        >>> p = pykov.Vector({'A':.3, 'B':.1, 'C':.6})
        >>> p.sort()
        [('B', 0.1), ('A', 0.3), ('C', 0.6)]
        >>> p.sort(reverse=True)
        [('C', 0.6), ('A', 0.3), ('B', 0.1)]
        """
        res = list(six.iteritems(self))
        res.sort(key=lambda lst: lst[1], reverse=reverse)
        return res
    def normalize(self):
        """
        Normalize the vector in place so that its entries sum to 1.

        >>> p = pykov.Vector({'A':3, 'B':1, 'C':6})
        >>> p.normalize()
        >>> p
        {'A': 0.3, 'C': 0.6, 'B': 0.1}
        """
        s = self.sum()
        for k in six.iterkeys(self):
            self[k] = self[k] / s
    def choose(self, random_func=None):
        """
        Choose a state according to its probability.

        >>> p = pykov.Vector(A=.3, B=.7)
        >>> p.choose()
        'B'

        Optionally, a function that generates a random number can be supplied.

        >>> def FakeRandom(min, max): return 0.01
        >>> p = pykov.Vector(A=.05, B=.4, C=.4, D=.15)
        >>> p.choose(FakeRandom)
        'A'

        .. seealso::

            `Kevin Parks recipe <http://code.activestate.com/recipes/117241/>`_
        """
        if random_func is None:
            random_func = random.uniform
        n = random_func(0, 1)
        for state, prob in six.iteritems(self):
            if n < prob:
                break
            n = n - prob
        return state
    def entropy(self):
        r"""
        Return the entropy.

        .. math::

            H(p) = -\sum_i p_i \ln p_i

        .. seealso::

            Khinchin, A. I.
            Mathematical Foundations of Information Theory
            Dover, 1957.

        >>> p = pykov.Vector(A=.3, B=.7)
        >>> p.entropy()
        0.6108643020548935
        """
        return -sum([v * math.log(v) for v in self.values()])
    def relative_entropy(self, p):
        r"""
        Return the Kullback-Leibler distance.

        .. math::

            d(q,p) = \sum_i q_i \ln (q_i/p_i)

        .. note::

            The Kullback-Leibler distance is not symmetric.

        >>> p = pykov.Vector(A=.3, B=.7)
        >>> q = pykov.Vector(A=.4, B=.6)
        >>> p.relative_entropy(q)
        0.02160085414354654
        >>> q.relative_entropy(p)
        0.022582421084357485
        """
        states = set(six.iterkeys(self)) & set(p.keys())
        return sum([self[s] * math.log(self[s] / p[s]) for s in states])
    def copy(self):
        """
        Return a shallow copy.

        >>> p = pykov.Vector(A=.3, B=.7)
        >>> q = p.copy()
        >>> p['C'] = 1.
        >>> q
        {'A': 0.3, 'B': 0.7}
        """
        return Vector(self)
    def sum(self):
        """
        Sum the values.

        >>> p = pykov.Vector(A=.3, B=.7)
        >>> p.sum()
        1.0
        """
        return float(sum(self.values()))
    def dist(self, v):
        r"""
        Return the distance between the two probability vectors.

        .. math::

            d(q,p) = \sum_i |q_i - p_i|

        >>> p = pykov.Vector(A=.3, B=.7)
        >>> q = pykov.Vector(C=.5, B=.5)
        >>> q.dist(p)
        1.0
        """
        if isinstance(v, Vector):
            result = 0
            for state in set(six.iterkeys(self)) | set(v.keys()):
                result += abs(v[state] - self[state])
            return result
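
# Illustrative usage sketch (added example, not part of the original Pykov
# source).  It exercises the public Vector API defined above; the expected
# values in the comments follow the doctests.  Call _vector_demo() manually,
# e.g. from the __main__ block; nothing runs at import time.
def _vector_demo():
    p = Vector(A=.3, B=.7)
    q = Vector(C=.5, B=.5)
    print(p + q)                  # state-wise sum: A 0.3, C 0.5, B 1.2
    print(p * q)                  # dot product over common states: 0.35
    print(p.entropy())            # Shannon entropy, about 0.611
    r = Vector({'A': 3, 'B': 1, 'C': 6})
    r.normalize()                 # in place: entries now sum to 1
    print(r.sort(reverse=True))   # [('C', 0.6), ('A', 0.3), ('B', 0.1)]
    print(p.choose())             # random state, 'B' with probability 0.7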
class Matrix(OrderedDict):
    """
    A two-dimensional mapping: keys are (state, state) tuples and values are
    the corresponding matrix entries.
    """
    def __init__(self, data=None):
        """
        >>> T = pykov.Matrix({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        """
        OrderedDict.__init__(self)
        if data:
            self.update([item for item in six.iteritems(data)
                         if abs(item[1]) > numpy.finfo(float).eps])
    def __getitem__(self, *args):
        """
        >>> T = pykov.Matrix({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> T[('A','B')]
        0.3
        >>> T['A','B']
        0.3
        >>> T['A','C']
        0.0
        """
        try:
            return OrderedDict.__getitem__(self, args[0])
        except KeyError:
            return 0.0
    @_del_cache
    def __setitem__(self, key, value):
        """
        >>> T = pykov.Matrix()
        >>> T[('A','B')] = .3
        >>> T
        {('A', 'B'): 0.3}
        >>> T['A','A'] = .7
        >>> T
        {('A', 'B'): 0.3, ('A', 'A'): 0.7}
        >>> T['B','B'] = 0
        >>> T
        {('A', 'B'): 0.3, ('A', 'A'): 0.7}
        >>> T['A','A'] = 0
        >>> T
        {('A', 'B'): 0.3}
        >>> T = pykov.Matrix({('A','B'): 3, ('A','A'): 7, ('B','A'): .1})
        >>> T.states()
        {'A', 'B'}
        >>> T['A','C']=1
        >>> T.states()
        {'A', 'B', 'C'}
        >>> T['A','C']=0
        >>> T.states()
        {'A', 'B'}
        """
        if abs(value) > numpy.finfo(float).eps:
            OrderedDict.__setitem__(self, key, value)
        elif key in self:
            del self[key]
    @_del_cache
    def __delitem__(self, key):
        """
        >>> T = pykov.Matrix({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> del T['B', 'A']
        >>> T
        {('A', 'B'): 0.3, ('A', 'A'): 0.7}
        """
        OrderedDict.__delitem__(self, key)
    @_del_cache
    def pop(self, key):
        """
        Remove specified key and return the corresponding value.

        See: help(OrderedDict.pop)

        >>> T = pykov.Matrix({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> T.pop(('A','B'))
        0.3
        >>> T
        {('B', 'A'): 1.0, ('A', 'A'): 0.7}
        """
        return OrderedDict.pop(self, key)
    @_del_cache
    def popitem(self):
        """
        Remove and return some (key, value) pair as a 2-tuple.

        See: help(OrderedDict.popitem)

        >>> T = pykov.Matrix({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> T.popitem()
        (('B', 'A'), 1.0)
        >>> T
        {('A', 'B'): 0.3, ('A', 'A'): 0.7}
        """
        return OrderedDict.popitem(self)
    @_del_cache
    def clear(self):
        """
        Remove all keys.

        See: help(OrderedDict.clear)

        >>> T = pykov.Matrix({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> T.clear()
        >>> T
        {}
        """
        OrderedDict.clear(self)
    @_del_cache
    def update(self, other):
        """
        Update with keys and their values present in other.

        See: help(OrderedDict.update)

        >>> T = pykov.Matrix({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> d = {('B', 'C'):2}
        >>> T.update(d)
        >>> T
        {('B', 'A'): 1.0, ('B', 'C'): 2, ('A', 'B'): 0.3, ('A', 'A'): 0.7}
        """
        OrderedDict.update(self, other)
    @_del_cache
    def setdefault(self, k, *args):
        """
        See: help(OrderedDict.setdefault)

        >>> T = pykov.Matrix({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> T.setdefault(('A','A'),1)
        0.7
        >>> T
        {('B', 'A'): 1.0, ('A', 'B'): 0.3, ('A', 'A'): 0.7}
        >>> T.setdefault(('A','C'),1)
        1
        >>> T
        {('B', 'A'): 1.0, ('A', 'B'): 0.3, ('A', 'A'): 0.7, ('A', 'C'): 1}
        """
        return OrderedDict.setdefault(self, k, *args)
    def copy(self):
        """
        Return a shallow copy.

        >>> T = pykov.Matrix({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> W = T.copy()
        >>> T[('B','B')] = 1.
        >>> W
        {('B', 'A'): 1.0, ('A', 'B'): 0.3, ('A', 'A'): 0.7}
        """
        return Matrix(self)
    def __reduce__(self):
        """Return state information for pickling."""
        # Required because we changed the OrderedDict.__init__ signature.
        return (self.__class__, (), None, None, six.iteritems(self))
    def _dok_(self, el2pos, method=''):
        """
        Return a scipy.sparse.dok_matrix built from the entries.
        """
        m = len(el2pos)
        S = ss.dok_matrix((m, m))
        if method == '':
            for k, v in six.iteritems(self):
                i = el2pos[k[0]]
                j = el2pos[k[1]]
                S[i, j] = float(v)
        elif method == 'transpose':
            for k, v in six.iteritems(self):
                i = el2pos[k[0]]
                j = el2pos[k[1]]
                S[j, i] = float(v)
        return S
    def _from_dok_(self, mat, pos2el):
        """
        Fill the Matrix from a scipy.sparse.dok_matrix.
        """
        for ii, val in mat.items():
            self[pos2el[ii[0]], pos2el[ii[1]]] = val
        return None
    def _numpy_mat(self, el2pos):
        """
        Return a numpy.matrix object from a dictionary.

        -- Parameters --
        t_ij : the OrderedDict, values must be real numbers, keys should be
               tuples of two strings.
        el2pos : see _map()
        """
        m = len(el2pos)
        T = numpy.matrix(numpy.zeros((m, m)))
        for k, v in six.iteritems(self):
            T[el2pos[k[0]], el2pos[k[1]]] = v
        return T
    def _from_numpy_mat(self, T, pos2el):
        """
        Fill the Matrix from a numpy.matrix object.

        -- Parameters --
        T : the numpy.matrix.
        pos2el : see _map()
        """
        for i in range(len(T)):
            for j in range(len(T)):
                if T[i, j]:
                    self[(pos2el[i], pos2el[j])] = T[i, j]
        return None
    def _el2pos_(self):
        """
        Return the (element -> position, position -> element) mappings.
        """
        el2pos = {}
        pos2el = {}
        for pos, element in enumerate(list(self.states())):
            el2pos[element] = pos
            pos2el[pos] = element
        return el2pos, pos2el
    def stochastic(self):
        """
        Make the matrix right stochastic.

        Set the sum of every row equal to one; raise ``PykovError`` if that
        is not possible.

        >>> T = pykov.Matrix({('A','B'): 3, ('A','A'): 7, ('B','A'): .2})
        >>> T.stochastic()
        >>> T
        {('B', 'A'): 1.0, ('A', 'B'): 0.3, ('A', 'A'): 0.7}
        >>> T[('A','C')]=1
        >>> T.stochastic()
        pykov.PykovError: 'Zero links from state C'
        """
        s = {}
        for k, v in self.succ().items():
            summ = float(sum(v.values()))
            if summ:
                s[k] = summ
            else:
                raise PykovError('Zero links from state ' + k)
        for k in six.iterkeys(self):
            self[k] = self[k] / s[k[0]]
    def pred(self, key=None):
        """
        Return the predecessors of a state (if not indicated, of all states).

        In matrix notation: return the column of the indicated state.

        >>> T = pykov.Matrix({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> T.pred()
        {'A': {'A': 0.7, 'B': 1.0}, 'B': {'A': 0.3}}
        >>> T.pred('A')
        {'A': 0.7, 'B': 1.0}
        """
        try:
            if key is not None:
                return self._pred[key]
            else:
                return self._pred
        except AttributeError:
            self._pred = OrderedDict([(state, Vector())
                                      for state in self.states()])
            for link, probability in six.iteritems(self):
                self._pred[link[1]][link[0]] = probability
            if key is not None:
                return self._pred[key]
            else:
                return self._pred
    def succ(self, key=None):
        """
        Return the successors of a state (if not indicated, of all states).

        In matrix notation: return the row of the indicated state.

        >>> T = pykov.Matrix({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> T.succ()
        {'A': {'A': 0.7, 'B': 0.3}, 'B': {'A': 1.0}}
        >>> T.succ('A')
        {'A': 0.7, 'B': 0.3}
        """
        try:
            if key is not None:
                return self._succ[key]
            else:
                return self._succ
        except AttributeError:
            self._succ = OrderedDict([(state, Vector())
                                      for state in self.states()])
            for link, probability in six.iteritems(self):
                self._succ[link[0]][link[1]] = probability
            if key is not None:
                return self._succ[key]
            else:
                return self._succ
    def remove(self, states):
        """
        Return a copy of the Matrix without the indicated states.

        .. warning::

            All the links where the states appear are deleted, so that in
            general the result will not be a stochastic matrix.

        >>> T = pykov.Matrix({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> T.remove(['B'])
        {('A', 'A'): 0.7}
        >>> T = pykov.Chain({('A','B'): .3, ('A','A'): .7, ('B','A'): 1., ('C','D'): .5, ('D','C'): 1., ('C','B'): .5})
        >>> T.remove(['A','B'])
        {('C', 'D'): 0.5, ('D', 'C'): 1.0}
        """
        return Matrix(OrderedDict([(key, value)
                                   for key, value in six.iteritems(self)
                                   if key[0] not in states
                                   and key[1] not in states]))
    def states(self):
        """
        Return the set of states.

        >>> T = pykov.Matrix({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> T.states()
        {'A', 'B'}
        """
        try:
            return self._states
        except AttributeError:
            self._states = set()
            for link in six.iterkeys(self):
                self._states.add(link[0])
                self._states.add(link[1])
            return self._states
    def __pow__(self, n):
        """
        >>> T = pykov.Matrix({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> T**2
        {('A', 'B'): 0.21, ('B', 'A'): 0.70, ('A', 'A'): 0.79, ('B', 'B'): 0.30}
        >>> T**0
        {('A', 'A'): 1.0, ('B', 'B'): 1.0}
        """
        el2pos, pos2el = self._el2pos_()
        P = self._numpy_mat(el2pos)
        P = P**n
        res = Matrix()
        res._from_numpy_mat(P, pos2el)
        return res
    def pow(self, n):
        return self.__pow__(n)
    def __mul__(self, v):
        """
        >>> T = pykov.Matrix({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> T * 3
        {('B', 'A'): 3.0, ('A', 'B'): 0.9, ('A', 'A'): 2.1}
        >>> p = pykov.Vector(A=.3, B=.7)
        >>> T * p
        {'A': 0.42, 'B': 0.3}
        >>> W = pykov.Matrix({('N', 'M'): 0.5, ('M', 'N'): 0.7, ('M', 'M'): 0.3, ('O', 'N'): 0.5, ('O', 'O'): 0.5, ('N', 'O'): 0.5})
        >>> W * W
        {('N', 'M'): 0.15, ('M', 'N'): 0.21, ('M', 'O'): 0.35, ('M', 'M'): 0.44, ('O', 'M'): 0.25, ('O', 'N'): 0.25, ('O', 'O'): 0.5, ('N', 'O'): 0.25, ('N', 'N'): 0.6}
        """
        if isinstance(v, Vector):
            e2p, p2e = self._el2pos_()
            x = v._toarray(e2p)
            M = self._dok_(e2p).tocsr()
            y = M.dot(x)
            result = Vector()
            result._fromarray(y, e2p)
            return result
        elif isinstance(v, Matrix):
            e2p, p2e = self._el2pos_()
            M = self._dok_(e2p).tocsr()
            N = v._dok_(e2p).tocsr()
            C = M.dot(N).todok()
            if 'Chain' in repr(self.__class__):
                res = Chain()
            elif 'Matrix' in repr(self.__class__):
                res = Matrix()
            res._from_dok_(C, p2e)
            return res
        elif isinstance(v, int) or isinstance(v, float):
            return Matrix(OrderedDict([(key, value * v)
                                       for key, value in six.iteritems(self)]))
        else:
            raise TypeError('unsupported operand type(s) for *:' +
                            ' \'Matrix\' and ' + repr(type(v))[7:-1])
    def __rmul__(self, v):
        """
        >>> T = pykov.Matrix({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> 3 * T
        {('B', 'A'): 3.0, ('A', 'B'): 0.9, ('A', 'A'): 2.1}
        """
        if isinstance(v, int) or isinstance(v, float):
            return Matrix(OrderedDict([(key, value * v)
                                       for key, value in six.iteritems(self)]))
        else:
            raise TypeError('unsupported operand type(s) for *:' +
                            ' \'Matrix\' and ' + repr(type(v))[7:-1])
    def __add__(self, M):
        """
        >>> T = pykov.Matrix({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> I = pykov.Matrix({('A','A'):1, ('B','B'):1})
        >>> T + I
        {('B', 'A'): 1.0, ('A', 'B'): 0.3, ('A', 'A'): 1.7, ('B', 'B'): 1.0}
        """
        if isinstance(M, Matrix):
            result = Matrix()
            for link in set(six.iterkeys(self)) | set(M.keys()):
                result[link] = self[link] + M[link]
            return result
        else:
            raise TypeError('unsupported operand type(s) for +:' +
                            ' \'Matrix\' and ' + repr(type(M))[7:-1])
    def __sub__(self, M):
        """
        >>> T = pykov.Matrix({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> I = pykov.Matrix({('A','A'):1, ('B','B'):1})
        >>> T - I
        {('B', 'A'): 1.0, ('A', 'B'): 0.3, ('A', 'A'): -0.3, ('B', 'B'): -1}
        """
        if isinstance(M, Matrix):
            result = Matrix()
            for link in set(six.iterkeys(self)) | set(M.keys()):
                result[link] = self[link] - M[link]
            return result
        else:
            raise TypeError('unsupported operand type(s) for -:' +
                            ' \'Matrix\' and ' + repr(type(M))[7:-1])
    def trace(self):
        """
        Return the Matrix trace.

        >>> T = pykov.Matrix({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> T.trace()
        0.7
        """
        return sum([self[k, k] for k in self.states()])
    def eye(self):
        """
        Return the identity Matrix.

        >>> T = pykov.Matrix({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> T.eye()
        {('A', 'A'): 1.0, ('B', 'B'): 1.0}
        """
        return Matrix(OrderedDict([((state, state), 1.)
                                   for state in self.states()]))
    def ones(self):
        """
        Return a ``Vector`` instance with entries equal to one.

        >>> T = pykov.Matrix({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> T.ones()
        {'A': 1.0, 'B': 1.0}
        """
        return Vector(OrderedDict([(state, 1.) for state in self.states()]))
    def transpose(self):
        """
        Return the transpose Matrix.

        >>> T = pykov.Matrix({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> T.transpose()
        {('B', 'A'): 0.3, ('A', 'B'): 1.0, ('A', 'A'): 0.7}
        """
        return Matrix(OrderedDict([((key[1], key[0]), value)
                                   for key, value in six.iteritems(self)]))
    def _UMPFPACKSolve(self, b, x=None, method='UMFPACK_A'):
        r"""
        UMFPACK (Unsymmetric MultiFrontal PACKage)

        Parameters
        ----------
        method :
            "UMFPACK_A"  : \mathbf{A} x = b (default)
            "UMFPACK_At" : \mathbf{A}^T x = b

        References
        ----------
        A column pre-ordering strategy for the unsymmetric-pattern
        multifrontal method, T. A. Davis, ACM Transactions on Mathematical
        Software, vol 30, no. 2, June 2004, pp. 165-195.
        """
        e2p, p2e = self._el2pos_()
        if method == "UMFPACK_At":
            A = self._dok_(e2p).tocsr().transpose()
        else:
            A = self._dok_(e2p).tocsr()
        bb = b._toarray(e2p)
        x = ssl.spsolve(A, bb, use_umfpack=True)
        res = Vector()
        res._fromarray(x, e2p)
        return res
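
# Illustrative usage sketch (added example, not part of the original Pykov
# source).  It shows how Matrix entries are set and how stochastic() rescales
# the rows; the values in the comments follow the doctests above.  Call
# _matrix_demo() manually; nothing runs at import time.
def _matrix_demo():
    T = Matrix({('A', 'B'): 3, ('A', 'A'): 7, ('B', 'A'): .2})
    T.stochastic()       # rows rescaled in place so that each sums to one
    print(T)             # ('A','B'): 0.3, ('A','A'): 0.7, ('B','A'): 1.0
    p = Vector(A=.3, B=.7)
    print(p * T)         # row vector times matrix: A 0.91, B 0.09
    print(T * p)         # matrix times column vector: A 0.42, B 0.3
    print(T.transpose())      # ('B','A'): 0.3, ('A','B'): 1.0, ('A','A'): 0.7
    print((T ** 2).trace())   # trace of the two-step transition matrix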
class Chain(Matrix):
    """
    A Markov chain, represented as a right stochastic transition Matrix.
    """
    def move(self, state, random_func=None):
        """
        Do one step from the indicated state, and return the final state.

        >>> T = pykov.Chain({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> T.move('A')
        'B'

        Optionally, a function that generates a random number can be supplied.

        >>> def FakeRandom(min, max): return 0.01
        >>> T.move('A', FakeRandom)
        'B'
        """
        return self.succ(state).choose(random_func)
    def pow(self, p, n):
        """
        Find the probability distribution after n steps, starting from an
        initial ``Vector``.

        >>> T = pykov.Chain({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> p = pykov.Vector(A=1)
        >>> T.pow(p,3)
        {'A': 0.7629999999999999, 'B': 0.23699999999999996}
        >>> p * T * T * T
        {'A': 0.7629999999999999, 'B': 0.23699999999999996}
        """
        return p * self**n
    def steady(self):
        r"""
        With the assumption of ergodicity, return the steady state.

        .. note::

            Inverse iteration method (P is the Markov chain):

            .. math::

                Q = \mathbf{I} - P

                Q^T x = e

                e = (0,0,\dots,0,1)

        .. seealso::

            W. Stewart: Introduction to the Numerical Solution of Markov
            Chains, Princeton University Press, Chichester, West Sussex, 1994.

        >>> T = pykov.Chain({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> T.steady()
        {'A': 0.7692307692307676, 'B': 0.23076923076923028}
        """
        try:
            return self._steady
        except AttributeError:
            e2p, p2e = self._el2pos_()
            m = len(e2p)
            P = self._dok_(e2p).tocsr()
            Q = ss.eye(m, format='csr') - P
            e = numpy.zeros(m)
            e[-1] = 1.
            Q = Q.transpose()
            # Not elegant: perturb the diagonal to avoid a singular matrix
            # error.
            Q[0, 0] = Q[0, 0] + _machineEpsilon()
            x = ssl.spsolve(Q, e, use_umfpack=True)
            x = x / sum(x)
            res = Vector()
            res._fromarray(x, e2p)
            self._steady = res
            return res
    def entropy(self, p=None, norm=False):
        r"""
        Return the ``Chain`` entropy, calculated with the indicated
        probability Vector (the steady state by default).

        .. math::

            H_i = -\sum_j P_{ij} \ln P_{ij}

            H = \sum_i \pi_i H_i

        .. seealso::

            Khinchin, A. I.
            Mathematical Foundations of Information Theory
            Dover, 1957.

        >>> T = pykov.Chain({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> T.entropy()
        0.46989561696530169

        With normalization, the entropy belongs to [0, 1]:

        >>> T.entropy(norm=True)
        0.33895603665233132
        """
        if not p:
            p = self.steady()
        H = 0.
        for state in self.states():
            H += p[state] * sum([v * math.log(v)
                                 for v in self.succ(state).values()])
        if norm:
            n = len(self.states())
            return -H / (n * math.log(n))
        return -H
    def mfpt_to(self, state):
        """
        Return the Mean First Passage Times of every state to the indicated
        state.

        .. seealso::

            Kemeny J. G.; Snell, J. L.
            Finite Markov Chains.
            Springer-Verlag: New York, 1976.

        >>> d = {('R', 'N'): 0.25, ('R', 'S'): 0.25, ('S', 'R'): 0.25, ('R', 'R'): 0.5, ('N', 'S'): 0.5, ('S', 'S'): 0.5, ('S', 'N'): 0.25, ('N', 'R'): 0.5, ('N', 'N'): 0.0}
        >>> T = pykov.Chain(d)
        >>> T.mfpt_to('R')
        {'S': 3.333333333333333, 'N': 2.666666666666667}
        """
        if len(self.states()) == 2:
            self.states().remove(state)
            other = self.states().pop()
            self.states().add(state)
            self.states().add(other)
            return Vector({other: 1. / self[other, state]})
        T = self.remove([state])
        T = T.eye() - T
        return T._UMPFPACKSolve(T.ones())
    def adjacency(self):
        """
        Return the adjacency matrix.

        >>> T = pykov.Chain({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> T.adjacency()
        {('B', 'A'): 1, ('A', 'B'): 1, ('A', 'A'): 1}
        """
        return Matrix(OrderedDict.fromkeys(self, 1))
    def walk(self, steps, start=None, stop=None):
        """
        Return a random walk of n steps, starting and stopping at the
        indicated states.

        .. note::

            If the starting state is not indicated (or is `None`), it is
            chosen according to its steady-state probability. If the stopping
            state is not `None`, the random walk stops early when the
            stopping state is reached.

        >>> T = pykov.Chain({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> T.walk(10)
        ['B', 'A', 'B', 'A', 'A', 'B', 'A', 'A', 'A', 'B', 'A']
        >>> T.walk(10,'B','B')
        ['B', 'A', 'A', 'A', 'A', 'A', 'B']
        """
        if start is None:
            steady = self.steady()
            if len(steady) != 0:
                start = steady.choose()
            else:
                # There is no steady state, so choose a state uniformly at
                # random.
                start = random.sample(self.states(), 1)[0]
        if stop is None:
            result = [start]
            for i in range(steps):
                result.append(self.move(result[-1]))
            return result
        else:
            result = [start]
            for i in range(steps):
                result.append(self.move(result[-1]))
                if result[-1] == stop:
                    return result
            return result
    def walk_probability(self, walk):
        """
        Given a walk, return the log of its probability.

        >>> T = pykov.Chain({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> T.walk_probability(['A','A','B','A','A'])
        -1.917322692203401
        >>> math.exp(-1.917322692203401)
        0.147
        >>> p = T.walk_probability(['A','B','B','B','A'])
        >>> math.exp(p)
        0.0
        """
        res = 0
        for step in zip(walk[:-1], walk[1:]):
            if not self[step]:
                return -float('Inf')
            res += math.log(self[step])
        return res
    def mixing_time(self, cutoff=.25, jump=1, p=None):
        r"""
        Return the mixing time.

        If the initial distribution (p) is not indicated, it is set to
        p = {'least probable state': 1}.

        .. note::

            The mixing time is calculated here as the number of steps (n)
            needed to have

            .. math::

                |p(n) - \pi| < 0.25

                p(n) = p P^n

                \pi = \pi P

            The parameter ``jump`` controls the iteration step; for example,
            with ``jump=2`` n takes the values 2, 4, 6, 8, ...

        >>> d = {('R','R'):1./2, ('R','N'):1./4, ('R','S'):1./4, ('N','R'):1./2, ('N','N'):0., ('N','S'):1./2, ('S','R'):1./4, ('S','N'):1./4, ('S','S'):1./2}
        >>> T = pykov.Chain(d)
        >>> T.mixing_time()
        2
        """
        res = []
        d = 1
        n = 0
        if not p:
            p = Vector({self.steady().sort()[0][0]: 1})
        res.append(p.dist(self.steady()))
        while d > cutoff:
            n = n + jump
            p = self.pow(p, jump)
            d = p.dist(self.steady())
            res.append(d)
        return n
    def absorbing_time(self, transient_set):
        """
        Return the mean number of steps needed to leave the transient set.

        Return the ``Vector tau``: ``tau[i]`` is the mean number of steps
        needed to leave the transient set starting from state ``i``. The
        parameter ``transient_set`` is a subset of states.

        .. note::

            If the starting point is a ``Vector p``, then it is sufficient to
            calculate ``p * tau`` in order to weigh the mean times according
            to the initial conditions.

        .. seealso::

            Kemeny J. G.; Snell, J. L.
            Finite Markov Chains.
            Springer-Verlag: New York, 1976.

        >>> d = {('R','R'):1./2, ('R','N'):1./4, ('R','S'):1./4, ('N','R'):1./2, ('N','N'):0., ('N','S'):1./2, ('S','R'):1./4, ('S','N'):1./4, ('S','S'):1./2}
        >>> T = pykov.Chain(d)
        >>> p = pykov.Vector({'N':.3, 'S':.7})
        >>> tau = T.absorbing_time(p.keys())
        >>> p * tau
        3.1333333333333329
        """
        Q = self.remove(self.states() - set(transient_set))
        K = Q.eye() - Q
        # mean times
        tau = K._UMPFPACKSolve(K.ones())
        return tau
    def absorbing_tour(self, p, transient_set=None):
        """
        Return a ``Vector v``: ``v[i]`` is the mean of the total number of
        times the process is in the transient state ``i`` before leaving the
        transient set.

        .. note::

            ``v.sum()`` is equal to ``p * tau`` (see the
            :meth:`absorbing_time` method). If not specified, the
            ``transient_set`` is defined by means of the ``Vector p``.

        .. seealso::

            Kemeny J. G.; Snell, J. L.
            Finite Markov Chains.
            Springer-Verlag: New York, 1976.

        >>> d = {('R','R'):1./2, ('R','N'):1./4, ('R','S'):1./4, ('N','R'):1./2, ('N','N'):0., ('N','S'):1./2, ('S','R'):1./4, ('S','N'):1./4, ('S','S'):1./2}
        >>> T = pykov.Chain(d)
        >>> p = pykov.Vector({'N':.3, 'S':.7})
        >>> T.absorbing_tour(p)
        {'S': 2.2666666666666666, 'N': 0.8666666666666669}
        """
        if transient_set:
            Q = self.remove(self.states() - transient_set)
        else:
            Q = self.remove(self.states() - set(p.keys()))
        K = Q.eye() - Q
        return K._UMPFPACKSolve(p, method='UMFPACK_At')
    def fundamental_matrix(self):
        """
        Return the fundamental matrix.

        .. seealso::

            Kemeny J. G.; Snell, J. L.
            Finite Markov Chains.
            Springer-Verlag: New York, 1976.

        >>> T = pykov.Chain({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> T.fundamental_matrix()
        {('B', 'A'): 0.17751479289940991, ('A', 'B'): 0.053254437869822958, ('A', 'A'): 0.94674556213017902, ('B', 'B'): 0.82248520710059214}
        """
        try:
            return self._fundamental_matrix
        except AttributeError:
            el2pos, pos2el = self._el2pos_()
            p = self.steady()._toarray(el2pos)
            P = self._numpy_mat(el2pos)
            d = len(p)
            A = numpy.matrix([p for i in range(d)])
            I = numpy.matrix(numpy.identity(d))
            # E = numpy.matrix(numpy.ones((d, d)))
            D = numpy.zeros((d, d))
            diag = 1. / p
            for pos, val in enumerate(diag):
                D[pos, pos] = val
            Z = numpy.linalg.inv(I - P + A)
            res = Matrix()
            res._from_numpy_mat(Z, pos2el)
            self._fundamental_matrix = res
            return res
    def kemeny_constant(self):
        """
        Return the Kemeny constant of the transition matrix.

        >>> T = pykov.Chain({('A','B'): .3, ('A','A'): .7, ('B','A'): 1.})
        >>> T.kemeny_constant()
        1.7692307692307712
        """
        Z = self.fundamental_matrix()
        return Z.trace()
    def accessibility_matrix(self):
        """
        Return the accessibility matrix of the Markov chain.

        .. seealso::

            http://www.ssc.wisc.edu/~jmontgom/commclasses.pdf
        """
        el2pos, pos2el = self._el2pos_()
        Z = self.adjacency()
        I = self.eye()
        n = len(self.states())
        A = (I + Z)**(n - 1)
        numpy_A = A._numpy_mat(el2pos)
        numpy_A = numpy_A > 0
        numpy_A = numpy_A.astype(int)
        res = Matrix()
        res._from_numpy_mat(numpy_A, pos2el)
        return res
    def is_accessible(self, i, j):
        """
        Return whether state j is accessible from state i.
        """
        A = self.accessibility_matrix()
        # Missing entries are not stored, so fall back to 0 (comparing None
        # with 0 would fail on Python 3).
        return A.get((i, j), 0) > 0
    def communicates(self, i, j):
        """
        Return whether states i and j communicate.
        """
        return self.is_accessible(i, j) and self.is_accessible(j, i)
    def communication_classes(self):
        """
        Return the set of all communication classes of the Markov chain.

        .. seealso::

            http://www.ssc.wisc.edu/~jmontgom/commclasses.pdf

        >>> T = pykov.Chain({('A','A'): 1.0, ('B','B'): 1.0})
        >>> T.communication_classes()
        """
        el2pos, pos2el = self._el2pos_()
        A = self.accessibility_matrix()
        numpy_A = A._numpy_mat(el2pos)
        numpy_A_trans = numpy.transpose(numpy_A)
        numpy_res = numpy.logical_and(numpy_A, numpy_A_trans)
        numpy_res = numpy_res.astype(int)
        # Remove duplicate rows; the remaining rows give the communication
        # classes.
        # ref: http://stackoverflow.com/questions/16970982/find-unique-rows-in-numpy-array
        a = numpy_res
        b = numpy.ascontiguousarray(a).view(
            numpy.dtype((numpy.void, a.dtype.itemsize * a.shape[1])))
        _, idx = numpy.unique(b, return_index=True)
        unique_a = a[idx]
        res = Set()
        for row in unique_a:
            # Each iteration here builds one communication class.
            comm_class = Set()
            number_of_elements = len(A.states())
            for el in range(number_of_elements):
                if row[0, el] == 1:
                    comm_class.add(pos2el[el])
            # A frozenset is needed: mutable sets are not hashable and could
            # not be added to the result set.
            res.add(frozenset(comm_class))
        return res
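
# Illustrative usage sketch (added example, not part of the original Pykov
# source): a two-state chain exercising the Chain API defined above; the
# values in the comments follow the doctests.  Call _chain_demo() manually;
# nothing runs at import time.
def _chain_demo():
    T = Chain({('A', 'B'): .3, ('A', 'A'): .7, ('B', 'A'): 1.})
    print(T.steady())           # stationary distribution: A ~0.769, B ~0.231
    print(T.walk(10))           # a random walk of 10 steps
    print(T.mfpt_to('A'))       # mean first passage times to state 'A'
    print(T.entropy())          # chain entropy, about 0.470
    print(T.kemeny_constant())  # about 1.769
    print(T.is_accessible('A', 'B'))  # True: 'B' can be reached from 'A'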
def readmat(filename):
    """
    Read an external file and return a Chain.

    The file must be of the form::

        A A .7
        A B .3
        B A 1

    Example
    -------
    >>> P = pykov.readmat('/mypath/mat')
    >>> P
    {('B', 'A'): 1.0, ('A', 'B'): 0.3, ('A', 'A'): 0.7}
    """
    with open(filename) as f:
        P = Chain()
        for line in f:
            tmp = line.split()
            P[(tmp[0], tmp[1])] = float(tmp[2])
        return P
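
# Illustrative usage sketch (added example, not part of the original Pykov
# source): write a small transition file to a temporary location and read it
# back with readmat().  Call _readmat_demo() manually; nothing runs at import
# time.
def _readmat_demo():
    import os
    import tempfile
    fd, path = tempfile.mkstemp()
    with os.fdopen(fd, 'w') as f:
        f.write('A A .7\nA B .3\nB A 1\n')
    P = readmat(path)
    os.remove(path)
    print(P)   # ('B','A'): 1.0, ('A','B'): 0.3, ('A','A'): 0.7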
def readtrj(filename):
    """
    Read a finite chain of states from an external file.

    When the :class:`Chain` instance must be created from a finite chain of
    states, the transition matrix is not fully defined. The function
    :func:`maximum_likelihood_probabilities` defines the transition
    probabilities as the maximum likelihood probabilities calculated along
    the chain.

    Having the file ``/mypath/trj`` with the following format::

        1
        1
        1
        2
        1
        3

    the :class:`Chain` instance defined from that chain is:

    >>> t = pykov.readtrj('/mypath/trj')
    >>> t
    (1, 1, 1, 2, 1, 3)
    >>> p, P = maximum_likelihood_probabilities(t, lag_time=1, separator='0')
    >>> p
    {1: 0.6666666666666666, 2: 0.16666666666666666, 3: 0.16666666666666666}
    >>> P
    {(1, 2): 0.25, (1, 3): 0.25, (1, 1): 0.5, (2, 1): 1.0, (3, 3): 1.0}
    >>> type(P)
    <class 'pykov.Chain'>
    >>> type(p)
    <class 'pykov.Vector'>
    """
    with open(filename) as f:
        return tuple(line.strip() for line in f)
def _writefile(mylist, filename):
    """
    Export the list to a file.

    mylist could be a list of lists.

    Example
    -------
    >>> L = [[2,3],[4,5]]
    >>> pykov._writefile(L, 'tmp')
    >>> l = [1,2]
    >>> pykov._writefile(l, 'tmp')
    """
    try:
        L = [[str(i) for i in line] for line in mylist]
    except TypeError:
        L = [str(i) for i in mylist]
    with open(filename, mode='w') as f:
        tmp = '\n'.join('\t'.join(x) for x in L)
        f.write(tmp)
    return None
def transitions(trj, nsteps=1, lag_time=1, separator='0'):
    """
    Return the temporal list of transitions observed.

    Parameters
    ----------
    trj : the symbolic trajectory.
    nsteps : number of steps.
    lag_time : step length.
    separator : the special symbol indicating the presence of
                sub-trajectories.

    Example
    -------
    >>> trj = [1,2,1,0,2,3,1,0,2,3,2,3,1,2,3]
    >>> pykov.transitions(trj,1,1,0)
    [(1, 2), (2, 1), (2, 3), (3, 1), (2, 3), (3, 2), (2, 3), (3, 1), (1, 2), (2, 3)]
    >>> pykov.transitions(trj,1,2,0)
    [(1, 1), (2, 1), (2, 2), (3, 3), (2, 1), (3, 2), (1, 3)]
    >>> pykov.transitions(trj,2,2,0)
    [(2, 2, 1), (3, 3, 2), (2, 1, 3)]
    """
    result = []
    for pos in range(len(trj) - nsteps * lag_time):
        if separator not in trj[pos:(pos + nsteps * lag_time + 1)]:
            tmp = trj[pos:(pos + nsteps * lag_time + 1):lag_time]
            result.append(tuple(tmp))
    return result
def maximum_likelihood_probabilities(trj, lag_time=1, separator='0'):
    """
    Return a Chain calculated by means of maximum likelihood probabilities.

    Return two objects:

    p : a Vector object, the probability distribution over the nodes.
    T : a Chain object, the Markov chain.

    Parameters
    ----------
    trj : the symbolic trajectory.
    lag_time : number of steps defining a transition.
    separator : the special symbol indicating the presence of
                sub-trajectories.

    Example
    -------
    >>> t = [1,2,3,2,3,2,1,2,2,3,3,2]
    >>> p, T = pykov.maximum_likelihood_probabilities(t)
    >>> p
    {1: 0.18181818181818182, 2: 0.4545454545454546, 3: 0.36363636363636365}
    >>> T
    {(1, 2): 1.0, (3, 2): 0.7499999999999999, (2, 3): 0.5999999999999999, (3, 3): 0.25, (2, 2): 0.19999999999999998, (2, 1): 0.19999999999999998}
    """
    q_ij = {}
    tr = transitions(trj, nsteps=1, lag_time=lag_time, separator=separator)
    _remove_dead_branch(tr)
    tot = len(tr)
    for step in tr:
        q_ij[step] = q_ij.get(step, 0.) + 1
    for key in q_ij.keys():
        q_ij[key] = q_ij[key] / tot
    p_i = {}
    for k, v in q_ij.items():
        p_i[k[0]] = p_i.get(k[0], 0) + v
    t_ij = {}
    for k, v in q_ij.items():
        t_ij[k] = v / p_i[k[0]]
    T = Chain(t_ij)
    p = Vector(p_i)
    T._guess = Vector(p_i)
    return p, T
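
# Illustrative usage sketch (added example, not part of the original Pykov
# source): estimate a Chain from a symbolic trajectory with the maximum
# likelihood estimator defined above; the trajectory is the one used in the
# doctest.  Call _mle_demo() manually; nothing runs at import time.
def _mle_demo():
    t = [1, 2, 3, 2, 3, 2, 1, 2, 2, 3, 3, 2]
    p, T = maximum_likelihood_probabilities(t, lag_time=1)
    print(p)          # occupation probabilities of states 1, 2 and 3
    print(T)          # estimated transition probabilities
    print(T.succ(2))  # transition probabilities out of state 2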
def _remove_dead_branch(transitions_list):
    """
    Remove dead branches by inserting a self-loop in every node that has no
    outgoing links.

    Example
    -------
    >>> trj = [1,2,3,1,2,3,2,2,4,3,5]
    >>> tr = pykov.transitions(trj, nsteps=1)
    >>> tr
    [(1, 2), (2, 3), (3, 1), (1, 2), (2, 3), (3, 2), (2, 2), (2, 4), (4, 3), (3, 5)]
    >>> pykov._remove_dead_branch(tr)
    >>> tr
    [(1, 2), (2, 3), (3, 1), (1, 2), (2, 3), (3, 2), (2, 2), (2, 4), (4, 3), (3, 5), (5, 5)]
    """
    head_set = set()
    tail_set = set()
    for step in transitions_list:
        head_set.add(step[1])
        tail_set.add(step[0])
    for head in head_set:
        if head not in tail_set:
            transitions_list.append((head, head))
    return None
def _machineEpsilon(func=float):
    """
    Should give the same result as numpy.finfo(float).eps.
    """
    machine_epsilon = func(1)
    while func(1) + func(machine_epsilon) != func(1):
        machine_epsilon_last = machine_epsilon
        machine_epsilon = func(machine_epsilon) / func(2)
    return machine_epsilon_last
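
# Small sanity check (added example, not part of the original Pykov source):
# _machineEpsilon() should agree with NumPy's float64 epsilon.  Call
# _machine_epsilon_demo() manually; nothing runs at import time.
def _machine_epsilon_demo():
    print(_machineEpsilon())        # about 2.22e-16
    print(numpy.finfo(float).eps)   # the same value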
# --- Debugging
if __name__ == "__main__":
    # Code for debugging purposes.
    from doctest import testmod
    print("\nAutomatically testing all the docstrings of this module:")
    testmod(verbose=True)