Source code for sisl.sparse

""" 
Sparsity pattern used to express matrices in concise manners.
"""
from __future__ import print_function, division

import warnings
from numbers import Integral, Real, Complex

# To speed up the extension algorithm we limit
# the lookup table
import numpy as np
from numpy import where, insert, diff
from numpy import array, asarray, empty, zeros, arange
from numpy import intersect1d, setdiff1d
from numpy import argsort, unique, in1d

from scipy.sparse import isspmatrix
from scipy.sparse import coo_matrix, isspmatrix_coo
from scipy.sparse import csr_matrix, isspmatrix_csr
from scipy.sparse import csc_matrix, isspmatrix_csc
from scipy.sparse import lil_matrix, isspmatrix_lil


from sisl._help import ensure_array, get_dtype
from sisl._help import _range as range, _zip as zip


# Although this re-implements the CSR in scipy.sparse.csr_matrix
# we use it slightly differently and thus require this new sparse pattern.

__all__ = ['SparseCSR', 'ispmatrix', 'ispmatrixd']


def indices_single(col, value, offset=0):
    """ Return indices of values in col with a possible offset """
    w = where(col == value)[0]
    if len(w) == 0:
        return -1
    else:
        return offset + w[0]

# Vectorize the function,
# The return-type is always numpy.int32
# The column indices are passed "as-is" via the
# excluded keyword
indices = np.vectorize(indices_single, otypes=[np.int32],
                       excluded=[0, 'col'])


[docs]class SparseCSR(object):
    """
    A compressed sparse row matrix, slightly different than ``scipy.sparse.csr_matrix``.

    This class holds all required information regarding the CSR matrix format.

    Note that this sparse matrix of data does not retain the number of columns
    in the matrix, i.e. it has no way of determining whether the input is 
    correct.
    """

    def __init__(self, arg1, dim=1, dtype=None,
                 nnzpr=20, nnz=None,
                 **kwargs):
        """ Initialize a new sparse CSR matrix

        This sparse matrix class tries to resemble the
        ``scipy.sparse.csr_matrix`` as much as possible with
        the difference of this class being multi-dimensional.

        Creating a new sparse matrix is much similar to the 
        ``scipy`` equivalent.

        `nzs` is only used if `nzs > nr * nzsr`.

        This class may be instantiated by verious means.

        - `SparseCSR(S)`
          where `S` is a ``scipy.sparse`` matrix
        - `SparseCSR((M,N)[, dtype])`
          the shape of the sparse matrix (equivalent
          to `SparseCSR((M,N,K)[, dtype])`.
        - `SparseCSR((M,N,K)[, dtype])`
          creating a sparse matrix with `M` rows, `N` columns
          and `K` elements per sparse element.

        Additionally these parameters control the
        creation of the sparse matrix

        Parameters
        ----------
        nnzpr : int, 20
           initial number of non-zero elements per row.
           Only used if `nnz` is not supplied
        nnz : int
           initial total number of non-zero elements
           This quantity has precedence over `nnzpr`
        dim : int, 1
           number of elements stored per sparse element, only used if (M,N) is passed
        dtype : numpy data type, `numpy.float64`
           data type of the matrix

        Attributes
        ----------
        ncol: int-array, `self.shape[0]`
           number of entries per row
        ptr: int-array, `self.shape[0]+1`
           pointer index in the 1D column indices of the corresponding row
        col: int-array, 
           column indices of the sparse elements
        data: 
           the data in the sparse matrix
        dim: int
           the extra dimension of the sparse matrix
        nnz: int
           number of contained sparse elements
        shape: tuple, 3*(,)
           size of contained matrix, M, N, K
        finalized: boolean
           whether the sparse matrix is finalized and non-set elements
           are removed
        """

        # step size in sparse elements
        # If there isn't enough room for adding
        # a non-zero element, the # of elements
        # for the insert row is increased at least by this number
        self._ns = 10

        if isspmatrix(arg1):
            # This is a sparse matrix
            # The data-type is infered from the
            # input sparse matrix.
            arg1 = arg1.tocsr()
            self.__init__((arg1.data, arg1.indices, arg1.indptr),
                          dim=dim, dtype=dtype, **kwargs)

        elif isinstance(arg1, (tuple, list)):

            if isinstance(arg1[0], Integral):
                self.__init_shape(arg1, dim=dim, dtype=dtype,
                                  nnzpr=nnzpr, nnz=nnz,
                                  **kwargs)

            elif len(arg1) != 3:
                raise ValueError(('The sparse array *must* be created '
                                  'with data, indices, indptr'))
            else:

                if dtype is None:
                    # The first element is the data
                    dtype = arg1[0].dtype

                # The first *must* be some sort of array
                if 'shape' in kwargs:
                    shape = kwargs['shape']
                else:
                    M = len(arg1[2])-1
                    N = ((np.amax(arg1[1]) // M) + 1) * M
                    shape = (M, N)

                self.__init_shape(shape, dim=dim, dtype=dtype,
                                  nnz=1,
                                  **kwargs)

                # Copy data to the arrays
                self.ptr = arg1[2]
                self.ncol = diff(self.ptr)
                self.col = arg1[1]
                self._nnz = len(self.col)
                self._D = np.empty([len(arg1[1]), self.shape[-1]], dtype=self.dtype)
                self._D[:, 0] = arg1[0]

                self.finalize()

    def __init_shape(self, arg1, dim=1, dtype=None,
                     nnzpr=20, nnz=None,
                     **kwargs):

        # The shape of the data...
        if len(arg1) == 2:
            # extend to extra dimension
            arg1 = arg1 + (dim,)
        elif len(arg1) != 3:
            raise ValueError("unrecognized shape input, either a 2-tuple or 3-tuple is required")

        # Set default dtype
        if dtype is None:
            dtype = np.float64

        # unpack size
        M, N, K = arg1

        # Store shape
        self._shape = (M, N, K)

        # Check default construction of sparse matrix
        nnzpr = max(nnzpr, 1)

        # Re-create options
        if nnz is None:
            # number of non-zero elements is NOT given
            nnz = M * nnzpr

        else:
            # number of non-zero elements is give AND larger
            # than the provided non-zero elements per row
            nnzpr = nnz // M

        # Correct input in case very few elements are requested
        nnzpr = max(nnzpr, 1)
        nnz = max(nnz, nnzpr * M)

        # Store number of columns currently hold
        # in the sparsity pattern
        self.ncol = np.zeros([M], np.int32)
        # Create pointer array
        self.ptr = np.cumsum(np.array([nnzpr] * (M+1), np.int32)) - nnzpr
        # Create column array
        self.col = np.empty(nnz, np.int32)
        # Store current number of non-zero elements
        self._nnz = 0

        # Important that this is zero
        # For instance one may set one dimension at a time
        # thus automatically zeroing the other dimensions.
        self._D = np.zeros([nnz, K], dtype)

        # Denote that this sparsity pattern hasn't been finalized
        self._finalized = False

[docs]    def empty(self, keep=False):
        """ Delete all sparse information from the sparsity pattern

        Essentially this deletes all entries.

        Parameters
        ----------
        keep: boolean, False
           if `True` it will keep the sparse elements _as is_.
           I.e. it will merely set the stored sparse elements as zero.
           This may be advantagegous when re-constructing a new sparse 
           matrix from an old sparse matrix
        """
        self._D[:, :] = 0.

        if not keep:
            self._finalized = False
            # The user does not wish to retain the
            # sparse pattern
            self.ncol[:] = 0
            self._nnz = 0
            # We do not mess with the other arrays
            # they may be obscure data any-way.

    @property
    def shape(self):
        """ Return shape of the sparse matrix """
        return self._shape

    @property
    def dim(self):
        """ Return extra dimensionality of the sparse matrix """
        return self.shape[2]

    @property
    def data(self):
        """ Return data contained in the sparse matrix """
        return self._D

    @property
    def dtype(self):
        """ Return the data-type in the sparse matrix """
        return self._D.dtype

    @property
    def nnz(self):
        """ Return number of non-zero elements in the sparsity pattern """
        return self._nnz

    def __len__(self):
        """ Return number of non-zero elements in the sparse pattern """
        return self.nnz

    @property
    def finalized(self):
        """ Whether the contained data is finalized and non-used elements have been removed """
        return self._finalized

[docs]    def finalize(self, sort=True):
        """ Finalizes the sparse matrix by removing all non-set elements

        One may still interact with the sparse matrix as one would previously.

        NOTE: This is mainly an internal used routine to ensure data structure
        when converting to ``scipy.sparse.csr_matrix``

        Parameters
        ----------
        sort: bool, True
           sort the column indices for each row
        """
        if self.finalized:
            return

        # Fast reference
        ptr = self.ptr
        ncol = self.ncol
        col = self.col
        D = self._D

        # We truncate all the connections
        iptr = 0
        for r in range(self.shape[0]):

            # number of elements in this row
            nor = ncol[r]

            # Starting pointer index
            sptr = ptr[r]
            eptr = sptr + nor

            # update current row pointer
            ptr[r] = iptr

            if nor == 0:
                continue

            # assert no two connections
            if unique(col[sptr:eptr]).shape[0] != nor:
                raise ValueError(
                    'You cannot have two hoppings between the same ' +
                    'orbitals ({}), something has went terribly wrong.'.format(r))

            # update the colunm vector and data
            col[iptr:iptr + nor] = col[sptr:eptr]
            D[iptr:iptr + nor, :] = D[sptr:eptr, :]

            # Simultaneausly we sort the entries
            if sort:
                si = argsort(col[iptr:iptr + nor])
                col[iptr:iptr + nor] = col[iptr + si]
                D[iptr:iptr + nor, :] = D[iptr + si, :]

            # update front of row
            iptr += nor

        # Correcting the size of the pointer array
        ptr[self.shape[0]] = iptr

        if iptr != self.nnz:
            print(iptr, self.nnz)
            raise ValueError('Final size in the sparse matrix finalization '
                             'went wrong.')

        # Truncate values to correct size
        self._D = self._D[:self.nnz, :]
        self.col = self.col[:self.nnz]

        # Check that all column indices are within the expected shape
        if np.any(self.shape[1] <= self.col):
            warnings.warn("Sparse matrix contains column indices outside the shape "
                          "of the matrix. Data may not represent what you had expected")

        # Signal that we indeed have finalized the data
        self._finalized = True

[docs]    def spsame(self, other):
        """ Check whether two sparse matrices have the same non-zero elements

        Parameters
        ----------
        other : SparseCSR

        Returns
        -------
        bool :
            True if the same non-zero elements are in the matrices.
        """

        if self.shape[:2] != other.shape[:2]:
            return False

        def samesect1d(a, b):
            n = len(a)
            if n != len(b):
                return False
            return len(intersect1d(a, b)) == n

        for r in range(self.shape[0]):
            # pointers
            sptr = self.ptr[r]
            sn = self.ncol[r]
            optr = other.ptr[r]
            on = other.ncol[r]

            if not samesect1d(self.col[sptr:sptr+sn],
                              other.col[optr:optr+on]):
                return False
        return True

[docs]    def spalign(self, other):
        """ Aligns this sparse matrix with the sparse elements of the other sparse matrix

        Routine for ensuring that all non-zero elements in `other` are also in this
        object.

        I.e. this will, possibly, change the sparse elements in-place.

        A `ValueError` will be raised if the shapes are not mergeable.

        Parameters
        ----------
        other : SparseCSR
           the other sparse matrix to align.
        """

        if self.shape[:2] != other.shape[:2]:
            raise ValueError('Aligning two sparse matrices requires same shapes')

        for r in range(self.shape[0]):

            # pointers
            sptr = self.ptr[r]
            sn = self.ncol[r]
            optr = other.ptr[r]
            on = other.ncol[r]

            adds = setdiff1d(other.col[optr:optr+on], self.col[sptr:sptr+sn])
            if len(adds) > 0:
                # simply extend the elements
                self._extend(r, adds)

[docs]    def iter_nnz(self, row=None):
        """ Iterations of the non-zero elements, returns a tuple of row and column with non-zero elements

        An iterator returning the current row index and the corresponding column index.

        >>> for r, c in self:

        In the above case `r` and `c` are rows and columns such that

        >>> self[r, c] 

        returns the non-zero element of the sparse matrix.

        Parameters
        ----------
        row : `int=<all>`, `array_like`
           only loop on the given row(s) default to all rows
        """
        if row is None:
            # loop on rows
            for r in range(self.shape[0]):
                n = self.ncol[r]
                ptr = self.ptr[r]
                for c in self.col[ptr:ptr+n]:
                    yield r, c
        else:
            for r in ensure_array(row):
                n = self.ncol[r]
                ptr = self.ptr[r]
                for c in self.col[ptr:ptr+n]:
                    yield r, c

    # Define default iterator
    __iter__ = iter_nnz

    def _extend(self, i, j):
        """ Extends the sparsity pattern to retain elements `j` in row `i`

        Parameters
        ----------
        i : int
           the row of the matrix
        j : int, array-like
           columns belonging to row ``i`` where a non-zero element is stored.

        Returns
        -------
        index : array-like
           the indicies of the existing/added elements. 
        """

        # We skip this check and let sisl die if wrong input is given...
        #if not isinstance(i, Integral):
        #    raise ValueError("Retrieving/Setting elements in a sparse matrix"
        #                     " must only be performed at one row-element at a time.\n"
        #                     "However, multiple columns at a time are allowed.")

        # Ensure flattened array...
        j = ensure_array(j)
        if len(j) == 0:
            return np.array([], np.int32)

        # fast reference
        ptr = self.ptr
        ncol = self.ncol
        col = self.col

        # To create the indices for the sparse elements
        # we first find which values are _not_ in the sparse
        # matrix
        if ncol[i] > 0:

            # Checks whether any non-zero elements are
            # already in the sparse pattern
            # If so we remove those from the j
            exists = intersect1d(j, col[ptr[i]:ptr[i]+ncol[i]],
                                 assume_unique=True)
        else:
            exists = np.array([], np.int32)

        # Get list of new elements to be added
        new_j = setdiff1d(j, exists, assume_unique=True)
        new_n = len(new_j)

        # Check how many elements cannot fit in the currently
        # allocated sparse matrix...
        new_nnz = ncol[i] + new_n - (ptr[i + 1] - ptr[i])

        if new_nnz > 0:

            # Ensure that it is not-set as finalized
            # There is no need to set it all the time.
            # Simply because the first call to finalize
            # will reduce the sparsity pattern, which
            # on first expansion calls this part.
            self._finalized = False

            # Get how much larger we wish to create the sparse matrix...
            ns = max(self._ns, new_nnz)

            # ...expand size of the sparsity pattern...

            # Insert pointer of new data
            iptr = ptr[i] + ncol[i]

            # Insert new empty elements in the column index
            # after the column
            self.col = insert(self.col, iptr,
                              empty(ns, self.col.dtype))

            # update reference
            col = self.col

            # Insert zero data in the data array
            # We use `zeros` as then one may set each dimension
            # individually...
            self._D = insert(self._D, ptr[i+1],
                             zeros([ns, self.shape[2]], self._D.dtype), axis=0)

            # Lastly, shift all pointers above this row to account for the
            # new non-zero elements
            ptr[i + 1:] += ns

        if new_n > 0:
            # Ensure that we write the new elements to the matrix...

            # new data begins from this index location
            old_ptr = ptr[i] + ncol[i]

            # assign the column indices for the new entries
            # NOTE that this may not assign them in the order
            # of entry as new_j is sorted and thus new_j != j
            col[old_ptr:old_ptr + new_n] = new_j[:]

            # Step the size of the stored non-zero elements
            ncol[i] += new_n

            # Step the number of non-zero elements
            self._nnz += new_n

        # Now we have extended the sparse matrix to hold all
        # information that is required...

        # ... retrieve the indices and return
        return indices(col[ptr[i]:ptr[i] + ncol[i]], j, ptr[i])

    def _get(self, i, j):
        """ Retrieves the data pointer arrays of the elements, if it is non-existing, it will return -1

        Parameters
        ----------
        i : int
           the row of the matrix
        j : int, array-like
           columns belonging to row ``i`` where a non-zero element is stored.

        Returns
        -------
        index : array-like
           the indicies of the existing elements. 
        """

        # Ensure flattened array...
        j = asarray(j, np.int32).flatten()

        # Make it a little easier
        ptr = self.ptr[i]

        return indices(self.col[ptr:ptr+self.ncol[i]], j, ptr)

    def __delitem__(self, key):
        """ Remove items from the sparse patterns """
        # Get indices of sparse data (-1 if non-existing)
        i = key[0]
        index = self._get(i, key[1])

        # First remove all negative indices.
        # The element isn't there anyway...
        index.sort()
        index = index[index >= 0]

        if len(index) == 0:
            # There are no elements to delete...
            return

        # Get short-hand
        ptr = self.ptr
        ncol = self.ncol

        # Get original values
        oC = self.col[ptr[i]:ptr[i]+ncol[i]]
        oD = self._D[ptr[i]:ptr[i]+ncol[i], :]

        # Now create the compressed data...
        index -= ptr[i]
        keep = in1d(arange(ncol[i]), index, invert=True)

        # Update new count of the number of
        # non-zero elements
        self.ncol[i] -= len(index)

        # Now update the column indices and the data
        self.col[ptr[i]:ptr[i]+self.ncol[i]] = oC[keep]
        self._D[ptr[i]:ptr[i]+self.ncol[i], :] = oD[keep, :]

        # Once we remove some things, it is NOT
        # finalized...
        self._finalized = False
        self._nnz -= len(index)

    def __getitem__(self, key):
        """ Intrinsic sparse matrix retrieval of a non-zero element
        """

        # Get indices of sparse data (-1 if non-existing)
        index = self._get(key[0], key[1])

        # Check which data to retrieve
        if len(key) > 2:

            # user requests a specific element

            data = empty(len(index), self._D.dtype)

            # get dimension retrieved
            d = key[2]

            # Copy data over
            for i, j in enumerate(index):
                if j < 0:
                    data[i] = 0.
                else:
                    data[i] = self._D[j, d]

        else:

            # user request all stored data

            data = empty([len(index), self.shape[2]], self._D.dtype)

            # Copy data over
            for i, j in enumerate(index):
                if j < 0:
                    data[i, :] = 0.
                else:
                    data[i, :] = self._D[j, :]

        # Return data
        return data

    def __setitem__(self, key, data):
        """ Intrinsic sparse matrix assignment of the item. 

        It will only allow to set the data in the sparse
        matrix if the dimensions match.

        If the `data` parameter is `None` or an array
        only with `None` then the data will not be stored.
        """
        # Ensure data type... possible casting...
        if data is None:
            return

        # Sadly, converting integers with None
        # will NOT produce nan's.
        # Hence, this will only work with floats, etc.
        # TODO we need some way to reduce these things
        # for integer stuff.
        data = asarray(data, self._D.dtype)
        isnan = np.isnan(data)
        if np.all(isnan):
            # If the entries are nan's
            # then we return without adding the
            # entry.
            return
        else:
            # Places where there are nan will be set
            # to zero
            data[isnan] = 0
            del isnan

        # Retrieve indices in the 1D data-structure
        index = self._extend(key[0], key[1])

        if len(key) > 2:
            # Explicit data of certain dimension
            self._D[index, key[2]] = data

        else:
            # Ensure correct shape
            data.shape = (-1, self.shape[2])

            # Now there are two cases
            if data.shape[0] == 1:
                # we copy all elements
                self._D[index, :] = data[None, :]

            else:
                # each element have different data
                self._D[index, :] = data[:, :]

[docs]    def copy(self, dims=None, dtype=None):
        """ Returns an exact copy of the sparse matrix

        Parameters
        ----------
        dims: array-like, (all)
           which dimensions to store in the copy
        dtype : `numpy.dtype`
           this defaults to the dtype of the object, 
           but one may change it if supplied.
        """
        # Create sparse matrix (with only one entry per
        # row, we overwrite it immediately afterward)
        if dims is None:
            dims = list(range(self.dim))

        # Create correct input
        dim = len(dims)
        shape = list(self.shape[:])
        shape[2] = dim

        if dtype is None:
            dtype = self.dtype

        new = self.__class__(shape, nnz=self.nnz,
                             dtype=dtype)

        # The default sizes are not passed
        # Hence we *must* copy the arrays
        # directly
        new.ptr = np.array(self.ptr, np.int32)
        new.ncol = np.array(self.ncol, np.int32)
        new.col = np.array(self.col, np.int32)
        new._nnz = self.nnz

        new._D = np.array(self._D, dtype=dtype)
        for dim in dims:
            new._D[:, dims] = self._D[:, dims]

        return new

[docs]    def tocsr(self, dim=0, **kwargs):
        """ Return the data in ``scipy.sparse.csr_matrix`` format

        Parameters
        ----------
        dim: int
           the dimension of the data to create the sparse matrix
        **kwargs:
           arguments passed to the ``scipy.sparse.csr_matrix`` routine
        """
        self.finalize()

        shape = self.shape[:2]
        return csr_matrix((self._D[:, dim], self.col, self.ptr), shape=shape, **kwargs)

    ###############################
    # Overload of math operations #
    ###############################
    def __add__(a, b):
        c = a.copy(dtype=get_dtype(b, other=a.dtype))
        c += b
        return c
    __radd__ = __add__

    def __iadd__(a, b):
        if isinstance(b, SparseCSR):
            if a.shape != b.shape:
                raise ValueError('Adding two sparse matrices requires the same shape')
            # Ensure that a is aligned with b
            a.spalign(b)

            # loop and add elements
            for r in range(a.shape[0]):
                # pointers
                bptr = b.ptr[r]
                bn = b.ncol[r]

                # Get positions of b-elements in a:
                in_a = a._get(r, b.col[bptr:bptr+bn])
                a._D[in_a, :] += b._D[bptr:bptr+bn, :]

        else:
            a._D += b
        return a

    def __sub__(a, b):
        c = a.copy(dtype=get_dtype(b, other=a.dtype))
        c -= b
        return c

    def __rsub__(a, b):
        if isinstance(b, SparseCSR):
            c = b.copy(dtype=get_dtype(a, other=b.dtype))
            c += -1 * a
        else:
            c = b + (-1) * a
        return c

    def __isub__(a, b):
        if isinstance(b, SparseCSR):
            if a.shape != b.shape:
                raise ValueError('Subtracting two sparse matrices requires the same shape')
            # Ensure that a is aligned with b
            a.spalign(b)

            # loop and add elements
            for r in range(a.shape[0]):
                # pointers
                bptr = b.ptr[r]
                bn = b.ncol[r]

                # Get positions of b-elements in a:
                in_a = a._get(r, b.col[bptr:bptr+bn])
                a._D[in_a, :] -= b._D[bptr:bptr+bn, :]

        else:
            a._D -= b
        return a

    def __mul__(a, b):
        c = a.copy(dtype=get_dtype(b, other=a.dtype))
        c *= b
        return c
    __rmul__ = __mul__

    def __imul__(a, b):
        if isinstance(b, SparseCSR):
            if a.shape != b.shape:
                raise ValueError('Multiplication of two sparse matrices requires the same shape')

            # Note that for multiplication of these two matrices
            # it is not required that they are aligned...
            # 0 * float == 0
            # Hence aligning is superfluous

            # loop and add elements
            for r in range(a.shape[0]):
                # pointers
                aptr = a.ptr[r]
                an = a.ncol[r]
                bptr = b.ptr[r]
                bn = b.ncol[r]

                acol = a.col[aptr:aptr+an]
                bcol = b.col[bptr:bptr+bn]

                # Get positions of b-elements in a:
                in_a = a._get(r, bcol)
                # remove all -1's
                in_a = in_a[in_a > -1]
                # Everything else *must* be zeroes! :)
                a._D[in_a, :] *= b._D[bptr:bptr+bn, :]

                # Now set everything *not* in b but in a, to zero
                not_in_b = where(in1d(acol, bcol, invert=True))[0]
                a._D[aptr+not_in_b, :] = 0

        else:
            a._D *= b
        return a

    def __div__(a, b):
        c = a.copy(dtype=get_dtype(b, other=a.dtype))
        c /= b
        return c

    def __rdiv__(a, b):
        c = b.copy(dtype=get_dtype(a, other=b.dtype))
        c /= a
        return c

    def __idiv__(a, b):
        if isinstance(b, SparseCSR):
            if a.shape != b.shape:
                raise ValueError('Division of two sparse matrices requires the same shape')

            # Ensure that a is aligned with b
            a.spalign(b)

            # loop and add elements
            for r in range(a.shape[0]):
                # pointers
                bptr = b.ptr[r]
                bn = b.ncol[r]

                # Get positions of b-elements in a:
                in_a = a._get(r, b.col[bptr:bptr+bn])
                a._D[in_a, :] /= b._D[bptr:bptr+bn, :]

        else:
            a._D /= b
        return a

    def __floordiv__(a, b):
        c = a.copy(dtype=get_dtype(b, other=a.dtype))
        c //= b
        return c

    def __ifloordiv__(a, b):
        if isinstance(b, SparseCSR):
            if a.shape != b.shape:
                raise ValueError('Floor-division of two sparse matrices requires the same shape')
            # Ensure that a is aligned with b
            a.spalign(b)

            # loop and add elements
            for r in range(a.shape[0]):
                # pointers
                bptr = b.ptr[r]
                bn = b.ncol[r]

                # Get positions of b-elements in a:
                in_a = a._get(r, b.col[bptr:bptr+bn])
                a._D[in_a, :] //= b._D[bptr:bptr+bn, :]

        else:
            a._D //= b
        return a

    def __truediv__(a, b):
        c = a.copy(dtype=get_dtype(b, other=a.dtype))
        c /= b
        return c

    def __itruediv__(a, b):
        if isinstance(b, SparseCSR):
            if a.shape != b.shape:
                raise ValueError('True-division of two sparse matrices requires the same shape')
            # Ensure that a is aligned with b
            a.spalign(b)

            # loop and add elements
            for r in range(a.shape[0]):
                # pointers
                bptr = b.ptr[r]
                bn = b.ncol[r]

                # Get positions of b-elements in a:
                in_a = a._get(r, b.col[bptr:bptr+bn])
                a._D[in_a, :].__itruediv__(b._D[bptr:bptr+bn, :])

        else:
            a._D /= b
        return a

    def __pow__(a, b):
        c = a.copy(dtype=get_dtype(b, other=a.dtype))
        c **= b
        return c

    def __rpow__(a, b):
        if isinstance(b, SparseCSR):
            raise NotImplementedError
        c = a.copy(dtype=get_dtype(b, other=a.dtype))
        c._D[...] = b ** c._D[...]
        return c

    def __ipow__(a, b):
        if isinstance(b, SparseCSR):
            if a.shape != b.shape:
                raise ValueError('True-division of two sparse matrices requires the same shape')
            # Ensure that a is aligned with b
            # 0 ** float == 1.
            a.spalign(b)

            # loop and add elements
            for r in range(a.shape[0]):
                # pointers
                aptr = a.ptr[r]
                an = a.ncol[r]
                bptr = b.ptr[r]
                bn = b.ncol[r]

                acol = a.col[aptr:aptr+an]
                bcol = b.col[bptr:bptr+bn]

                # Get positions of b-elements in a:
                in_a = a._get(r, bcol)
                a._D[in_a, :] **= b._D[bptr:bptr+bn, :]

                # Now set everything *not* in b but in a, to 1
                #  float ** 0 == 1
                not_in_b = where(in1d(acol, bcol, invert=True))[0]
                a._D[aptr+not_in_b, :] = 1

        else:
            a._D **= b
        return a

    @classmethod
[docs]    def register_math(cls, var, routines=None):
        """ Register math operators on the `cls` class using `var` as attribute `getattr(cls, var)` 

        Parameters
        ----------
        cls : class
           class which gets registered overloaded math operators
        var : `str`
           name of attribute that is `SparseCSR` object in `cls`
        routines : list of str
           names of routines that gets overloaded, defaults to:
            ['__sub__', '__add__', '__mul__', '__div__', 
             '__truediv__', '__pow__']
        """

        if routines is None:
            routines = ['__sub__', '__add__', '__mul__', '__div__',
                        '__truediv__', '__pow__']

        # What we want is something like this:
        # def func(a, b):
        #   if isinstance(a, cls):
        #       setattr(a, var, getattr(a, var) OP b)
        #   if isinstance(b, cls):
        #       setattr(b, var, a OP getattr(b, var))
        # setattr(cls,__ROUTINE__, func):

        # Now register all things
        for r in routines:
            pass


[docs]def ispmatrix(matrix, map_row=None, map_col=None):
    """ Iterator for iterating rows and columns for non-zero elements in a `scipy.sparse.*_matrix` (or `SparseCSR`)

    If either `map_row` or `map_col` are not None the generator will only yield
    the unique values.

    Parameters
    ----------
    matrix : scipy.sparse.sp_matrix
      the sparse matrix to iterate non-zero elements
    map_row : func, optional
      map each row entry through the function `map_row`, defaults to `None` which is 
      equivalent to no mapping.
    map_col : func, optional
      map each column entry through the function `map_col`, defaults to `None` which is 
      equivalent to no mapping.

    Yields
    ------
    int, int
       the row, column indices of the non-zero elements
    """

    if map_row is None and map_col is None:
        # Skip unique checks
        for r, c in _ispmatrix_all(matrix):
            yield r, c
        return

    if map_row is None:
        map_row = lambda x: x
    if map_col is None:
        map_col = lambda x: x
    map_row = np.vectorize(map_row)
    map_col = np.vectorize(map_col)

    nrow = len(np.unique(map_row(np.arange(matrix.shape[0]))))
    ncol = len(np.unique(map_col(np.arange(matrix.shape[1]))))
    rows = np.zeros(nrow, dtype=np.bool_)
    cols = np.zeros(ncol, dtype=np.bool_)

    # Initialize the unique arrays
    rows[:] = False

    # Consider using the numpy nditer function for buffered iterations
    #it = np.nditer([geom.o2a(tmp.row), geom.o2a(tmp.col % geom.no), tmp.data],
    #               flags=['buffered'], op_flags=['readonly'])

    if isspmatrix_csr(matrix):
        for r in range(matrix.shape[0]):
            rr = map_row(r)
            if rows[rr]: continue
            rows[rr] = True
            cols[:] = False
            for ind in range(matrix.indptr[r], matrix.indptr[r+1]):
                c = map_col(matrix.indices[ind])
                if cols[c]: continue
                cols[c] = True
                yield rr, c

    elif isspmatrix_lil(matrix):
        for r in range(matrix.shape[0]):
            rr = map_row(r)
            if rows[rr]: continue
            rows[rr] = True
            cols[:] = False
            if len(matrix.rows[r]) == 0:
                continue
            for c in map_col(matrix.rows[r]):
                if cols[c]: continue
                cols[c] = True
                yield rr, c

    elif isspmatrix_coo(matrix):
        raise ValueError("mapping and unique returns are not implemented for COO matrix")

    elif isspmatrix_csc(matrix):
        raise ValueError("mapping and unique returns are not implemented for CSC matrix")

    elif isinstance(matrix, SparseCSR):
        for r in range(matrix.shape[0]):
            rr = map_row(r)
            if rows[rr]: continue
            rows[rr] = True
            cols[:] = False
            n = matrix.ncol[r]
            ptr = matrix.ptr[r]
            for c in map_col(matrix.col[ptr:ptr+n]):
                if cols[c]: continue
                cols[c] = True
                yield rr, c

    else:
        raise NotImplementedError("The iterator for this sparse matrix has not been implemented")


def _ispmatrix_all(matrix):
    """ Iterator for iterating rows and columns for non-zero elements in a `scipy.sparse.*_matrix` (or `SparseCSR`)

    Parameters
    ----------
    matrix : scipy.sparse.sp_matrix
      the sparse matrix to iterate non-zero elements

    Yields
    ------
    int, int
       the row, column indices of the non-zero elements
    """
    if isspmatrix_csr(matrix):
        for r in range(matrix.shape[0]):
            for ind in range(matrix.indptr[r], matrix.indptr[r+1]):
                yield r, matrix.indices[ind]

    elif isspmatrix_lil(matrix):
        for r in range(matrix.shape[0]):
            for c in matrix.rows[r]:
                yield r, c

    elif isspmatrix_coo(matrix):
        for r, c in zip(matrix.row, matrix.col):
            yield r, c

    elif isspmatrix_csc(matrix):
        for c in range(matrix.shape[1]):
            for ind in range(matrix.indptr[c], matrix.indptr[c+1]):
                yield matrix.indices[ind], c

    elif isinstance(matrix, SparseCSR):
        for r in range(matrix.shape[0]):
            n = matrix.ncol[r]
            ptr = matrix.ptr[r]
            for c in matrix.col[ptr:ptr+n]:
                yield r, c

    else:
        raise NotImplementedError("The iterator for this sparse matrix has not been implemented")


[docs]def ispmatrixd(matrix, map_row=None, map_col=None):
    """ Iterator for iterating rows, columns and data for non-zero elements in a `scipy.sparse.*_matrix` (or `SparseCSR`)

    Parameters
    ----------
    matrix : scipy.sparse.sp_matrix
      the sparse matrix to iterate non-zero elements
    map_row : func, optional
      map each row entry through the function `map_row`, defaults to `None` which is 
      equivalent to no mapping.
    map_col : func, optional
      map each column entry through the function `map_col`, defaults to `None` which is 
      equivalent to no mapping.

    Yields
    ------
    int, int, <>
       the row, column and data of the non-zero elements
    """

    if map_row is None:
        map_row = lambda x: x
    if map_col is None:
        map_col = lambda x: x

    # Consider using the numpy nditer function for buffered iterations
    #it = np.nditer([geom.o2a(tmp.row), geom.o2a(tmp.col % geom.no), tmp.data],
    #               flags=['buffered'], op_flags=['readonly'])

    if isspmatrix_csr(matrix):
        for r in range(matrix.shape[0]):
            rr = map_row(r)
            for ind in range(matrix.indptr[r], matrix.indptr[r+1]):
                yield rr, map_col(matrix.indices[ind]), matrix.data[ind]

    elif isspmatrix_lil(matrix):
        for r in range(matrix.shape[0]):
            rr = map_row(r)
            for c, m in zip(map_col(matrix.rows[r]), matrix.data[r]):
                yield rr, c, m

    elif isspmatrix_coo(matrix):
        for r, c, m in zip(map_row(matrix.row), map_col(matrix.col), matrix.data):
            yield r, c, m

    elif isspmatrix_csc(matrix):
        for c in range(matrix.shape[1]):
            cc = map_col(c)
            for ind in range(matrix.indptr[c], matrix.indptr[c+1]):
                yield map_row(matrix.indices[ind]), cc, matrix.data[ind]

    elif isinstance(matrix, SparseCSR):
        for r in range(matrix.shape[0]):
            rr = map_row(r)
            n = matrix.ncol[r]
            ptr = matrix.ptr[r]
            for c, d in zip(map_col(matrix.col[ptr:ptr+n]), matrix._D[ind, :]):
                yield rr, c, d

    else:
        raise NotImplementedError("The iterator for this sparse matrix has not been implemented")