# Source code for klus.algorithms

import numpy as _np
import scipy as _sp
import scipy.sparse.linalg

import klus.observables as _observables
import klus.kernels as _kernels

'''
## Algorithm and utility functions for nonlinear analyses

Based on software by Stefan Klus.

Modules
-------

**algorithms** :
    Routines for averaging and various computations.
    The implementations of the methods

    - DMD, TICA, AMUSE
    - Ulam's method
    - EDMD, kernel EDMD, generator EDMD
    - SINDy
    - kernel PCA, kernel CCA
    - CMD
    - SEBA

    are based on the publications listed at

    https://github.com/sklus/d3s
'''


def dmd(X, Y, mode='exact', retain=19):
    '''
    Exact and standard DMD of the data matrices X and Y.

    :param mode: 'exact' for exact DMD or 'standard' for standard DMD
    :param retain: number of modes to retain
    :return: eigenvalues d, modes Phi, and the reduced matrix A
    '''
    print(' Retaining only ---> ', retain, ' modes')
    print(' The rank of the data is ', _np.linalg.matrix_rank(X))
    U, s, Vt = _sp.linalg.svd(X, full_matrices=False)
    V = Vt.T.conj()
    S_inv = _np.diag(1/s[0:retain])
    A = U[:, 0:retain].T @ Y @ V[:, 0:retain] @ S_inv
    d, W = sortEig(A, evs=A.shape[0])
    if mode == 'exact':
        Phi = Y @ V[:, 0:retain] @ S_inv @ W
    elif mode == 'standard':
        Phi = U[:, 0:retain] @ W  # truncate U so the dimensions match W
    else:
        raise ValueError('Only exact and standard DMD available.')
    return d, Phi, A
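
# Usage sketch for dmd (hypothetical data, for illustration only): snapshots of a
# linear system x_{k+1} = A_true @ x_k, so the recovered eigenvalues should match
# those of A_true.
#
#   A_true = _np.array([[0.9, 0.1], [0.0, 0.8]])
#   X = _np.random.rand(2, 100)
#   Y = A_true @ X
#   d, Phi, A = dmd(X, Y, mode='exact', retain=2)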
def dmdc(X, Y, U, svThresh=1e-10):
    '''
    DMD + control where the control matrix B is unknown, see
    https://arxiv.org/abs/1409.6358.

    :param X: state matrix in R^(N x M-1), where N is the dimension of the state vector and M the number of samples
    :param Y: one-step time-lagged state matrix in R^(N x M-1)
    :param U: control input matrix in R^(Q x M-1), where Q is the dimension of the control vector
    :param svThresh: threshold below which to discard singular values
    :return: A_approx, B_approx, Phi (where Phi are the dynamic modes of A)
    '''
    n = X.shape[0]  # size of state vector
    q = U.shape[0]  # size of control vector

    # Y = G @ Omega, with G = [A, B]
    Omega = _np.vstack((X, U))
    U1, svs, Vt = _sp.linalg.svd(Omega)
    V = Vt.T
    svs_to_keep = svs[_np.where(svs > svThresh)]  # TODO: ensure singular values greater than the threshold exist
    n_svs = len(svs_to_keep)
    Sigma_truncated = _np.diag(svs_to_keep)
    U_truncated = U1[:, :n_svs]
    V_truncated = V[:, :n_svs]

    U2, svs2, V2t = _sp.linalg.svd(Y, full_matrices=False)
    V2 = V2t.T
    svs_to_keep2 = svs2[_np.where(svs2 > svThresh)]
    n_svs2 = len(svs_to_keep2)
    Sigma2_truncated = _np.diag(svs_to_keep2)
    U2_truncated = U2[:, :n_svs2]
    V2_truncated = V2[:, :n_svs2]

    # separate into POD modes for the A and B matrices
    UA = U_truncated[:n, :]
    UB = U_truncated[n:, :]

    A_approx = U2_truncated.T @ Y @ V_truncated @ _sp.linalg.inv(Sigma_truncated) @ UA.T @ U2_truncated
    B_approx = U2_truncated.T @ Y @ V_truncated @ _sp.linalg.inv(Sigma_truncated) @ UB.T

    # eigendecomposition of A_approx
    w, _ = _sp.linalg.eig(A_approx)
    W = _np.diag(w)

    # compute dynamic modes of A
    Phi = Y @ V_truncated @ _sp.linalg.inv(Sigma_truncated) @ UA.T @ U2_truncated @ W
    return A_approx, B_approx, Phi
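
# Usage sketch for dmdc (hypothetical data): a controlled linear system
# x_{k+1} = A_true @ x_k + B_true @ u_k; A_true, B_true, and U_in are made-up
# names for this illustration.
#
#   A_true = _np.array([[0.9, 0.1], [0.0, 0.8]])
#   B_true = _np.array([[1.0], [0.5]])
#   X = _np.random.rand(2, 99)
#   U_in = _np.random.rand(1, 99)
#   Y = A_true @ X + B_true @ U_in
#   A_approx, B_approx, Phi = dmdc(X, Y, U_in)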
def amuse(X, Y, evs=5):
    '''
    AMUSE implementation of TICA, see the TICA documentation.

    :return: eigenvalues d and corresponding eigenvectors Phi containing the coefficients for the eigenfunctions
    '''
    U, s, _ = _sp.linalg.svd(X, full_matrices=False)
    S_inv = _np.diag(1/s)
    Xp = S_inv @ U.T @ X
    Yp = S_inv @ U.T @ Y
    K = Xp @ Yp.T
    d, W = sortEig(K, evs=evs)
    Phi = U @ S_inv @ W

    # normalize eigenvectors
    for i in range(Phi.shape[1]):
        Phi[:, i] /= _sp.linalg.norm(Phi[:, i])
    return d, Phi
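
# Usage sketch for amuse (hypothetical data): X holds snapshots of a time series
# and Y the same series shifted by one lag.
#
#   Z = _np.random.rand(6, 1001)       # made-up time series
#   X, Y = Z[:, :-1], Z[:, 1:]
#   d, Phi = amuse(X, Y, evs=2)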
def tica(X, Y, evs=5):
    '''
    Time-lagged independent component analysis of the data matrices X and Y.

    :param evs: number of eigenvalues/eigenvectors
    :return: eigenvalues d and corresponding eigenvectors V containing the coefficients for the eigenfunctions
    '''
    return edmd(X, Y, _observables.identity, evs=evs)
def ulam(X, Y, Omega, evs=5, operator='K'):
    '''
    Ulam's method for the Koopman or Perron-Frobenius operator. The matrices X and Y contain
    the input data.

    :param Omega: box discretization of type d3s.domain.discretization
    :param evs: number of eigenvalues/eigenvectors
    :param operator: 'K' for Koopman or 'P' for Perron-Frobenius
    :return: eigenvalues d and corresponding eigenvectors V containing the coefficients for the eigenfunctions

    TODO: Switch to sparse matrices.
    '''
    m = X.shape[1]        # number of test points
    n = Omega.numBoxes()  # number of boxes
    A = _np.zeros([n, n])

    # compute transitions
    for i in range(m):
        ix = Omega.index(X[:, i])
        iy = Omega.index(Y[:, i])
        A[ix, iy] += 1

    # normalize
    for i in range(n):
        s = A[i, :].sum()
        if s != 0:
            A[i, :] /= s

    if operator == 'P':
        A = A.T
    d, V = sortEig(A, evs=evs)
    return (d, V)
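
# Usage sketch for ulam: Omega must be a box discretization providing numBoxes()
# and index(). In the d3s package this code is based on, d3s.domain.discretization
# provides this interface; here it is only assumed.
#
#   # Omega = domain.discretization(_np.array([[-1, 1], [-1, 1]]), _np.array([10, 10]))
#   # d, V = ulam(X, Y, Omega, evs=4, operator='K')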
def edmd(X, Y, psi, evs=5, operator='K'):
    '''
    Conventional EDMD for the Koopman or Perron-Frobenius operator. The matrices X and Y
    contain the input data.

    :param psi: set of basis functions, see d3s.observables
    :param evs: number of eigenvalues/eigenvectors
    :param operator: 'K' for Koopman or 'P' for Perron-Frobenius
    :return: matrix A, eigenvalues d, and corresponding eigenvectors V containing the coefficients for the eigenfunctions
    '''
    PsiX = psi(X)
    PsiY = psi(Y)
    C_0 = PsiX @ PsiX.T
    C_1 = PsiX @ PsiY.T
    if operator == 'P':
        C_1 = C_1.T

    A = _sp.linalg.pinv(C_0) @ C_1
    d, V = sortEig(A, evs=evs)
    return (A, d, V)
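
# Usage sketch for edmd (hypothetical data): a monomial dictionary is assumed to
# be available as _observables.monomials(order), as in the d3s package this code
# is based on.
#
#   psi = _observables.monomials(2)
#   X = _np.random.rand(2, 1000)
#   Y = 0.9*X                          # made-up one-step dynamics
#   A, d, V = edmd(X, Y, psi, evs=4)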
def gedmd(X, Y, Z, psi, evs=5, operator='K'):
    '''
    Generator EDMD for the Koopman operator. The matrices X and Y contain the input data. For
    stochastic systems, Z contains the diffusion term evaluated in all data points X. If the
    system is deterministic, set Z = None.
    '''
    PsiX = psi(X)
    dPsiY = _np.einsum('ijk,jk->ik', psi.diff(X), Y)
    if Z is not None:  # stochastic dynamical system
        n = PsiX.shape[0]      # number of basis functions
        ddPsiX = psi.ddiff(X)  # second-order derivatives
        S = _np.einsum('ijk,ljk->ilk', Z, Z)  # sigma \cdot sigma^T
        for i in range(n):
            dPsiY[i, :] += 0.5*_np.sum(ddPsiX[i, :, :, :] * S, axis=(0, 1))

    C_0 = PsiX @ PsiX.T
    C_1 = PsiX @ dPsiY.T
    if operator == 'P':
        C_1 = C_1.T

    A = _sp.linalg.pinv(C_0) @ C_1
    d, V = sortEig(A, evs=evs, which='SM')
    return (A, d, V)
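
# Usage sketch for gedmd (hypothetical data): Y holds the drift evaluated at the
# data points; for the deterministic case pass Z = None. Assumes, as above, that
# _observables.monomials exists and provides diff/ddiff.
#
#   psi = _observables.monomials(2)
#   X = _np.random.rand(2, 1000)
#   Y = -X                             # drift of dx/dt = -x
#   A, d, V = gedmd(X, Y, None, psi, evs=4)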
def kedmd(X, Y, k, epsilon=0.0, evs=5, operator='P', kind='kernel'):
    '''
    Kernel EDMD for the Koopman or Perron-Frobenius operator. The matrices X and Y
    contain the input data.

    Parameters
    ----------
    X : ndarray
        Input data.
    Y : ndarray
        Shifted input data.
    k : kernel object
        Kernel object.
    epsilon : float
        Regularization parameter.
    evs : int
        Number of eigenvalues/eigenvectors.
    operator : str
        'K' for Koopman or 'P' for Perron-Frobenius.
    kind : str
        'kernel' for kernel EDMD or 'embedded' for embedded EDMD.

    Returns
    -------
    d : ndarray
        Eigenvalues.
    W : ndarray
        Eigenvectors (for the Koopman operator, evaluated in the data points).
    C : ndarray
        Coefficients from the eigenvalue problem.
    A : ndarray
        Eigenfunction coefficient matrix.
    G_0 : ndarray
        Kernel (Gram) matrix.
    G_1 : ndarray
        Shifted kernel (Gram) matrix.
    '''
    if isinstance(X, list) or len(X.shape) < 2:  # e.g., for strings
        n = len(X)
    else:
        n = X.shape[1]

    G_0 = _kernels.gramian(X, k)
    G_1 = _kernels.gramian2(X, Y, k)
    if operator == 'K':
        G_1 = G_1.T

    # epsilon = 0 recovers the unregularized problem
    if kind == 'kernel':
        A = _sp.linalg.pinv(G_0 + epsilon*_np.eye(n)) @ G_1
    elif kind == 'embedded':
        A = G_1 @ _sp.linalg.pinv(G_0 + epsilon*_np.eye(n))
    else:
        raise ValueError('Error in kedmd: kind must be "kernel" or "embedded".')

    d, V = sortEig(A, evs=evs)

    if operator == 'K':
        W = G_0 @ V
    else:
        W = V

    # compute coefficients for the evaluation of the eigenfunctions
    if operator == 'K':
        C = V
    else:
        C = _sp.linalg.pinv(G_0) @ V
    return d, W, C, A, G_0, G_1
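
# Usage sketch for kedmd (hypothetical data): assumes a Gaussian kernel is
# available as _kernels.gaussianKernel(sigma), as in d3s.
#
#   k = _kernels.gaussianKernel(0.5)
#   X = _np.random.rand(2, 200)
#   Y = 0.9*X                          # made-up one-step dynamics
#   d, W, C, A, G_0, G_1 = kedmd(X, Y, k, epsilon=1e-6, evs=4, operator='K')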
def sindy(X, Y, psi, eps=0.001, iterations=10):
    '''
    Sparse identification of nonlinear dynamics for the data given by X and Y.

    :param psi: set of basis functions, see d3s.observables
    :param eps: cutoff threshold
    :param iterations: number of sparsification steps
    :return: coefficient matrix Xi
    '''
    PsiX = psi(X)
    Xi = Y @ _sp.linalg.pinv(PsiX)  # least-squares initial guess

    for k in range(iterations):
        s = abs(Xi) < eps  # find coefficients smaller than eps ...
        Xi[s] = 0          # ... and set them to zero
        for ind in range(X.shape[0]):
            b = ~s[ind, :]  # consider only the basis functions whose coefficients were not cut off
            Xi[ind, b] = Y[ind, :] @ _sp.linalg.pinv(PsiX[b, :])
    return Xi
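
# Usage sketch for sindy (hypothetical data): recover the linear system
# dx/dt = -x from samples and exact derivatives, assuming a monomial dictionary
# _observables.monomials as above.
#
#   psi = _observables.monomials(3)
#   X = 2*_np.random.rand(1, 500) - 1
#   Y = -X                             # derivatives of dx/dt = -x
#   Xi = sindy(X, Y, psi, eps=0.01)    # only the coefficient of x should survive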
def kpca(X, k, evs=5):
    '''
    Kernel PCA.

    Parameters
    ----------
    X : ndarray
        Data matrix, each column represents a data point.
    k : kernel object
        Kernel object.
    evs : int
        Number of eigenvalues/eigenvectors.

    Returns
    -------
    d : ndarray
        Eigenvalues.
    V : ndarray
        Data X projected onto the principal components.
    G : ndarray
        Centered Gram matrix.
    '''
    G = _kernels.gramian(X, k)  # Gram matrix

    # center Gram matrix
    n = X.shape[1]
    N = _np.eye(n) - 1/n*_np.ones((n, n))
    G = N @ G @ N

    d, V = sortEig(G, evs=evs)
    return (d, V, G)
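
# Usage sketch for kpca (hypothetical data): project 200 points onto the two
# leading kernel principal components, assuming _kernels.gaussianKernel as above.
#
#   k = _kernels.gaussianKernel(1.0)
#   X = _np.random.rand(2, 200)
#   d, V, G = kpca(X, k, evs=2)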
def kcca(X, Y, k, option='CCA', evs=5, epsilon=1e-6):
    '''
    Kernel CCA. Performs kernel CCA in a simplified form for time series, or applies
    KCCA to two different fields.

    Parameters
    ----------
    X : ndarray
        Data matrix, each column represents a data point.
    Y : ndarray
        Time-lagged data, each column y_i is x_i mapped forward by the dynamical
        system, or a different data matrix.
    option : str
        * 'lagged': assume that the data matrix Y is the time-lagged version of X
        * 'CCA': assume X and Y to be independent fields (default)
    k : kernel object
        Kernel object.
    evs : int
        Number of eigenvalues/eigenvectors.
    epsilon : float
        Regularization parameter.

    Returns
    -------
    CCA coefficients (A, d, V).
    '''
    G_0 = _kernels.gramian(X, k)
    G_1 = _kernels.gramian(Y, k)

    # center Gram matrices
    n = X.shape[1]
    I = _np.eye(n)
    N = I - 1/n*_np.ones((n, n))
    G_0 = N @ G_0 @ N
    G_1 = N @ G_1 @ N

    if option == 'lagged':
        print(' Computing kernel CCA with lagged data \n')
        A = _sp.linalg.solve(G_0 + epsilon*I, G_0, assume_a='sym') \
            @ _sp.linalg.solve(G_1 + epsilon*I, G_1, assume_a='sym')
        d, V = sortEig(A, evs=evs)
    elif option == 'CCA':
        print(' Computing KCCA \n')
        zers = _np.zeros(G_0.shape)
        kdx = _np.concatenate(((G_0 + epsilon*I) @ (G_0 + epsilon*I), zers), axis=1)
        kdy = _np.concatenate((zers, (G_1 + epsilon*I) @ (G_1 + epsilon*I)), axis=1)
        KD = _np.concatenate((kdx, kdy))
        kdxy = _np.concatenate(((G_0 + epsilon*I) @ (G_1 + epsilon*I), zers), axis=1)
        kdyx = _np.concatenate((zers, (G_1 + epsilon*I) @ (G_0 + epsilon*I)), axis=1)
        KO = _np.concatenate((kdxy, kdyx))
        A = _sp.linalg.solve(KD, KO, assume_a='sym')
        d, V = sortEig(A, evs=evs)
    else:
        raise ValueError(f'Unknown option {option} in kcca.')
    return (A, d, V)
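
# Usage sketch for kcca (hypothetical data): correlate two fields sampled at the
# same 100 points, assuming _kernels.gaussianKernel as above.
#
#   k = _kernels.gaussianKernel(1.0)
#   X = _np.random.rand(2, 100)
#   Y = _np.random.rand(2, 100)        # second, independent field
#   A, d, V = kcca(X, Y, k, option='CCA', evs=4, epsilon=1e-6)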
def cmd(X, Y, evs=5, epsilon=1e-6):
    '''
    Coherent mode decomposition.

    :param X: data matrix, each column represents a data point
    :param Y: time-lagged data, each column y_i is x_i mapped forward by the dynamical system
    :param evs: number of eigenvalues/eigenvectors
    :param epsilon: regularization parameter
    :return: eigenvalues rho and modes Xi and Eta
    '''
    G_0 = X.T @ X
    G_1 = Y.T @ Y

    # center Gram matrices
    n = X.shape[1]
    I = _np.eye(n)
    N = I - 1/n*_np.ones((n, n))
    G_0 = N @ G_0 @ N
    G_1 = N @ G_1 @ N

    A = _sp.linalg.solve(G_0 + epsilon*I, _sp.linalg.solve(G_1 + epsilon*I, G_1, assume_a='sym')) @ G_0
    d, V = sortEig(A, evs=evs)
    rho = _np.sqrt(d)

    W = _sp.linalg.solve(G_1 + epsilon*I, G_0) @ V @ _np.diag(rho)
    Xi = X @ V
    Eta = Y @ W
    return (rho, Xi, Eta)
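
# Usage sketch for cmd (hypothetical data): X and Y are two snapshot matrices
# with the same number of columns; the coherent modes come in pairs (Xi, Eta).
#
#   X = _np.random.rand(10, 50)
#   Y = _np.random.rand(10, 50)        # made-up time-lagged snapshots
#   rho, Xi, Eta = cmd(X, Y, evs=3, epsilon=1e-6)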
def seba(V, R0=None, maxIter=5000):
    '''
    Sparse eigenbasis approximation as described in

        "Sparse eigenbasis approximation: Multiple feature extraction across spatiotemporal
         scales with application to coherent set identification"

    by G. Froyland, C. Rock, and K. Sakellariou. Based on the original Matlab implementation,
    see https://github.com/gfroyland/SEBA.

    :param V: eigenvectors
    :param R0: optional initial rotation
    :param maxIter: maximum number of iterations
    :return: sparse basis output

    TODO: perturb near-constant vectors?
    '''
    n, r = V.shape

    V, _ = _sp.linalg.qr(V, mode='economic')
    mu = 0.99/_np.sqrt(n)

    if R0 is None:
        R0 = _np.eye(r)
    else:
        R0, _ = _sp.linalg.polar(R0)

    S = _np.zeros((n, r))

    for i in range(maxIter):
        Z = V @ R0.T

        # threshold
        for j in range(r):
            S[:, j] = _np.sign(Z[:, j]) * _np.maximum(abs(Z[:, j]) - mu, 0)
            S[:, j] = S[:, j]/_sp.linalg.norm(S[:, j])

        # polar decomposition
        R1, _ = _sp.linalg.polar(S.T @ V)

        # check whether converged
        if _sp.linalg.norm(R1 - R0) < 1e-14:
            break

        # overwrite initial matrix with new matrix
        R0 = R1.copy()

    # choose correct parity and normalize
    for j in range(r):
        S[:, j] = S[:, j] * _np.sign(S[:, j].sum())
        S[:, j] = S[:, j] / _np.amax(S[:, j])

    # sort vectors
    ind = _np.argsort(_np.min(S, axis=0))[::-1]
    S = S[:, ind]
    return S
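
# Usage sketch for seba: sparsify a small set of (here random, hence purely
# illustrative) eigenvectors.
#
#   V = _np.linalg.qr(_np.random.rand(100, 3))[0]   # made-up orthonormal vectors
#   S = seba(V)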
def kcovedmd(X, Y, k, epsilon=0, evs=5, operator='P'):
    '''
    Kernel covariance EDMD for the Koopman or Perron-Frobenius operator. The matrices X and Y
    contain the input data.

    :param k: kernel, see d3s.kernels
    :param epsilon: regularization parameter
    :param evs: number of eigenvalues/eigenvectors
    :param operator: 'K' for Koopman or 'P' for Perron-Frobenius (note that the default is 'P' here)
    :return: eigenvalues d and eigenfunctions evaluated in X
    '''
    if isinstance(X, list):  # e.g., for strings
        n = len(X)
    else:
        n = X.shape[0]

    G_0 = _kernels.covariance(X, k)
    G_1 = _kernels.crosscov(X, Y, k)
    if operator == 'K':
        G_1 = G_1.T

    A = _np.linalg.pinv(G_0 + epsilon*_np.eye(n), rcond=1e-10) @ G_1
    d, V = sortEig(A, evs=evs)
    if operator == 'K':
        V = G_0 @ V
    return (d, V, A, G_0, G_1)
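
# Usage sketch for kcovedmd: mirrors kedmd but uses covariance operators; it is
# assumed here that _kernels.covariance and _kernels.crosscov accept the same
# data layout as _kernels.gramian.
#
#   k = _kernels.gaussianKernel(0.5)
#   d, V, A, G_0, G_1 = kcovedmd(X, Y, k, epsilon=1e-6, evs=4, operator='P')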
# auxiliary functions
def sortEig(A, B=None, evs=5, which='LM'):
    '''
    Computes eigenvalues and eigenvectors of A and sorts them in decreasing lexicographic
    order. Optionally solves the generalized eigenvalue problem A v = w B v.

    Parameters
    ----------
    B : ndarray, optional
        If not None, solve the generalized eigenvalue problem A v = w B v
        (handled by the dense solver only).
    evs : int
        Number of eigenvalues/eigenvectors.
    which : str
        Which eigenvalues the sparse solver should compute, e.g., 'LM' (largest
        magnitude) or 'SM' (smallest magnitude).

    Returns
    -------
    (w, V) : sorted eigenvalues and eigenvectors
    '''
    n = A.shape[0]
    if evs < n and B is None:
        print('Use sparse solver \n')
        d, V = _sp.sparse.linalg.eigs(A, evs, which=which)
    else:
        print('Use full solver \n')
        if B is None:
            d, V = _np.linalg.eig(A)
        else:
            d, V = _sp.linalg.eig(A, b=B)
    ind = d.argsort()[::-1]  # [::-1] reverses the list of indices
    return (d[ind], V[:, ind])
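
# Usage sketch for sortEig: eigenvalues of a small matrix, sorted in decreasing
# order; evs == n triggers the dense solver.
#
#   A = _np.diag([1.0, 3.0, 2.0])
#   d, V = sortEig(A, evs=3)           # d = [3, 2, 1]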
def FeatureMatrix(x, z, k):
    '''
    Computes the feature matrix Phi on the support vectors x for the points z
    and the kernel k.
    '''
    K = _kernels.gramian2(x, z, k)
    return K
def kgedmd(X, Y, k, epsilon=0, evs=5, operator='P', kind='kernel', cond=1e-15):
    '''
    Kernel EDMD for the generator of the Koopman or Perron-Frobenius operator. The matrix X
    contains the data and the matrix Y the estimated derivatives in the training points.
    Only the Gaussian kernel is supported.

    Parameters
    ----------
    X : ndarray
        Input data.
    Y : ndarray
        Derivative data.
    k : kernel object
        Kernel object.
    epsilon : float
        Regularization parameter.
    evs : int
        Number of eigenvalues/eigenvectors.
    operator : str
        'K' for Koopman or 'P' for Perron-Frobenius.
    kind : str
        'kernel' for kernel EDMD or 'embedded' for embedded EDMD.
    cond : float
        Cutoff for small singular values in the pseudoinverse.

    Returns
    -------
    d : ndarray
        Eigenvalues.
    V : ndarray
        Eigenvectors.
    A : ndarray
        Eigenfunction coefficient matrix.
    G_0 : ndarray
        Kernel matrix.
    G_1 : ndarray
        Kernel derivative matrix.
    '''
    if isinstance(X, list) or len(X.shape) < 2:  # e.g., for strings
        n = len(X)
    else:
        n = X.shape[1]

    G_0 = _kernels.gramian(X, k)
    G_1 = _np.zeros((n, n))
    for i in range(n):
        for j in range(n):
            G_1[i, j] = Y[:, i].T @ k.diff(X[:, i], X[:, j])

    if operator == 'K':
        A = _np.linalg.pinv(G_0 + epsilon*_np.eye(n), rcond=cond) @ G_1
    elif operator == 'P':
        A = _np.linalg.pinv(G_0 + epsilon*_np.eye(n), rcond=cond) @ G_1.T
    else:
        raise ValueError(f'Wrong operator in kgedmd: {operator}')

    d, V = sortEig(A, evs=evs)
    if operator == 'K':
        V = G_0 @ V
    return d, V, A, G_0, G_1
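
# Usage sketch for kgedmd (hypothetical data): Y holds estimated derivatives at
# the training points; the kernel must provide a diff method (in d3s the
# Gaussian kernel does, here this is assumed).
#
#   k = _kernels.gaussianKernel(0.5)
#   X = _np.random.rand(2, 200)
#   Y = -X                             # derivatives of dx/dt = -x
#   d, V, A, G_0, G_1 = kgedmd(X, Y, k, epsilon=1e-8, evs=4, operator='P')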