# Source code for dafi.random_field.covariance

# Copyright 2020 Virginia Polytechnic Institute and State University.
""" Covariance matrices. """

# standard library imports
import time

# third party imports
import numpy as np
from numpy.core.shape_base import atleast_2d
import scipy.sparse as sp
import scipy.sparse.linalg as splinalg


def generate_cov(kernel='sqrexp', stddev=1.0, sp_tol=1e-8, **kwargs):
    """ Generate a covariance matrix using the specified correlation
    kernel and standard deviation.

    The kernel is evaluated with ``**kwargs`` to obtain a correlation
    matrix, small entries are dropped to make it sparse, and the result
    is scaled by the standard deviation.

    Parameters
    ----------
    kernel : function
        Function that returns a correlation matrix. All additional
        arguments are passed to this function. Alternatively, a string
        with the name of one of the implemented kernels; the string
        ``name`` is resolved to the module-level function
        ``kernel_<name>``.
    stddev : ndarray
        Standard deviation of each state. Alternatively, provide a float
        for a constant standard deviation.
        *dtype=float*, *ndim=1*, *shape=(nstate)*
    sp_tol : float
        Tolerance for sparse matrix. Any entry with correlation less
        than ``sp_tol`` will be set to zero.
    **kwargs
        Forwarded unchanged to the kernel function.

    Returns
    -------
    cov : scipy.sparse.csc_matrix
        Covariance matrix.
        *dtype=float*, *ndim=2*, *shape=(nstate, nstate)*
    """
    # correlation matrix
    if isinstance(kernel, str):
        kernel = _get_kernel(kernel)
    corr = array_to_sparse(kernel(**kwargs), sp_tol)

    # constant stddev: expand to one (flat) value per state, whatever the
    # shape of the single value that was provided
    if np.size(stddev) == 1:
        stddev = np.full(corr.shape[0], float(np.squeeze(stddev)))

    # covariance matrix
    return corr_to_cov(corr, stddev)


def array_to_sparse(mat, tol):
    """ Convert numpy array to sparse by setting small entries to zero.

    Parameters
    ----------
    mat : ndarray
        Dense array (anything ``numpy.asarray`` accepts).
    tol : float
        Tolerance for sparse matrix. Any entry whose magnitude does not
        exceed ``tol`` will be set to zero.

    Returns
    -------
    mat_sp : csc_matrix
        Matrix converted to sparse matrix.
    """
    # asarray guarantees element-wise semantics even for np.matrix input
    dense = np.asarray(mat)
    # written as "<= tol -> 0" so that NaN entries are kept, not hidden
    thresholded = np.where(np.abs(dense) <= tol, 0.0, dense)
    return sp.csc_matrix(thresholded)


def check_mat(mat, type='cov', tol=1e-08):
    """ Perform checks for correlation or covariance matrices.

    Checks if matrix is symmetric and positive definite. For a
    correlation matrix also checks that the diagonal terms are close to
    1 and the off diagonal have magnitude less than or equal to 1.

    Parameters
    ----------
    mat : ndarray
        Correlation or covariance matrix. Can be ndarray, matrix, or
        scipy sparse matrix.
        *dtype=float*, *ndim=2*, *shape=(N, N)*
    type : str
        Matrix type: use 'corr' for a correlation matrix and 'cov' for a
        covariance matrix. Any other value performs no checks and
        returns ``(True, "")``.
    tol : float
        Tolerance used when checking if two values are close to each
        other.

    Returns
    -------
    passed : bool
        Whether all tests passed successfully.
    message : str
        Information on which tests did not pass.
    """
    # Matrices up to this size use a dense eigen-solver, which is exact
    # and has no restriction on the matrix size (ARPACK needs k < N).
    dense_limit = 500

    def check_corr_diag(mat, tol):
        """ All diagonal entries within ``tol`` of 1. """
        return np.allclose(mat.diagonal(), 1.0, rtol=0.0, atol=tol)

    def check_corr_offdiag(mat, atol):
        """ No entry has a magnitude larger than ``1 + atol``. """
        return abs(mat).max() <= 1.0 + atol

    def check_symmetric(mat, rtol, atol=0.0):
        """ ``|A - A^T| <= atol + rtol * |A^T|`` for every entry. """
        mat_t = mat.T
        excess = abs(mat - mat_t) - rtol * abs(mat_t)
        return (excess.max() - atol <= 0)

    def check_positive_definite(mat, tol=1e-05):
        """ Checks if a symmetric matrix is positive-definite.

        The smallest algebraic eigenvalue must be at least ``-tol``.
        Shift-invert around zero is deliberately not used: in that mode
        ARPACK's ``which`` applies to ``1/eigenvalue``, which returns
        the smallest *positive* eigenvalue and hides negative ones, and
        it also fails for singular matrices.
        """
        if mat.shape[0] <= dense_limit:
            min_eig = np.linalg.eigvalsh(mat.toarray()).min()
        else:
            # may converge slowly for tightly clustered small eigenvalues
            min_eig = splinalg.eigsh(
                mat, k=1, which='SA', return_eigenvectors=False)[0]
        return (min_eig + tol >= 0)

    # make sparse (float so that the eigen-solvers accept integer input)
    mat = sp.csc_matrix(mat, dtype=float)

    # perform checks
    passed = True
    message = ""
    if type == 'corr':
        diag = check_corr_diag(mat, tol)
        off_diag = check_corr_offdiag(mat, tol)
        if not diag:
            passed = False
            message += "\nNot all diagonal entries equal 1. "
        if not off_diag:
            passed = False
            message += "\nNot all off-diagonal entries between -1 and 1. "
    if type in ['cov', 'corr']:
        symmetric = check_symmetric(mat, tol)
        positive_definite = check_positive_definite(mat, tol)
        if not symmetric:
            passed = False
            message += "\nNot Symmetric. "
        if not positive_definite:
            passed = False
            message += "\nNot positive_definite. "
    return passed, message


def sparse_to_nan(mat):
    """Convert a sparse matrix to a matrix with NaNs instead of zeros.

    Parameters
    ----------
    mat : scipy sparse matrix
        Input matrix; anything accepted by ``scipy.sparse.find``.

    Returns
    -------
    spnan : ndarray
        Dense array of the same shape holding the nonzero entries of
        ``mat`` and NaN everywhere else.
    """
    spnan = np.full(mat.shape, np.nan)
    rows, cols, vals = sp.find(mat)
    # single vectorised assignment instead of a Python loop per entry
    spnan[rows, cols] = vals
    return spnan


def corr_to_cov(corr, stddev):
    """ Convert a correlation matrix to a covariance matrix.

    Each entry is scaled as ``cov[i, j] = stddev[i] * corr[i, j] *
    stddev[j]``.

    Parameters
    ----------
    corr : scipy.sparse.csc_matrix
        Correlation matrix.
        *dtype=float*, *ndim=2*, *shape=(nstate, nstate)*
    stddev : ndarray
        Standard deviation of each state. Alternatively, provide a float
        for a constant standard deviation. Row and column vectors are
        both accepted; the values are flattened.
        *dtype=float*, *ndim=1*, *shape=(nstate)*

    Returns
    -------
    cov : scipy.sparse.csc_matrix
        Covariance matrix. For a constant standard deviation the result
        has the same type as ``corr``.
        *dtype=float*, *ndim=2*, *shape=(nstate, nstate)*

    Raises
    ------
    ValueError
        If ``stddev`` has more than one entry but not one per state.
    """
    scale = np.asarray(stddev, dtype=float).ravel()
    if scale.size == 1:
        # constant stddev
        return float(scale[0])**2 * corr

    corr = sp.csc_matrix(corr)
    if scale.size != corr.shape[0]:
        raise ValueError(
            "stddev has {} entries but corr has {} states.".format(
                scale.size, corr.shape[0]))
    # D * corr * D with D = diag(stddev): stays sparse, avoids building a
    # dense (nstate, nstate) outer product.
    scale_mat = sp.diags([scale], [0])
    return scale_mat.dot(corr).dot(scale_mat).tocsc()


def cov_to_corr(cov):
    """ Convert a covariance matrix to a correlation matrix.

    Each entry is normalised as ``corr[i, j] = cov[i, j] /
    (stddev[i] * stddev[j])`` where ``stddev`` is the square root of the
    diagonal of ``cov``. No special handling is done for zero variances.

    Parameters
    ----------
    cov : ndarray
        Covariance matrix.
        *dtype=float*, *ndim=2*, *shape=(nstate, nstate)*

    Returns
    -------
    corr : ndarray
        Correlation matrix.
        *dtype=float*, *ndim=2*, *shape=(nstate, nstate)*
    """
    stddev = np.sqrt(cov.diagonal())
    return cov / np.outer(stddev, stddev)


# kernels
def _get_kernel(kernel):
    """Look up the module-level function named ``kernel_<kernel>``.

    Raises ``KeyError`` if this module defines no such name.
    """
    kernel_name = 'kernel_' + kernel
    module_namespace = globals()
    return module_namespace[kernel_name]


def kernel_sqrexp(coords, length_scales):
    """ Create a correlation matrix using the square exponential
    function.

    The entry for points ``a`` and ``b`` is
    ``exp(-0.5 * sum_d ((x_d[a] - x_d[b]) / l_d)**2)``. For a length
    scale field, ``l_d`` for a pair of points is the geometric mean of
    the two local length scales.

    Parameters
    ----------
    coords : ndarray
        Array of coordinates. Each row correspond to a different point
        and the number of columns is the number of physical dimensions
        (e.g. 3 for (x,y,z)). A one dimensional array is treated as
        points in a single physical dimension.
        *dtype=float*, *ndim=2*, *shape=(npoints, ndims)*
    length_scales : list
        Length scale for each physical dimensions. List length is ndims.
        Each entry is either a one dimensional ndarray of length nstate
        (length scale field) or a float (constant length scale). A
        single float is accepted for one physical dimension.

    Returns
    -------
    corr : ndarray
        Correlation matrix.
        *dtype=float*, *ndim=2*, *shape=(nstate, nstate)*
    """
    def is_constant(scale):
        return np.size(scale) == 1

    def field_to_mat(field):
        # pairwise geometric mean of the local length scales
        field = np.ravel(field)
        return np.sqrt(np.outer(field, field))

    coords = np.asarray(coords)
    if coords.ndim == 1:
        coords = coords[:, np.newaxis]
    # Only a bare scalar needs wrapping. Lists are indexed directly and
    # never converted to one array: a list mixing floats and fields is
    # ragged and cannot be turned into a regular ndarray.
    if (not isinstance(length_scales, (list, tuple))
            and is_constant(length_scales)):
        length_scales = [length_scales]

    npoints, nphys_dims = coords.shape
    exponent = np.zeros((npoints, npoints))
    for ipdim in range(nphys_dims):
        pos = coords[:, ipdim]
        dpos = pos[np.newaxis, :] - pos[:, np.newaxis]
        lensc = length_scales[ipdim]
        if is_constant(lensc):
            lensc = float(np.squeeze(lensc))
        else:
            lensc = field_to_mat(lensc)
        exponent += (dpos / lensc)**2
    return np.exp(-0.5 * exponent)


def kernel_mixed_periodic_sqrexp(coords, length_scales, factor=6.0,
                                 period=None):
    """ Create a correlation matrix using the square exponential
    function in some directions and the periodic kernel in others.

    Non-periodic directions contribute ``-0.5 * (dx / l)**2`` to the
    exponent; periodic directions contribute
    ``-2 * (sin(pi * |dx| / p) / (l * factor / p))**2``.

    Parameters
    ----------
    coords : ndarray
        Array of coordinates. Each row correspond to a different point
        and the number of columns is the number of physical dimensions
        (e.g. 3 for (x,y,z)). A one dimensional array is treated as
        points in a single physical dimension.
        *dtype=float*, *ndim=2*, *shape=(npoints, ndims)*
    length_scales : list
        Length scale for each physical dimensions. List length is ndims.
        Each entry is either a one dimensional ndarray of length nstate
        (length scale field) or a float (constant length scale).
        For periodic directions the ``factor`` argument is used (see
        ``factor``).
    factor : float
        Factor used in the physical interpretation of the periodic
        length scale. The provided lengthscale (:math:`l`) is modified as
        :math:`l = l * factor / p` where :math:`p` is the periodicity.
        A factor of about 6 results in similar physical interpretation
        of the provided length scale as for the non-periodic directions.
    period : list
        List of periodicity for each physical dimension (length ndims).
        Each entry is either a float (periodicity) or *'None'* for
        non-periodic directions. If omitted, no direction is periodic.

    Returns
    -------
    corr : ndarray
        Correlation matrix.
        *dtype=float*, *ndim=2*, *shape=(nstate, nstate)*
    """
    def is_constant(scale):
        return np.size(scale) == 1

    def field_to_mat(field):
        # pairwise geometric mean of the local length scales
        field = np.ravel(field)
        return np.sqrt(np.outer(field, field))

    coords = np.asarray(coords)
    if coords.ndim == 1:
        coords = coords[:, np.newaxis]
    # Only a bare scalar needs wrapping. Lists are indexed directly and
    # never converted to one array: a list mixing floats and fields is
    # ragged and cannot be turned into a regular ndarray.
    if (not isinstance(length_scales, (list, tuple))
            and is_constant(length_scales)):
        length_scales = [length_scales]

    npoints, nphys_dims = coords.shape
    if period is None:
        period = [None] * nphys_dims

    # calculate
    exponent = np.zeros((npoints, npoints))
    for ipdim in range(nphys_dims):
        pos = coords[:, ipdim]
        dpos = pos[np.newaxis, :] - pos[:, np.newaxis]
        lensc = length_scales[ipdim]
        if is_constant(lensc):
            lensc = float(np.squeeze(lensc))
        else:
            lensc = field_to_mat(lensc)
        per = period[ipdim]
        if per is None:
            exponent += -0.5 * (dpos / lensc)**2
        else:
            lensc = lensc * factor / per
            exponent += -2.0 * (np.sin(np.abs(dpos) * np.pi / per) / lensc)**2
    return np.exp(exponent)


def kernel_input_file(filename, Type='corr'):
    """ Create a correlation matrix by reading it from a file.

    The file is read with ``numpy.loadtxt``.

    Parameters
    ----------
    filename : str
        Name (path) of file containing the correlation or covariance
        matrix.
    Type : str
        The type of matrix contained in the file. Options are 'corr' for
        correlation matrix or 'cov' for covariance matrix. Any value
        other than 'cov' leaves the matrix as read.

    Returns
    -------
    corr : ndarray
        Correlation matrix.
        *dtype=float*, *ndim=2*, *shape=(nstate, nstate)*
    """
    corr = np.loadtxt(filename)
    # compare the ``Type`` argument, not the builtin ``type``
    if Type == 'cov':
        corr = cov_to_corr(corr)
    return corr


# PDE-informed covariance
def source_cov_to_output_corr(cov, weights, mat):
    """ Convert the input field covariance to the output field
    correlation.

    The input and output field are related by a PDE described by the
    matrix ``mat``.
    This is used to create PDE-informed covariance matrices. See:

        Wu, Jin-Long, et al. *“Physics-Informed Covariance Kernel for
        Model-Form Uncertainty Quantification with Application to
        Turbulent Flows.”* Computers & Fluids, vol. 193, Oct. 2019,
        p. 104292. `doi:10.1016/j.compfluid.2019.104292`_.

    .. _doi:10.1016/j.compfluid.2019.104292:
       doi:10.1016/j.compfluid.2019.104292

    The covariance is first scaled entry-wise by
    ``sqrt(weights[i] * weights[j])``, then transformed as
    ``inv(mat) * cov * inv(mat)^T`` and finally normalised to a
    correlation matrix.

    Parameters
    ----------
    cov : ndarray
        Covariance matrix.
        *dtype=float*, *ndim=2*, *shape=(nstate, nstate)*
    weights : ndarray
        Weight (e.g. cell volume) associated with each state.
        *dtype=float*, *ndim=1*, *shape=(nstate)*
    mat : ndarray
        Matrix corresponding to the PDE.
        *dtype=float*, *ndim=2*, *shape=(nstate, nstate)*

    Returns
    -------
    corr : ndarray
        Correlation structure of output field.
        *dtype=float*, *ndim=2*, *shape=(nstate, nstate)*
    """
    # row vector of weights -> matrix of pairwise geometric means
    weights = np.atleast_2d(np.squeeze(weights))
    weight_mat = np.sqrt(np.dot(weights.T, weights))
    weighted_cov = cov * weight_mat
    # inverse of the PDE matrix, obtained by solving against the identity
    inv_mat = np.linalg.solve(mat, np.identity(mat.shape[0]))
    # L*cov*L^T
    cov_out = np.dot(np.dot(inv_mat, weighted_cov), np.transpose(inv_mat))
    return cov_to_corr(cov_out)


# boundary conditions
# TODO: These functions have not been completely tested.
def _sqrexp_bc(kernel_base, der_dir, coords, length_scales):
    """ Turn trailing rows/columns of a square exponential kernel matrix
    into derivative entries.

    The last ``len(der_dir)`` points of ``coords`` are treated as
    derivative points; all preceding points are value points. The
    derivative-value, value-derivative and derivative-derivative blocks
    of ``kernel_base`` are rescaled in place.

    Parameters
    ----------
    kernel_base : ndarray
        Kernel matrix evaluated on all points. Modified in place.
        *ndim=2*, *shape=(npoints, npoints)*
    der_dir : array_like
        Coordinate index of the derivative direction for each derivative
        point. Values are cast to integers.
    coords : ndarray
        Coordinates of all points, derivative points last.
        *ndim=2*, *shape=(npoints, ndims)*
    length_scales : list
        Length scale for each physical dimension, or a single float.
        The entries are used as scalars here.

    Returns
    -------
    kernel_base : ndarray
        The same array that was passed in, after modification.
    """
    # TODO: do matrix operations rather than for loops.
    #       Requires sorting derivatives by direction.
    # NOTE(review): the derivative-value factor below is +(x_m - x_n)/l^2;
    # confirm the intended sign convention against the reference.
    if (not isinstance(length_scales, (list, tuple))
            and np.size(length_scales) == 1):
        length_scales = [length_scales]

    # directions may arrive as floats (e.g. from np.concatenate) but are
    # used to index lists, so they must be integers
    der_dir = np.atleast_1d(der_dir).astype(int)
    nder = len(der_dir)
    nval = len(kernel_base) - nder

    coord_diff = [np.subtract.outer(coords[:, i], coords[:, i])
                  for i in range(coords.shape[1])]

    # der-val
    for m in range(nder):
        i = der_dir[m]
        for n in range(nval):
            factor = 1/(length_scales[i]**2) * coord_diff[i][nval+m, n]
            kernel_base[nval+m, n] *= factor

    # val-der
    kernel_base[:nval, nval:] = kernel_base[nval:, :nval].T

    # der-der
    for m in range(nder):
        i = der_dir[m]
        for n in range(nder):
            j = der_dir[n]
            kdel = float(i == j)
            factor = 1/(length_scales[j]**2) * \
                coord_diff[i][nval+m, nval+n] * coord_diff[j][nval+m, nval+n]
            factor = 1/(length_scales[i]**2) * (kdel - factor)
            kernel_base[nval+m, nval+n] *= factor

    return kernel_base


def _mixed_periodic_sqrexp_bc(kernel_base, der_dir, coords,
                              length_scales, factor=6.0, period=None):
    """ Derivative entries for the mixed periodic / square exponential
    kernel.

    Only derivatives along non-periodic directions are supported; those
    are delegated to ``_sqrexp_bc``. ``factor`` is accepted so the
    kernel keyword arguments can be forwarded unchanged, but it is not
    used here.

    Raises
    ------
    NotImplementedError
        If any derivative direction is periodic.
    """
    # TODO: implement for periodic directions
    if period is None:
        period = [None]*coords.shape[1]
    # directions may arrive as floats (e.g. from np.concatenate); cast
    # so that they can index the ``period`` list
    der_dir = np.atleast_1d(der_dir).astype(int)
    for i in der_dir:
        if period[i] is not None:
            raise NotImplementedError
    return _sqrexp_bc(kernel_base, der_dir, coords, length_scales)


def bc_cov(kernel='sqrexp', stddev=1.0, sp_tol=1e-8,
           dirichlet_coords=None, neumann_coords=None, neumann_dir=None,
           int_val=None, int_der=None, prior_mean=None,
           perturb=1e-5, kernel_kwargs=None):
    """ Create covariance matrix based on specified kernel and
    enforcing boundary conditions and observations.

    The mesh is augmented with the observation points in the order
    internal values, Dirichlet points, internal derivatives, Neumann
    points. The covariance on the augmented mesh is then conditioned on
    those observations.

    Note: kernel_kwargs must contain coords.

    See:
        Michelén Ströfer, et al. *“Enforcing boundary conditions on
        physical fields in Bayesian inversion.”* Computer Methods in
        Applied Mechanics and Engineering, 367, 113097, 2020.
        `doi:10.1016/j.cma.2020.113097`_.

    .. _doi:10.1016/j.cma.2020.113097:
       doi:10.1016/j.cma.2020.113097

    Parameters
    ----------
    kernel : str
        Name of the kernel. Only 'sqrexp' and 'mixed_periodic_sqrexp'
        are supported.
    stddev : ndarray
        See *generate_cov*. It is applied on the augmented mesh.
    sp_tol : float
        See *generate_cov*.
    dirichlet_coords : ndarray
        Coordinates of points where Dirichlet boundary condition is
        enforced (e.g. cell faces).
        *dtype=float*, *ndim=2*, *shape=(npoints, ncoords)*
    neumann_coords : ndarray
        Coordinates of points where Neumann boundary condition is
        enforced (e.g. cell faces).
        *dtype=float*, *ndim=2*, *shape=(npoints, ncoords)*
    neumann_dir : ndarray
        Index of coordinate direction for the gradient. Required when
        ``neumann_coords`` is given.
        *ndim=1*, *shape=(npoints)*
    int_val : dictionary
        Dictionary containing the coordinates
        (*coords*, *ndarray*, *ndim=2*, *shape=(npoints, ncoords)*),
        values (*val*, *ndarray*, *ndim=1*, *shape=(npoints)*),
        standard deviation
        (*stddev*, *ndarray*, *ndim=1*, *shape=(npoints)*, or a single
        value used for all points), and
        baseline (prior, e.g. interpolate from prior mean) values
        (*val_base*, *ndarray*, *ndim=1*, *shape=(npoints)*),
        of npoints internal value observations.
    int_der : dictionary
        Dictionary of internal derivative observations. See *int_val*.
        Additionally contains the direction (coordinate index)
        (*dir*, *ndarray*, *ndim=1*, *shape=(npoints)*)
    prior_mean : ndarray
        Mean vector prior to enforcing internal observations. Zeros are
        used if omitted and internal observations are given.
        *dtype=float*, *ndim=1*, *shape=(nstate)*
    perturb : float
        Small quantity to add to a matrix diagonal before inversion.
    kernel_kwargs : dictionary
        Keyword arguments for chosen kernel function. Must contain
        'coords'. The dictionary is not modified.

    Returns
    -------
    mean : ndarray
        Modified mean. Equal to ``prior_mean`` (possibly ``None``) when
        no internal observations are given.
    cov : scipy.sparse.csc_matrix
        Covariance matrix. See *generate_cov*.
        *dtype=float*, *ndim=2*, *shape=(nstate, nstate)*

    Raises
    ------
    NotImplementedError
        If ``kernel`` is not one of the supported names.
    KeyError
        If ``kernel_kwargs`` does not contain 'coords'.
    ValueError
        If the derivative directions do not match the derivative points.
    """
    if kernel == "sqrexp":
        dx = _sqrexp_bc
    elif kernel == "mixed_periodic_sqrexp":
        dx = _mixed_periodic_sqrexp_bc
    else:
        msg = "Only 'sqrexp' and 'mixed_periodic_sqrexp' implemented."
        raise NotImplementedError(msg)

    def stack_points(mesh, extra):
        """ Append ``extra`` points to ``mesh``; also return their count. """
        extra = np.atleast_2d(extra)
        return np.vstack([mesh, extra]), extra.shape[0]

    def unpack_obs(obs_dict, nobs):
        """ Return (stddev, value, baseline) vectors of an observation
        dictionary without modifying it. """
        obs_std = np.ravel(np.asarray(obs_dict['stddev'], dtype=float))
        if obs_std.size == 1:
            obs_std = np.full(nobs, obs_std[0])
        obs_val = np.ravel(np.asarray(obs_dict['val'], dtype=float))
        obs_base = np.ravel(np.asarray(obs_dict['val_base'], dtype=float))
        return obs_std, obs_val, obs_base

    # work on a copy so the caller's dictionary keeps its own coords
    kernel_kwargs = dict(kernel_kwargs) if kernel_kwargs else {}

    # augment mesh
    coords = kernel_kwargs['coords']
    npoints = coords.shape[0]
    nval_int = 0
    nval_bc = 0
    nder_int = 0
    nder_bc = 0
    if int_val is not None:
        coords, nval_int = stack_points(coords, int_val['coords'])
    if dirichlet_coords is not None:
        coords, nval_bc = stack_points(coords, dirichlet_coords)
    if int_der is not None:
        coords, nder_int = stack_points(coords, int_der['coords'])
    if neumann_coords is not None:
        coords, nder_bc = stack_points(coords, neumann_coords)
    nder = nder_int + nder_bc

    # create covariance matrix on augmented mesh
    kernel_kwargs['coords'] = coords
    cov_aug = generate_cov(kernel, stddev, sp_tol, **kernel_kwargs)
    cov_aug = cov_aug.toarray()  # TODO: avoid converting to dense
    if nder > 0:
        # same order as the derivative points in the augmented mesh
        dir_parts = []
        if int_der is not None:
            dir_parts.append(np.atleast_1d(int_der['dir']))
        if neumann_coords is not None:
            if neumann_dir is None:
                raise ValueError(
                    "neumann_dir is required when neumann_coords is given.")
            dir_parts.append(np.atleast_1d(neumann_dir))
        der_dir = np.concatenate(dir_parts).astype(int)
        if len(der_dir) != nder:
            raise ValueError(
                "Got {} derivative directions for {} derivative "
                "points.".format(len(der_dir), nder))
        cov_aug = dx(cov_aug, der_dir, **kernel_kwargs)

    # observation and observation error (covariance)
    int_val_stddev = int_val_obs = int_val_base = np.zeros(0)
    int_der_stddev = int_der_obs = int_der_base = np.zeros(0)
    if int_val is not None:
        int_val_stddev, int_val_obs, int_val_base = unpack_obs(
            int_val, nval_int)
    if int_der is not None:
        int_der_stddev, int_der_obs, int_der_base = unpack_obs(
            int_der, nder_int)

    def obsvec(v, d):
        # boundary conditions are treated as exact, zero-valued entries
        return np.concatenate([v, np.zeros(nval_bc), d, np.zeros(nder_bc)])
    obs_stddev = obsvec(int_val_stddev, int_der_stddev)
    obs_var = np.diag(obs_stddev**2)
    obs = obsvec(int_val_obs, int_der_obs)
    obs_base = obsvec(int_val_base, int_der_base)

    # new covariance
    cov_xx = cov_aug[:npoints, :npoints]
    cov_yy = cov_aug[npoints:, npoints:] + obs_var
    cov_xy = cov_aug[:npoints, npoints:]
    cov_yx = cov_aug[npoints:, :npoints]
    cov_yy_i = np.linalg.inv(cov_yy + perturb*np.eye(cov_yy.shape[0]))
    gain = np.matmul(cov_xy, cov_yy_i)
    cov = cov_xx - np.matmul(gain, cov_yx)
    cov = array_to_sparse(cov, sp_tol)

    # new mean
    if int_val is not None or int_der is not None:
        if prior_mean is None:
            prior_mean = np.zeros(npoints)
        # the state/observation cross-covariance maps the observation
        # mismatch back onto the mesh
        mean = prior_mean + np.matmul(gain, obs - obs_base)
    else:
        mean = prior_mean

    return mean, cov