Source code for attitude.orientation.pca

# -*- coding: utf-8 -*-
from __future__ import division
import numpy as N
import logging
from scipy.sparse import bsr_matrix
from scipy.linalg import lu
from scipy.sparse.linalg import svds
from scipy.integrate import quad
from itertools import chain
from ..coordinates import centered
from .base import BaseOrientation, rotation
from ..error.ellipse import ellipse
from ..stereonet import plane_errors, error_coords
from ..error.axes import sampling_axes, sampling_covariance, angular_errors, noise_axes
from ..test import scattered_plane
from ..geom.util import dot, vector
from ..geom.util import angle as vector_angle
from ..geom.conics import conic

log = logging.getLogger('attitude')

[docs]def random_pca(scattered=True):
    if scattered:
        arr,coeffs = scattered_plane()
    else:
        arr, coeffs = random_plane()
    arr = N.array(arr).transpose()
    return PCAOrientation(arr)

[docs]def augment(matrix):
    size = matrix.shape
    _ = N.identity(size[0]+1)
    _[:size[0],:size[1]] = matrix
    return _

[docs]def augment_vector(vec):
    return N.append(vec,[1],axis=0)

[docs]def rotate_tensor(tensor,transform):
    """
    Transforms a tensor by an affine transform
    """
    return dot(transform, tensor, transform.T)

[docs]def compose_affine(*transforms):
    """
    Returns a composite of several affine transformations.
    """
    return reduce(N.dot,reversed(transforms))

[docs]def normalize(v):
    return v/N.linalg.norm(v)

## magnitude of vector (by row)
norm = lambda x: N.linalg.norm(x,2,1)

[docs]def axis_transform(pca_axes):
    """
    Creates an affine transformation matrix to
    rotate data in PCA axes into Cartesian plane
    """
    from_ = N.identity(3)
    to_ = pca_axes

    # Find inverse transform for forward transform
    # y = M x -> M = y (x)^(-1)
    # We don't need to do least-squares since
    # there is a simple transformation
    trans_matrix = N.linalg.lstsq(from_,to_)[0]
    return trans_matrix


[docs]def test_SVD(pca):
    """
    Function to test the validity of singular
    value decomposition by reconstructing original
    data.
    """
    _ = pca
    rec = N.dot(_.U,N.dot(_.sigma,_.V))
    assert N.allclose(_.arr,rec)

[docs]def covariance_matrix(self):
    """
    Constructs the covariance matrix of
    input data from
    the singular value decomposition. Note
    that this is different than a covariance
    matrix of residuals, which is what we want
    for calculating fit errors.

    Using SVD output to compute covariance matrix
    X=UΣV⊤
    XX⊤XX⊤=(UΣV⊤)(UΣV⊤)⊤=(UΣV⊤)(VΣU⊤)
    V is an orthogonal matrix (V⊤V=I),
    covariance matrix of input data: XX⊤=UΣ2U⊤

     Because the axes represent identity in the
     PCA coordinate system, the PCA major axes
     themselves represent an affine transformation
     matrix from PCA to Cartesian space
    """

    a = N.dot(self.U,self.sigma)
    cv = N.dot(a,a.T)
    # This yields the covariance matrix in Cartesian
    # coordinates
    return cv

[docs]class PCAOrientation(BaseOrientation):
    """ Gets the axis-aligned principle components
        of the dataset.
    """
[docs]    @classmethod
    def from_axes(axes):
        """
        Recovers a principal component dataset from
        a set of axes (singular values*principal axes)
        of the dataset.
        """
        pass

    def __init__(self, arr, weights=None,  axes=None):
        """
        Perform PCA on on an input array

        :param axes: Precalculated axes for PCA fit
        :param weights: Relative axis loadings

        Relative loadings for individual axes of the input dataset.
        These will be applied transparently during the calculation
        of the PCA. This allows arbitrary standardization of the
        data for differently-scaled errors along coordinate axes.

        A common use of factor weightings is to standardize differently-
        scaled variables. This is accomplished by dividing by the standard
        deviation as such:
        `self.arr /= self.arr.std(axis=0)`
        Not dividing by std leaves us with an eigen-analysis of
        the *covariance matrix*, while dividing
        by it leaves us with an eigen-analysis
        of the *correlation matrix*.

        Applying non-equal weights will necessarily have an impact
        on the true orthagonality of the axes of error in the dataset,
        which may have an impact on plotting errors in Cartesian space.
        For now, this is ignore.
        """
        # For principal components, data needs
        # to be pre-processed to have zero mean
        self.member_of = None
        self.disabled = False

        self.method = noise_axes
        self.array = arr

        self.mean = arr.mean(axis=0)
        self.arr = centered(arr)

        # Factor loadings
        if weights is None:
            weights = N.ones(self.arr.shape[1])
        self.weights = weights

        self.n = len(self.arr)

        if axes is None:
            self.__run_svd()
        else:
            self.__load_saved_fit(axes)

        self.__compute_derived_parameters()

    def __run_svd(self):
        # Get singular values
        log.debug("Running singular value decomposition")

        if len(self.arr) < 3:
            raise ValueError("Cannot fit a plane to fewer than 3 coordinates")

        ### Apply factor weights
        # We should be careful that they aren't too
        # large so we don't run into numerical difficulties
        w = self.weights[N.newaxis,:]
        arr = self.arr/w
        res = N.linalg.svd(arr,
            full_matrices=False)

        self._U, s, V = res
        ### Divide by weights ###
        #V *= w
        #V /= N.linalg.norm(V,axis=1)
        s *= self.weights

        self.singular_values = s
        self.V = V

    def __load_saved_fit(self, axes):

        # Saves us the computationally expensive
        # step of running a SVD
        log.debug("Loaded PCA from saved axes")
        ## Get from axes if these are defined
        # In this case, axes must be equivalent
        # to self.axes*self.singular_values
        s = N.linalg.norm(axes,axis=0)
        self.V = axes/s
        # Don't compute U unless we have to
        self._U = None
        self.singular_values = s

    def __compute_derived_parameters(self):
        self.axes = self.V
        self.sigma = N.diag(self.singular_values)

        # Normal vector in axis-aligned coordinate frame
        self.offset = N.cross(self.sigma[0],self.sigma[1])

        self.normal = self.axes[-1]
        if self.normal[-1] < 0:
            # Could create a special case for inverted bedding
            self.normal = -self.normal

        v = N.zeros_like(self.normal)
        v[-1] = 1
        self._vertical = v
        self.strike = N.cross(self.normal,self._vertical)
        try:
            self.dip_dr = normalize(N.cross(self.strike,self.normal))
        except ValueError:
            # Can't do this in 2D cases
            self.dip_dr = None

        # Hyperbolic form of PCA
        #self.hyp = self.as_hyperbola(rotated=False)
        #d = N.abs(N.diagonal(self.hyp)[:-1])
        #self.hyp_axes = N.sqrt(1/d)

    @property
    def U(self):
        """
        Property to support lazy evaluation of residuals
        """
        if self._U is None:
            sinv = N.diag(1/self.singular_values)
            self._U = dot(self.arr,self.V.T,sinv)
        return self._U

    @property
    def eigenvalues(self):
        """
        Eigenvalues of the data covariance matrix
        """
        return self.singular_values**2/(self.n-1)

[docs]    def rotated(self):
        """
        Returns a dataset 'despun' so that
        it is aligned with the princpal
        axes of the dataset.
        """
        return N.dot(self.arr,self.V.T)

[docs]    def residuals(self):
        """
        Returns residuals of fit against all
        three data axes (singular values 1, 2,
        and 3). This takes the form of data along
        singular axis 3 (axes 1 and 2 define the plane)
        """
        _ = self.rotated()
        _[:,-1] = 0
        _ = N.dot(_,self.axes)
        return self.arr - _

    @property
    def center(self):
        return self.mean

    @property
    def centered_array(self):
        return self.arr

    @property
    def hyperbolic_axes(self):
        return self.method(self)

[docs]    def angular_error(self, axis_length):
        """
        The angular error for an in-plane axis of
        given length (either a PCA major axis or
        an intermediate direction).
        """
        hyp_axes = self.method(self)
        return N.arctan2(hyp_axes[-1],axis_length)

[docs]    def angular_errors(self, degrees=True):
        """
        Minimum and maximum angular errors
        corresponding to 1st and 2nd axes
        of PCA distribution.
        """
        hyp_axes = self.method(self)
        v = angular_errors(hyp_axes)
        if degrees:
            v = N.degrees(v)
        return tuple(v)

    def _covariance_matrix(self, type='noise'):
        """
        Constructs the covariance matrix from PCA
        residuals
        """
        if type == 'sampling':
            return self.sigma**2/(self.n-1)
        elif type == 'noise':
            return 4*self.sigma*N.var(self.rotated(), axis=0)

    @property
    def covariance_matrix(self):
        """
        The data covariance matrix is related to the
        cross-product matrix M^T M but scaled by the number of
        samples.
        """
        return self._covariance_matrix()

    @property
    def explained_variance(self):
        """
        Proportion of variance that is explained by the
        first two principal components (which together
        represent the planar fit). Analogous to R^2 of
        linear least squares.
        """
        v = N.diagonal(self.covariance_matrix)
        return v[0:2].sum()/v.sum()

    @property
    def coefficients(self):
        return self.axes[2]

    @property
    def azimuth(self):
        c = self.coefficients
        return N.arctan2(c[0],c[1])

    @property
    def slope(self):
        _ = self.coefficients
        mag = N.linalg.norm(_)
        return N.arccos(_[2]/mag)

    def _strike_dip(self):
        n = self.axes[2]
        r = N.linalg.norm(n)
        strike = N.arctan2(n[0],n[1])-N.pi/2
        dip = N.arccos(n[2]/r)
        return strike, dip

[docs]    def strike_dip(self, degrees=True):
        """
        Computes strike and dip from a normal vector.
        Results are usually the same as LLSQ
        in strike (to a few decimal places) and close in dip.
        Sometimes, dips are greater by as much as 45 degrees,
        reflecting inclusion of errors in x-y plane.
        """
        n = self.axes[2]
        r = N.linalg.norm(n)
        strike = N.degrees(N.arctan2(n[0],n[1]))-90
        dip = N.degrees(N.arccos(n[2]/r))

        # Since PCA errors are not pinned to the XYZ plane,
        # we need to make sure our results are in the
        # right quadrant.
        if dip > 90:
            dip = 180 - dip
            strike += 180

        # Proper azimuth notation
        if strike < 0:
            strike += 360

        return strike, dip

    def _rake(self):
        """
        Rake of maximum angular error relative to strike of plane
        (this is functionally equivalent to rake of minimum error
        from dip direction)
        """
        return vector_angle(self.dip_dr, self.axes[0])

[docs]    def rake(self):
        return N.degrees(self._rake())

[docs]    def strike_dip_rake(self):
        _ = self.strike_dip()
        return (_[0],_[1], self.rake())

[docs]    def as_conic(self, level=1):

        if dot(self.axes[2],vector(0,0,1)) < 0:
            self.axes *= -1

        cov = self.covariance_matrix
        idx = N.diag_indices(3)
        ell = N.identity(4)
        ell[idx] = 1/cov[idx]*level**2 #cov*level**2#
        ell[3,3] = -1
        ell = conic(ell)

        # Translate ellipse along 3rd major axis
        ell = ell.translate(self.offset)

        # Rotate ellipse matrix into cartesian
        # plane
        R = augment(self.axes)
        return ell.transform(R)

[docs]    def as_hyperbola(self, rotated=False):
        """
        Hyperbolic error area
        """
        idx = N.diag_indices(3)
        _ = 1/self.covariance_matrix[idx]
        d = list(_)
        d[-1] *= -1

        arr = N.identity(4)*-1
        arr[idx] = d
        hyp = conic(arr)
        if rotated:
            R = augment(self.axes)
            hyp = hyp.transform(R)
        return hyp

    def _ellipse(self, level=1):

        ell = self.as_conic(level=level)

        con, matrix, center = ell.projection()
        ax = con.major_axes()

        # Rotate major axes into 3d space
        axs_ = N.append(ax,N.zeros((2,1)),axis=1)
        axs = dot(axs_,matrix[:3])
        u = N.linspace(0,2*N.pi,1000)

        # Get a bundle of vectors defining cone
        # which circumscribes ellipsoid
        angles = N.array([N.cos(u),N.sin(u)]).T
        # Turn into vectors
        return dot(angles,axs),center

[docs]    def plane_errors(self, **kwargs):
        return plane_errors(self.axes,self.covariance_matrix, **kwargs)

[docs]    def error_coords(self, **kwargs):
        return error_coords(self.axes,self.covariance_matrix, **kwargs)

    @property
    def slope(self):
        _ = self.coefficients
        mag = N.linalg.norm(_)
        return N.arccos(_[2]/mag)

[docs]    def error_ellipse(self, spherical=True, vector=False, level=1):
        data,center = self._ellipse(level)
        data += center

        r = N.linalg.norm(data,axis=1)
        plunge = N.arcsin(data[:,2]/r)
        trend = N.arctan2(data[:,0],data[:,1])

        return (trend,plunge)

[docs]    def to_mapping(self,**values):
        values.setdefault('centered_array',self.centered_array.tolist())
        values.setdefault('center',self.center.tolist())
        if self.member_of is not None:
            values['member_of'] = self.member_of.hash

        return super().to_mapping(**values)

    def __repr__(self):
        sdr = self.strike_dip_rake()
        ae = self.angular_errors()
        return ("Orientation:: strike: {0:.2f} dip: {1:.2f}\n"
                "      error:: min: {3:.2f} max: {4:.2f} rake: {2:.2f}"
                .format(sdr[0],sdr[1],sdr[2], ae[0],ae[1]))
Source code for attitude.orientation.pca

Attitude

Navigation

Related Topics