fosanalysis/filtering_8py_source.html

r"""

Contains class definitions for filtering algorithms.

Those can be leveraged to deal with noise, e.g.\ by smoothing neighboring data points.


\author Bertram Richter

\date 2022

"""


from abc import abstractmethod

import copy


import numpy as np


from fosanalysis import utils

from . import base


class Filter(base.Task):
    r"""
    Abstract base class for filter classes.

    Filters derived from this class modify the values of the data arrays,
    but leave the shape of the arrays untouched.

    To reduce/avoid boundary effects, generally crop the data after smoothing.
    """


class Limit(Filter):
    r"""
    Filter clamping the entries of the data to a closed interval.

    Each entry \f$y_i\f$ of the result satisfies \f$y_i \in [x_{\mathrm{min}},\: x_{\mathrm{max}}]\f$.
    Entries exceeding a limit are replaced by that limit, following
    \f[y_i = \min\left(\max\left(x_i,\: x_{\mathrm{min}}\right),\: x_{\mathrm{max}}\right)\f].
    A limit, which is `None`, is not applied.
    """

    def __init__(self,
            minimum: float = None,
            maximum: float = None,
            *args, **kwargs):
        r"""
        Construct an instance of the class.
        \param minimum \copydoc minimum
        \param maximum \copydoc maximum
        \param *args Additional positional arguments, will be passed to the superconstructor.
        \param **kwargs Additional keyword arguments, will be passed to the superconstructor.
        """
        super().__init__(*args, **kwargs)
        ## Minimal value, which will be included in the result.
        ## If set to `None`, no lower limit is applied.
        self.minimum = minimum
        ## Maximal value, which will be included in the result.
        ## If set to `None`, no upper limit is applied.
        self.maximum = maximum

    def run(self,
            x: np.array,
            y: np.array,
            z: np.array,
            make_copy: bool = True,
            timespace: str = "2d",
            minimum: float = None,
            maximum: float = None,
            *args, **kwargs) -> tuple:
        r"""
        Clamp the entries of the given data to the specified range.
        Entries below `minimum` are raised to `minimum`,
        entries above `maximum` are lowered to `maximum`.
        All arguments are handed over to the `run()` of the superclass.
        \copydetails preprocessing.base.Task.run()
        \param minimum \copydoc minimum
            Defaults to \ref minimum.
        \param maximum \copydoc maximum
            Defaults to \ref maximum.
        """
        # The limits travel as keyword arguments, so they are expected to
        # arrive in _limit() via _run_1d()/_run_2d() (dispatch happens in
        # the superclass, which is not part of this file).
        return super().run(
            x, y, z, *args,
            timespace=timespace,
            make_copy=make_copy,
            minimum=minimum,
            maximum=maximum,
            **kwargs)

    def _run_1d(self,
            x: np.array,
            z: np.array,
            *args, **kwargs) -> tuple:
        r"""
        One-dimensional operation: clamp `z`, hand back `x` untouched.
        \param x Array of abscissa data, returned as it is.
        \param z Array of data to be limited.
        \param *args Additional positional arguments, passed to \ref _limit().
        \param **kwargs Additional keyword arguments, passed to \ref _limit().
        \return Returns a tuple like `(x, z)`.
        """
        limited = self._limit(z, *args, **kwargs)
        return x, limited

    def _run_2d(self,
            x: np.array,
            y: np.array,
            z: np.array,
            *args, **kwargs) -> tuple:
        r"""
        Two-dimensional operation: clamp `z`, hand back `x` and `y` untouched.
        \param x Array of data along the first axis, returned as it is.
        \param y Array of data along the second axis, returned as it is.
        \param z Array of data to be limited.
        \param *args Additional positional arguments, passed to \ref _limit().
        \param **kwargs Additional keyword arguments, passed to \ref _limit().
        \return Returns a tuple like `(x, y, z)`.
        """
        limited = self._limit(z, *args, **kwargs)
        return x, y, limited

    def _limit(self,
            z: np.array,
            minimum: float = None,
            maximum: float = None,
            *args, **kwargs) -> np.array:
        r"""
        Clamp the values of the array element-wise.
        \param z Array with data to be limited.
        \param minimum \copydoc minimum
            Defaults to \ref minimum.
        \param maximum \copydoc maximum
            Defaults to \ref maximum.
        \param *args Additional positional arguments, ignored.
        \param **kwargs Additional keyword arguments, ignored.
        \return Returns the limited data.
            If neither limit is set, `z` itself is returned.
        """
        # Explicitly passed limits take precedence over the attributes.
        lower = self.minimum if minimum is None else minimum
        upper = self.maximum if maximum is None else maximum
        limited = z
        if lower is not None:
            # Raise everything below the lower limit.
            limited = np.maximum(limited, lower)
        if upper is not None:
            # Lower everything above the upper limit.
            limited = np.minimum(limited, upper)
        return limited


class SlidingFilter(Filter):
    r"""
    Abstract base class for filter classes, based on sliding windows.

    The data is processed by \ref utils.windows.sliding_window_function(),
    which is given the data, the window \ref radius and the function
    specified by \ref method.
    The result is written to the central pixel of the window.
    To reduce/avoid boundary effects, generally crop the data after smoothing.
    """

    def __init__(self,
            radius: int,
            method: str,
            pad_mode: str = None,
            *args, **kwargs):
        r"""
        Construct an instance of the class.
        As this is an abstract class, it may not be instantiated directly itself.
        \param radius \copydoc radius
        \param method \copydoc method
        \param pad_mode \copydoc pad_mode
        \param *args Additional positional arguments, will be passed to the superconstructor.
        \param **kwargs Additional keyword arguments, will be passed to the superconstructor.
        """
        super().__init__(*args, **kwargs)
        ## Smoothing radius for the data, number of entries of data to
        ## each side to be taken into account.
        ## With a radius of `0`, the data is returned unchanged.
        self.radius = radius
        ## Specify, how the data is smoothed.
        ## Either a callable or the name of a function of `numpy`
        ## (looked up with `getattr(np, method)`).
        self.method = method
        ## Mode for padding the edges of the result array.
        ## NOTE(review): stored here, but \ref _slide() does not forward
        ## it to the window function -- confirm, whether this is intended.
        self.pad_mode = pad_mode

    def run(self,
            x: np.array,
            y: np.array,
            z: np.array,
            timespace: str = None,
            make_copy: bool = True,
            radius: int = None,
            method: str = None,
            *args, **kwargs) -> tuple:
        r"""
        The given data is filtered with a sliding window.
        All arguments are handed over to the `run()` of the superclass.
        \copydetails SlidingFilter
        \copydetails preprocessing.base.Task.run()
        \param radius \copydoc radius Defaults to \ref radius.
        \param method \copydoc method Defaults to \ref method.
        """
        # radius and method travel as keyword arguments, so they are
        # expected to arrive in _slide() via _run_1d()/_run_2d() (dispatch
        # happens in the superclass, which is not part of this file).
        return super().run(
            x, y, z, *args,
            timespace=timespace,
            make_copy=make_copy,
            radius=radius,
            method=method,
            **kwargs)

    def _run_1d(self,
            x: np.array,
            z: np.array,
            *args, **kwargs) -> tuple:
        r"""
        One-dimensional operation: filter `z`, hand back `x` untouched.
        \param x Array of abscissa data, returned as it is.
        \param z Array of data to be filtered.
        \param *args Additional positional arguments, passed to \ref _slide().
        \param **kwargs Additional keyword arguments, passed to \ref _slide().
        \return Returns a tuple like `(x, z)`.
        """
        filtered = self._slide(z, *args, **kwargs)
        return x, filtered

    def _run_2d(self,
            x: np.array,
            y: np.array,
            z: np.array,
            *args, **kwargs) -> tuple:
        r"""
        Two-dimensional operation: filter `z`, hand back `x` and `y` untouched.
        \param x Array of data along the first axis, returned as it is.
        \param y Array of data along the second axis, returned as it is.
        \param z Array of data to be filtered.
        \param *args Additional positional arguments, passed to \ref _slide().
        \param **kwargs Additional keyword arguments, passed to \ref _slide().
        \return Returns a tuple like `(x, y, z)`.
        """
        filtered = self._slide(z, *args, **kwargs)
        return x, y, filtered

    def _slide(self,
            z: np.array,
            radius = None,
            method: str = None,
            *args, **kwargs) -> np.array:
        r"""
        Move the window over the input array and apply \ref method on it.
        The central pixel of the window \f$x_{i}\f$ is assigned the value
        \f[
            x_{i} \gets \mathrm{op}(x_{j,\:\ldots,\:k}) \text{ with } j = i -r \text{ and } k = i + r.
        \f]
        \param z Array of strain data.
        \param radius \copydoc radius Defaults to \ref radius.
        \param method \copydoc method Defaults to \ref method.
        \param *args Additional positional arguments, will be ignored.
        \param **kwargs Additional keyword arguments, will be ignored.
        \return Returns an array with the same shape as `z`.
            For a radius of `0`, `z` itself is returned.
        """
        # Explicitly passed settings take precedence over the attributes.
        if radius is None:
            radius = self.radius
        if method is None:
            method = self.method
        # A callable is used directly, anything else is taken as the name
        # of a numpy function. The lookup is done before the radius check,
        # hence an invalid name is reported even for a radius of 0.
        if callable(method):
            operation = method
        else:
            operation = getattr(np, method)
        if radius == 0:
            # A window without neighbors leaves the data as it is.
            return z
        return utils.windows.sliding_window_function(z, radius, operation)


class Cluster(Filter):
    r"""
    The Cluster filter is an iterative smoothing algorithm guaranteed to converge \cite Lou_2020_ApplicationofClustering.

    The one-dimensional signal to filter consists of abscissa data \f$\mathbf{x}\f$ and according ordinate data (measured values) \f$\mathbf{z}\f$.
    For the \f$k\f$th entry (pixel), consisting of its location \f$x_{k}\f$ and its original value \f$z_{k}\f$, a value is estimated iteratively.
    The pixel value estimate \f$z^{(t+1)}_{k}\f$ for the next iteration step \f$t+1\f$ is determined by (see \ref _new_z_t()):
    \f[
        z^{(t+1)}_{k} = \frac{
            \sum_{i} z_{i} w_{i} \exp\left(- \beta^{(t)} \left(z_{i} - z^{(t)}_{k}\right)^{2}\right)
        }{
            \sum_{i} w_{i} \exp\left(- \beta^{(t)} \left(z_{i} - z^{(t)}_{k}\right)^{2}\right)
        }.
    \f]
    Here, the \f$i\f$th pixel's position is \f$x_{i}\f$, its value is \f$z_{i}\f$ and \f$w_{i}\f$ is its weight.
    The weight indicates the influence on the currently optimized pixel at position \f$x_{k}\f$
    and drops exponentially with the distance from the current pixel (see \ref _get_weights())
    \f[
        w_{i} = \exp\left(-\alpha ||x_{i} - x_{k}||^{2}\right)
    \f]
    with \f$|| x_{i} - x_{k} ||^{2}\f$ being the squared Euclidean norm.
    The main parameter for the filter is \f$\alpha\f$, which controls the weight falloff and hence, the filter's scale.
    It can be calculated from a target weight and distance with \ref estimate_alpha().
    The locality parameter \f$\beta\f$ based on the local variance is estimated to (see \ref _get_beta()):
    \f[
        \beta^{(t)} = \frac{
            \sum_{i} w_{i}
        }{
            2 \sum_{i} \left(z_{i}-z^{(t)}_{k}\right)^{2} w_{i}
        }.
    \f]
    If the weighted variance in the denominator is zero, all contributing
    pixels already equal the estimate and the estimate is kept (see \ref _new_z_t()).
    The initial guess \f$z^{(0)}_{k}\f$ is estimated by (see \ref _initial_z()):
    \f[
        z^{(0)}_{k} = \frac{
            \sum_{i} z_{i} w_{i}
        }{
            \sum_{i} w_{i}
        }.
    \f]
    After each iteration, the estimate change is
    \f[
        \Delta z^{(t)}_{k} = |z^{(t-1)}_{k} - z^{(t)}_{k}|
    \f]
    calculated and the iteration is stopped if this change falls below the predefined threshold \f$\Delta z_{\mathrm{tol}}\f$:
    \f[
        \Delta z^{(t)}_{k} \leq \Delta z_{\mathrm{tol}}.
    \f]
    This process is repeated for all pixels.
    """

    def __init__(self,
            alpha: float,
            tolerance: float = 0.1,
            fill: bool = False,
            *args, **kwargs):
        r"""
        Construct a Cluster object.
        \param alpha \copybrief alpha \copydetails alpha For more, see \ref alpha.
        \param tolerance \copybrief tolerance \copydetails tolerance
        \param fill \copybrief fill \copydetails fill
        \param *args Additional positional arguments, will be passed to the superconstructor.
        \param **kwargs Additional keyword arguments, will be passed to the superconstructor.
        """
        super().__init__(*args, **kwargs)
        ## Falloff parameter for the weight function.
        ## Needs to be non-negative, this is checked by the property setter.
        ## It can be estimated with \ref estimate_alpha().
        self.alpha = alpha
        ## Stopping criterion for the iterative process.
        ## The iteration for a pixel ends, as soon as the absolute change
        ## of the estimate between two steps does not exceed this value.
        self.tolerance = tolerance
        ## Switch, whether missing data should be interpolated.
        ## If `True`, an estimate is calculated for pixels with non-finite
        ## values as well, otherwise those pixels are left as they are.
        self.fill = fill

    @property
    def alpha(self):
        r"""
        Falloff parameter \f$\alpha\f$ for the weight function, see \ref _get_weights().
        """
        return self._alpha

    @alpha.setter
    def alpha(self, alpha):
        r"""
        Set the falloff parameter after checking that it is non-negative.
        \param alpha New value for \f$\alpha\f$, needs to be non-negative.
        """
        # NOTE(review): assert statements are removed when Python runs
        # with -O. Kept, because callers may rely on AssertionError.
        assert alpha >= 0, "The scaling value alpha needs to be non-negative!"
        self._alpha = alpha

    def _run_1d(self,
            x: np.array,
            z: np.array,
            *args, **kwargs) -> tuple:
        r"""
        Carry out the filtering on one-dimensional data.

        For each pixel, the estimate is initialized by \ref _initial_z()
        and refined by \ref _new_z_t(), until the change of the estimate
        does not exceed \ref tolerance.
        Pixels with non-finite values never contribute to an estimate.
        They are only estimated themselves, if \ref fill is `True`.
        \copydetails fosanalysis.preprocessing.base.Task._run_1d()
        """
        z_filtered = copy.deepcopy(z)
        # Working copy, in which non-finite entries are set to 0.
        # Together with their weight of 0, this keeps those entries from
        # turning the weighted sums into NaN.
        z_zero = copy.deepcopy(z)
        nan_array = np.logical_not(np.isfinite(z_zero))
        z_zero[nan_array] = 0
        iterator = np.nditer(z_zero, flags=["multi_index"])
        for _ in iterator:
            # Only the index is needed, the value is not used.
            pixel = iterator.multi_index
            if self.fill or not nan_array[pixel]:
                weights_array = self._get_weights(pixel, x)
                weights_array[nan_array] = 0
                z_t = self._initial_z(z_zero, weights_array)
                improvement = np.inf
                while abs(improvement) > self.tolerance:
                    z_t_new = self._new_z_t(z_zero, weights_array, z_t)
                    improvement = z_t_new - z_t
                    z_t = z_t_new
                z_filtered[pixel] = z_t
        return x, z_filtered

    def _run_2d(self,
            x: np.array,
            y: np.array,
            z: np.array,
            *args, **kwargs) -> tuple:
        r"""
        Cluster has no true 2D operation mode.
        Set \ref timespace to `"1d_space"`!
        """
        raise NotImplementedError("Cluster does not support true 2D operation. Try `timespace='1d_space'` instead.")

    def _get_weights(self,
            pixel: int,
            x_array: np.array,
            ) -> np.array:
        r"""
        Calculate the array of weights for the current position.
        The weight \f$w_i\f$ of the \f$i\f$th element on the current
        element is calculated as
        \f[
            w_{i} = \exp\left(-\alpha || x_{i} - x ||^{2}\right).
        \f]
        \param pixel Position (index) of the current datapoint to estimate.
        \param x_array Array of abscissa data.
        \return Returns an array of weights with the same shape as `x_array`.
        """
        position = x_array[pixel]
        dist = np.square(x_array - position)
        return np.exp(-self.alpha * dist)

    def _get_beta(self,
            z_dist_array: np.array,
            weights_array: np.array,
            ) -> float:
        r"""
        Calculate the locality parameter \f$\beta\f$.
        The locality parameter \f$\beta\f$ depends on the local variance.
        It is calculated as
        \f[
            \beta^{(t)} = \frac{
                \sum_{i} w_{i}
            }{
                2 \sum_{i} \left(z_{i}-z^{(t)}_{k}\right)^{2} w_{i}
            }.
        \f]
        The result is not finite, if the weighted sum of the squared
        distances is zero. \ref _new_z_t() avoids calling this function
        in that case.
        \param z_dist_array 1D-array of the squared distances of all values to the current estimate.
        \param weights_array 1D-array containing the weights.
        """
        return 0.5 * np.sum(weights_array)/np.sum(weights_array * z_dist_array)

    def _initial_z(self,
            z_array: np.array,
            weights_array:np.array,
            ) -> float:
        r"""
        Guess the initial estimate.
        The initial estimate \f$z^{(0)}\f$ is the weighted mean
        \f[
            z^{(0)} = \frac{\sum_{i} z_{i} w_{i}}{\sum_{i} w_{i}}.
        \f]
        \param z_array 1D-array of the original ordinate data.
        \param weights_array 1D-array containing the weights.
        """
        return np.sum(weights_array * z_array)/np.sum(weights_array)

    def _new_z_t(self,
            z_array: np.array,
            weights_array: np.array,
            z_t: float,
            ) -> float:
        r"""
        Calculate the next iteration estimate.
        The next estimate \f$z^{(t+1)}_{k}\f$ is calculated as
        \f[
            z^{(t+1)}_{k} = \frac{
                \sum_{i} z_{i} w_{i} \exp\left(- \beta^{(t)} \left(z_{i} - z^{(t)}_{k}\right)^{2}\right)
            }{
                \sum_{i} w_{i} \exp\left(- \beta^{(t)} \left(z_{i} - z^{(t)}_{k}\right)^{2}\right)
            }.
        \f]
        Here, the \f$i\f$th pixel's position is \f$x_{i}\f$, its value is \f$z_{i}\f$ and \f$w_{i}\f$ is its weight.
        The weight indicates the influence on the currently optimized pixel at position \f$x_{k}\f$
        and drops exponentially with the distance from the current pixel.

        If the weighted sum of the squared distances to `z_t` is not
        positive, `z_t` is returned unchanged.
        \param z_array 1D-array of the original ordinate data.
        \param weights_array 1D-array containing the weights.
        \param z_t Estimate of the previous iteration step for the current pixel.
        \return Returns the estimate for the next iteration step.
        """
        z_dist_array = np.square(z_array - z_t)
        # With zero weighted variance, every pixel with a non-zero weight
        # already equals z_t, so z_t is the fixed point of the iteration.
        # Without this guard, beta would be infinite and `inf * 0` inside
        # the exponential would turn the estimate into NaN.
        # The negated comparison also hands through a NaN estimate as is.
        if not np.sum(weights_array * z_dist_array) > 0:
            return z_t
        beta = self._get_beta(z_dist_array, weights_array)
        weighted = weights_array * np.exp(-beta * z_dist_array)
        numerator = np.sum(z_array * weighted)
        denominator = np.sum(weighted)
        return numerator/denominator

    def estimate_alpha(self,
            weight: float,
            length: float,
            ):
        r"""
        Calculate the weight falloff parameter \f$\alpha\f$, see \ref alpha.
        It is calculated as
        \f[
            \alpha = -\frac{\ln w}{l^2}
        \f]
        The result is returned only, \ref alpha is not modified.
        \param weight Target weight \f$w\f$, needs to be greater than 0.
        \param length Target distance \f$l\f$, needs to be greater than 0.
        \return Returns the value for \f$\alpha\f$, for which a pixel at
            the distance `length` is assigned the weight `weight`.
        """
        assert weight > 0, "weight and length must be greater than 0!"
        assert length > 0, "weight and length must be greater than 0!"
        return -np.log(weight)/(np.square(length))


fosanalysis.preprocessing.base.Task
Abstract base class for preprocessing task classes.
Definition base.py:56

fosanalysis.preprocessing.filtering.Cluster
The Cluster filter is an iterative smoothing algorithm guaranteed to converge lou_2020_applicationofc...
Definition filtering.py:216

fosanalysis.preprocessing.filtering.Cluster._alpha
_alpha
Definition filtering.py:301

fosanalysis.preprocessing.filtering.Cluster._initial_z
float _initial_z(self, np.array z_array, np.array weights_array)
Guess the initial estimate.
Definition filtering.py:378

fosanalysis.preprocessing.filtering.Cluster._run_2d
tuple _run_2d(self, np.array x, np.array y, np.array z, *args, **kwargs)
Cluster has no true 2D operation mode.
Definition filtering.py:333

fosanalysis.preprocessing.filtering.Cluster._new_z_t
float _new_z_t(self, np.array z_array, np.array weights_array, float z_t)
Definition filtering.py:393

fosanalysis.preprocessing.filtering.Cluster.fill
fill
Switch, whether missing data should be interpolated.
Definition filtering.py:294

fosanalysis.preprocessing.filtering.Cluster._run_1d
tuple _run_1d(self, np.array x, np.array z, *args, **kwargs)
Carry out the filtering on one-dimensional data.
Definition filtering.py:305

fosanalysis.preprocessing.filtering.Cluster.tolerance
tolerance
Stopping criterion for the iterative process.
Definition filtering.py:291

fosanalysis.preprocessing.filtering.Cluster.alpha
alpha
Falloff parameter for the weight function.
Definition filtering.py:286

fosanalysis.preprocessing.filtering.Cluster.__init__
__init__(self, float alpha, float tolerance=0.1, bool fill=False, *args, **kwargs)
Construct a Cluster object.
Definition filtering.py:268

fosanalysis.preprocessing.filtering.Cluster._get_beta
float _get_beta(self, np.array z_dist_array, np.array weights_array)
Definition filtering.py:359

fosanalysis.preprocessing.filtering.Cluster._get_weights
np.array _get_weights(self, int pixel, np.array x_array)
Calculate the array of weights for the current position.
Definition filtering.py:342

fosanalysis.preprocessing.filtering.Cluster.estimate_alpha
estimate_alpha(self, float weight, float length)
Calculate the weight falloff parameter α, see alpha.
Definition filtering.py:420

fosanalysis.preprocessing.filtering.Filter
Abstract base class for filter classes.
Definition filtering.py:18

fosanalysis.preprocessing.filtering.Limit
A filter to limit the entries.
Definition filtering.py:26

fosanalysis.preprocessing.filtering.Limit._run_2d
tuple _run_2d(self, np.array x, np.array y, np.array z, *args, **kwargs)
Native two-dimensional operation implementation.
Definition filtering.py:85

fosanalysis.preprocessing.filtering.Limit.maximum
maximum
Maximal value, which will be included in the result.
Definition filtering.py:52

fosanalysis.preprocessing.filtering.Limit._limit
np.array _limit(self, np.array z, float minimum=None, float maximum=None, *args, **kwargs)
Limit the values of the array.
Definition filtering.py:91

fosanalysis.preprocessing.filtering.Limit.__init__
__init__(self, float minimum=None, float maximum=None, *args, **kwargs)
Construct an instance of the class.
Definition filtering.py:36

fosanalysis.preprocessing.filtering.Limit.run
tuple run(self, np.array x, np.array y, np.array z, bool make_copy=True, str timespace="2d", float minimum=None, float maximum=None, *args, **kwargs)
Limit the entries in the given list to the specified range.
Definition filtering.py:61

fosanalysis.preprocessing.filtering.Limit.minimum
minimum
Minimal value, which will be included in the result.
Definition filtering.py:48

fosanalysis.preprocessing.filtering.Limit._run_1d
tuple _run_1d(self, np.array x, np.array z, *args, **kwargs)
Reimplementations describe a one-dimensional operation.
Definition filtering.py:79

fosanalysis.preprocessing.filtering.SlidingFilter
Abstract base class for filter classes, based on sliding windows.
Definition filtering.py:108

fosanalysis.preprocessing.filtering.SlidingFilter.run
tuple run(self, np.array x, np.array y, np.array z, str timespace=None, bool make_copy=True, int radius=None, str method=None, *args, **kwargs)
The given data is filtered with a sliding window.
Definition filtering.py:166

fosanalysis.preprocessing.filtering.SlidingFilter.__init__
__init__(self, int radius, str method, str pad_mode=None, *args, **kwargs)
Construct an instance of the class.
Definition filtering.py:120

fosanalysis.preprocessing.filtering.SlidingFilter._run_1d
tuple _run_1d(self, np.array x, np.array z, *args, **kwargs)
Reimplementations describe a one-dimensional operation.
Definition filtering.py:183

fosanalysis.preprocessing.filtering.SlidingFilter._slide
np.array _slide(self, np.array z, radius=None, str method=None, *args, **kwargs)
Move the window over the input array and apply method on it.
Definition filtering.py:195

fosanalysis.preprocessing.filtering.SlidingFilter._run_2d
tuple _run_2d(self, np.array x, np.array y, np.array z, *args, **kwargs)
Native two-dimensional operation implementation.
Definition filtering.py:189

fosanalysis.preprocessing.filtering.SlidingFilter.pad_mode
pad_mode
Mode for padding the edges of the result array.
Definition filtering.py:157

fosanalysis.preprocessing.filtering.SlidingFilter.radius
radius
Smoothing radius for the data, number of entries of data to each side to be taken into account.
Definition filtering.py:139

fosanalysis.preprocessing.filtering.SlidingFilter.method
method
Specify, how the data is smoothed.
Definition filtering.py:153