Source code for pyunlocbox.functions

# -*- coding: utf-8 -*-

r"""
The :mod:`pyunlocbox.functions` module implements an interface for solvers to
access the functions to be optimized as well as common objective functions.

Interface
---------

The :class:`func` base class defines a common interface to all functions:

.. autosummary::

    func.cap
    func.eval
    func.prox
    func.grad

Functions
---------

Then, derived classes implement various common objective functions.

**Norm operators** (based on :class:`norm`)

.. autosummary::

    norm_l1
    norm_l2
    norm_nuclear
    norm_tv

**Projection operators** (based on :class:`proj`)

.. autosummary::

    proj_positive
    proj_b2
    proj_lineq
    proj_spsd

**Miscellaneous**

.. autosummary::

    dummy
    structured_sparsity

.. inheritance-diagram:: pyunlocbox.functions
    :parts: 2

"""

from __future__ import division

from time import time
from copy import deepcopy

import numpy as np
from scipy.optimize import minimize

from pyunlocbox import operators as op


def _soft_threshold(z, T, handle_complex=True):
    r"""
    Return the soft thresholded signal.

    The magnitude of every entry of `z` is reduced by `T` (and clipped at
    zero) while its sign, or its phase for complex entries, is preserved.

    Parameters
    ----------
    z : array_like
        Input signal (real or complex).
    T : float or array_like
        Threshold on the absolute value of `z`. There could be either a single
        threshold for the entire signal `z` or one threshold per dimension.
        Useful when you use weighted norms.
    handle_complex : bool
        Indicate that we should handle the thresholding of complex numbers,
        which may be slower. Default is True.

    Returns
    -------
    sz : ndarray
        Soft thresholded signal. It is complex when `z` is complex and
        `handle_complex` is True. For real input it has the data type of
        ``np.abs(z) - T``, so an integer signal thresholded by an integer
        stays an integer signal.

    Examples
    --------
    >>> from pyunlocbox import functions
    >>> functions._soft_threshold([-2, -1, 0, 1, 2], 1)
    array([-1,  0,  0,  0,  1])

    """
    # Thresholded magnitude, always real-valued.
    magnitude = np.asarray(np.maximum(np.abs(z) - T, 0))

    if not handle_complex:
        # This soft thresholding method only supports real signal.
        magnitude[...] = np.sign(z) * magnitude
        return magnitude

    # This soft thresholding method supports complex signal.
    # Multiplying by 1. transforms to float to avoid integer division.
    # In our case 0 divided by 0 should be 0, not NaN, and is not an error.
    # It corresponds to 0 thresholded by 0, which is 0. The context manager
    # restores the floating point error state even if an exception is raised.
    with np.errstate(invalid='ignore'):
        shrunk = np.nan_to_num(1. * magnitude / (magnitude + T) * z)

    if np.iscomplexobj(shrunk):
        # Writing a complex result into the real-valued magnitude buffer
        # would silently discard the imaginary part, so return it directly.
        return shrunk

    # Real input: keep the data type of the magnitude buffer.
    magnitude[...] = shrunk
    return magnitude


def _prox_star(func, z, T):
    r"""
    Proximity operator of the convex conjugate of a function.

    Parameters
    ----------
    func : object
        Function object exposing a ``prox(x, T)`` method.
    z : array_like
        Point at which the proximity operator is evaluated.
    T : float
        Regularization parameter.

    Returns
    -------
    The value ``z - T * func.prox(z / T, 1 / T)``.

    Notes
    -----
    Based on the Moreau decomposition of a vector w.r.t. a convex function.

    """
    primal_part = func.prox(z / T, 1 / T)
    return z - T * primal_part


class func(object):
    r"""
    This class defines the function object interface.

    It is intended to be a base class for standard functions which will
    implement the required methods. It can also be instantiated by user code
    and dynamically modified for rapid testing.  The instanced objects are
    meant to be passed to the :func:`pyunlocbox.solvers.solve` solving
    function.

    Parameters
    ----------
    y : array_like, optional
        Measurements. Default is 0.
    A : function or ndarray, optional
        The forward operator. Default is the identity, :math:`A(x)=x`. If `A`
        is an ``ndarray``, it will be converted to the operator form.
    At : function or ndarray, optional
        The adjoint operator. If `At` is an ``ndarray``, it will be converted
        to the operator form. If `A` is an ``ndarray``, default is the
        transpose of `A`.  If `A` is a function, default is `A`,
        :math:`At(x)=A(x)`.
    tight : bool, optional
        ``True`` if `A` is a tight frame (semi-orthogonal linear transform),
        ``False`` otherwise. Default is ``True``.
    nu : float, optional
        Bound on the norm of the operator `A`, i.e. :math:`\|A(x)\|^2 \leq \nu
        \|x\|^2`. Default is 1.
    tol : float, optional
        The tolerance stopping criterion. The exact definition depends on the
        function object, please see the documentation of the considered
        function. Default is 1e-3.
    maxit : int, optional
        The maximum number of iterations. Default is 200.

    Any additional keyword argument is accepted and ignored by this base
    class.

    Examples
    --------

    Let's define a parabola as an example of the manual implementation of a
    function object :

    >>> from pyunlocbox import functions
    >>> f = functions.func()
    >>> f._eval = lambda x: x**2
    >>> f._grad = lambda x: 2*x
    >>> x = [1, 2, 3, 4]
    >>> f.eval(x)
    array([ 1,  4,  9, 16])
    >>> f.grad(x)
    array([2, 4, 6, 8])
    >>> f.cap(x)
    ['EVAL', 'GRAD']

    """

    def __init__(self, y=0, A=None, At=None, tight=True, nu=1, tol=1e-3,
                 maxit=200, **kwargs):

        # The measurements are always exposed as a callable returning an
        # array, whether they were given as a value or as a function.
        if callable(y):
            self.y = lambda: np.asarray(y())
        else:
            self.y = lambda: np.asarray(y)

        if A is None:
            self.A = lambda x: x
        else:
            if callable(A):
                self.A = A
            else:
                # Transform matrix form to operator form.
                self.A = lambda x: A.dot(x)

        if At is None:
            # Derive the adjoint from the forward operator.
            if A is None:
                self.At = lambda x: x
            elif callable(A):
                self.At = A
            else:
                self.At = lambda x: A.T.dot(x)
        else:
            if callable(At):
                self.At = At
            else:
                # Transform matrix form to operator form.
                self.At = lambda x: At.dot(x)

        self.tight = tight
        self.nu = nu
        self.tol = tol
        self.maxit = maxit

        # Should be initialized if called alone, updated by solve().
        self.verbosity = 'NONE'

    def eval(self, x):
        r"""
        Function evaluation.

        Parameters
        ----------
        x : array_like
            The evaluation point. If `x` is a matrix, the function gets
            evaluated for each column, as if it was a set of independent
            problems. Some functions, like the nuclear norm, are only defined
            on matrices.

        Returns
        -------
        z : float
            The objective function evaluated at `x`. If `x` is a matrix, the
            sum of the objectives is returned.

        Notes
        -----
        This method is required by the :func:`pyunlocbox.solvers.solve` solving
        function to evaluate the objective function. Each function class
        should therefore define it.

        The value is printed when the verbosity is 'LOW' or 'HIGH'.

        """
        sol = self._eval(np.asarray(x))
        if self.verbosity in ['LOW', 'HIGH']:
            name = self.__class__.__name__
            print('    {} evaluation: {:e}'.format(name, sol))
        return sol

    def _eval(self, x):
        raise NotImplementedError("Class user should define this method.")

    def prox(self, x, T):
        r"""
        Function proximal operator.

        Parameters
        ----------
        x : array_like
            The evaluation point. If `x` is a matrix, the function gets
            evaluated for each column, as if it was a set of independent
            problems. Some functions, like the nuclear norm, are only defined
            on matrices.
        T : float
            The regularization parameter.

        Returns
        -------
        z : ndarray
            The proximal operator evaluated for each column of `x`.

        Notes
        -----
        The proximal operator is defined by
        :math:`\operatorname{prox}_{\gamma f}(x) = \operatorname{arg\,min}
        \limits_z \frac{1}{2} \|x-z\|_2^2 + \gamma f(z)`

        This method is required by some solvers.

        When the map A in the function construction is a tight frame
        (semi-orthogonal linear transformation), we can use property (x) of
        Table 10.1 in :cite:`combettes:2011iq` to compute the proximal
        operator of the composition of A with the base function. Whenever
        this is not the case, we have to resort to some iterative procedure,
        which may be very inefficient.

        """
        return self._prox(np.asarray(x), T)

    def _prox(self, x, T):
        raise NotImplementedError("Class user should define this method.")

    def grad(self, x):
        r"""
        Function gradient.

        Parameters
        ----------
        x : array_like
            The evaluation point. If `x` is a matrix, the function gets
            evaluated for each column, as if it was a set of independent
            problems. Some functions, like the nuclear norm, are only defined
            on matrices.

        Returns
        -------
        z : ndarray
            The objective function gradient evaluated for each column of `x`.

        Notes
        -----
        This method is required by some solvers.

        """
        return self._grad(np.asarray(x))

    def _grad(self, x):
        raise NotImplementedError("Class user should define this method.")

    def cap(self, x):
        r"""
        Test the capabilities of the function object.

        Parameters
        ----------
        x : array_like
            The evaluation point. Not really needed, but this function calls
            the methods of the object to test if they can properly execute
            without raising an exception. Therefore it needs some evaluation
            point with a consistent size.

        Returns
        -------
        cap : list of string
            A list of capabilities ('EVAL', 'GRAD', 'PROX').

        Notes
        -----
        Only :class:`NotImplementedError` marks a capability as missing. Any
        other exception raised by the tested methods is propagated to the
        caller, after the verbosity of the object has been restored.

        """
        probes = [
            ('EVAL', self.eval, (x,)),
            ('GRAD', self.grad, (x,)),
            ('PROX', self.prox, (x, 1)),
        ]

        # Silence the object while probing. The try/finally guarantees that
        # the verbosity is restored even if a probe fails unexpectedly.
        saved_verbosity = self.verbosity
        self.verbosity = 'NONE'
        cap = []
        try:
            for name, method, args in probes:
                try:
                    method(*args)
                except NotImplementedError:
                    continue
                cap.append(name)
        finally:
            self.verbosity = saved_verbosity
        return cap


class dummy(func):
    r"""
    Dummy function (eval, prox, grad).

    This can be used as a second function object when there is only one
    function to minimize. It always evaluates as 0.

    Examples
    --------
    >>> from pyunlocbox import functions
    >>> f = functions.dummy()
    >>> x = [1, 2, 3, 4]
    >>> f.eval(x)
    0
    >>> f.prox(x, 1)
    array([1, 2, 3, 4])
    >>> f.grad(x)
    array([0, 0, 0, 0])

    """

    def __init__(self, **kwargs):
        # Keyword-only constructor: positional arguments are rejected so that
        # parameters cannot be passed in the wrong order.
        super().__init__(**kwargs)

    def _eval(self, x):
        # The function is identically zero.
        return 0

    def _prox(self, x, T):
        # The proximal operator of the zero function is the identity.
        return x

    def _grad(self, x):
        # The gradient of the zero function is zero everywhere.
        return np.zeros_like(x)


class norm(func):
    r"""
    Base class which defines the attributes of the `norm` objects.

    See generic attributes descriptions of the
    :class:`pyunlocbox.functions.func` base class.

    Parameters
    ----------
    lambda_ : float, optional
        Regularization parameter :math:`\lambda`. Default is 1.
    w : array_like, optional
        Weights for a weighted norm. Default is 1. Stored as an ``ndarray``.

    """

    def __init__(self, lambda_=1, w=1, **kwargs):
        # The remaining keyword arguments configure the generic interface.
        super().__init__(**kwargs)
        self.w = np.asarray(w)
        self.lambda_ = lambda_


class norm_l1(norm):
    r"""
    L1-norm (eval, prox).

    See generic attributes descriptions of the
    :class:`pyunlocbox.functions.norm` base class. Note that the constructor
    takes keyword-only parameters.

    Notes
    -----
    * The L1-norm of the vector `x` is given by
      :math:`\lambda \|w \cdot (A(x)-y)\|_1`.
    * The L1-norm proximal operator evaluated at `x` is given by
      :math:`\operatorname{arg\,min}\limits_z \frac{1}{2} \|x-z\|_2^2 + \gamma
      \|w \cdot (A(z)-y)\|_1` where :math:`\gamma = \lambda \cdot T`. This is
      simply a soft thresholding.
    * The proximal operator is only implemented for tight frames and raises
      :class:`NotImplementedError` otherwise.

    Examples
    --------
    >>> from pyunlocbox import functions
    >>> f = functions.norm_l1()
    >>> f.eval([1, 2, 3, 4])
    10
    >>> f.prox([1, 2, 3, 4], 1)
    array([0., 1., 2., 3.])

    """

    def __init__(self, **kwargs):
        # Keyword-only constructor: positional arguments are rejected so that
        # parameters cannot be passed in the wrong order.
        super().__init__(**kwargs)

    def _eval(self, x):
        residual = self.A(x) - self.y()
        weighted = self.w * residual
        return self.lambda_ * np.sum(np.abs(weighted))

    def _prox(self, x, T):
        # Gamma is T in the matlab UNLocBox implementation.
        gamma = self.lambda_ * T

        if not self.tight:
            raise NotImplementedError('Not implemented for non-tight frame.')

        # Nati: I've checked this code the use of 'y' seems correct
        residual = self.A(x) - self.y()
        threshold = gamma * self.nu * self.w
        # Change applied to the residual by the soft thresholding, mapped
        # back to the signal domain through the adjoint operator.
        correction = _soft_threshold(residual, threshold) - residual
        return x + self.At(correction) / self.nu


class norm_l2(norm):
    r"""
    L2-norm (eval, prox, grad).

    See generic attributes descriptions of the
    :class:`pyunlocbox.functions.norm` base class. Note that the constructor
    takes keyword-only parameters.

    Notes
    -----
    * The squared L2-norm of the vector `x` is given by
      :math:`\lambda \|w \cdot (A(x)-y)\|_2^2`.
    * The squared L2-norm proximal operator evaluated at `x` is given by
      :math:`\operatorname{arg\,min}\limits_z \frac{1}{2} \|x-z\|_2^2 + \gamma
      \|w \cdot (A(z)-y)\|_2^2` where :math:`\gamma = \lambda \cdot T`.
      For a tight frame it is computed in closed form, otherwise it is
      obtained numerically with the BFGS method of
      :func:`scipy.optimize.minimize`.
    * The squared L2-norm gradient evaluated at `x` is given by
      :math:`2 \lambda \cdot At(w^2 \cdot (A(x)-y))`.

    Examples
    --------
    >>> from pyunlocbox import functions
    >>> f = functions.norm_l2()
    >>> x = [1, 2, 3, 4]
    >>> f.eval(x)
    30
    >>> f.prox(x, 1)
    array([0.33333333, 0.66666667, 1.        , 1.33333333])
    >>> f.grad(x)
    array([2, 4, 6, 8])

    """

    def __init__(self, **kwargs):
        # Keyword-only constructor: positional arguments are rejected so that
        # parameters cannot be passed in the wrong order.
        super().__init__(**kwargs)
        has_weight_vector = self.w.size > 1
        if self.tight and has_weight_vector:
            raise ValueError(
                "Cannot use tight with vector of weights. Please use a "
                "constant weight or set tight=False. Alternatively, you "
                "can merge the weights into your operator."
            )

    def _eval(self, x):
        weighted_residual = self.w * (self.A(x) - self.y())
        return self.lambda_ * np.sum(weighted_residual**2)

    def _prox(self, x, T):
        # Gamma is T in the matlab UNLocBox implementation.
        gamma = self.lambda_ * T

        if self.tight:
            # Closed-form solution; the division is done in place.
            weight_sq = self.w**2
            sol = x + 2. * gamma * self.At(self.y() * weight_sq)
            sol /= 1. + 2. * gamma * self.nu * weight_sq
            return sol

        def objective(z):
            # Proximal objective: distance to x plus the scaled norm.
            return 0.5 * np.sum((z - x)**2) + gamma * \
                np.sum((self.w * (self.A(z) - self.y()))**2)

        def gradient(z):
            # Gradient of the proximal objective w.r.t. z.
            return z - x + 2. * gamma * \
                self.At((self.w**2) * (self.A(z) - self.y()))

        res = minimize(fun=objective, x0=x, method='BFGS', jac=gradient)
        if not res.success:
            raise RuntimeError('norm_l2.prox: ' + res.message)
        return res.x

    def _grad(self, x):
        residual = self.A(x) - self.y()
        return 2 * self.lambda_ * self.At((self.w**2) * residual)


class norm_nuclear(norm):
    r"""
    Nuclear-norm (eval, prox).

    See generic attributes descriptions of the
    :class:`pyunlocbox.functions.norm` base class. Note that the constructor
    takes keyword-only parameters.

    Notes
    -----
    * The nuclear-norm of the matrix `x` is given by
      :math:`\lambda \| x \|_* = \lambda \operatorname{trace} (\sqrt{x^* x}) =
      \lambda \sum_{i=1}^N |e_i|` where `e_i` are the singular values of `x`.
    * The nuclear-norm proximal operator evaluated at `x` is given by
      :math:`\operatorname{arg\,min}\limits_z \frac{1}{2} \|x-z\|_2^2 + \gamma
      \| z \|_*` where :math:`\gamma = \lambda \cdot T`, which is a
      soft-thresholding of the singular values.
    * Both methods work on the matrix `x` directly and accept rectangular
      matrices.

    Examples
    --------
    >>> from pyunlocbox import functions
    >>> f = functions.norm_nuclear()
    >>> f.eval([[1, 2],[2, 3]])  # doctest:+ELLIPSIS
    4.47213595...
    >>> f.prox([[1, 2],[2, 3]], 1)
    array([[0.89442719, 1.4472136 ],
           [1.4472136 , 2.34164079]])

    """

    def __init__(self, **kwargs):
        # Constructor takes keyword-only parameters to prevent user errors.
        super().__init__(**kwargs)

    def _eval(self, x):
        # TODO: take care of sparse matrices.
        # Only the singular values are needed, skip the singular vectors.
        s = np.linalg.svd(x, compute_uv=False)
        return self.lambda_ * np.sum(np.abs(s))

    def _prox(self, x, T):
        # Gamma is T in the matlab UNLocBox implementation.
        gamma = self.lambda_ * T
        # TODO: take care of sparse matrices.
        # The reduced SVD keeps the shapes of the factors compatible with the
        # vector of singular values, which is required to rebuild rectangular
        # matrices. It is identical to the full SVD for square matrices.
        U, s, Vh = np.linalg.svd(x, full_matrices=False)
        s = _soft_threshold(s, gamma)
        # Scaling the rows of Vh is the product diag(s) * Vh.
        return np.dot(U, s[:, np.newaxis] * Vh)


class norm_tv(norm):
    r"""
    TV-norm (eval, prox).

    See generic attributes descriptions of the
    :class:`pyunlocbox.functions.norm` base class. Note that the constructor
    takes keyword-only parameters.

    Parameters
    ----------
    dim : int, optional
        Number of dimensions along which the gradient is computed. The
        evaluation requires ``dim >= 1`` and the proximal operator supports
        1 to 4 dimensions. Default is 2.
    verbosity : {'NONE', 'LOW', 'HIGH', 'ALL'}, optional
        Verbosity of the object. Default is 'LOW'.

    Notes
    -----
    * For ``dim >= 2`` the evaluation is the sum over all entries of
      :math:`\sqrt{\sum_d |g_d|^2}`, where the :math:`g_d` are the components
      returned by :func:`pyunlocbox.operators.grad`. For ``dim == 1`` it is
      the sum of the absolute values of the gradient.
    * All the keyword arguments given to the constructor are forwarded to
      :func:`pyunlocbox.operators.grad` and
      :func:`pyunlocbox.operators.div`. The weights `wx`, `wy`, `wz` and `wt`
      are additionally read from them by the proximal operator.
    * The attributes `lambda_` and `w` are not used by this implementation.
    * The proximal operator is computed iteratively. The iterations stop when
      the relative variation of the objective is smaller than `tol` or after
      ``maxit + 1`` iterations.

    See :cite:`beck2009fastTV` for details about the algorithm.

    Examples
    --------
    >>> import numpy as np
    >>> from pyunlocbox import functions
    >>> f = functions.norm_tv()
    >>> x = np.arange(0, 16)
    >>> x = x.reshape(4, 4)
    >>> f.eval(x)  # doctest:+ELLIPSIS
        norm_tv evaluation: 5.210795e+01
    52.10795063...

    """

    # Names of the optional per-dimension weights, in dimension order.
    _WEIGHT_KEYS = ('wx', 'wy', 'wz', 'wt')

    def __init__(self, dim=2, verbosity='LOW', **kwargs):
        super().__init__(**kwargs)
        self.kwargs = kwargs
        self.dim = dim
        self.verbosity = verbosity

    def _tv_gradients(self, x):
        r"""Return the gradient of `x` as a list with one entry per dimension."""
        grads = op.grad(x, dim=self.dim, **self.kwargs)
        # The result is used as a single array for dim == 1 and unpacked into
        # one array per dimension otherwise.
        return [grads] if self.dim == 1 else list(grads)

    def _eval(self, x):
        if self.dim >= 2:
            y = 0
            for g in op.grad(x, dim=self.dim, **self.kwargs):
                y += np.power(abs(g), 2)
            return np.sum(np.sqrt(y))

        if self.dim == 1:
            dx = op.grad(x, dim=self.dim, **self.kwargs)
            return np.sum(np.sum(np.abs(dx), axis=0))

        raise ValueError(
            'norm_tv requires dim >= 1, got {!r}.'.format(self.dim))

    def _prox(self, x, T):
        if self.dim not in (1, 2, 3, 4):
            raise ValueError(
                'norm_tv.prox supports dim in (1, 2, 3, 4), '
                'got {!r}.'.format(self.dim))
        dim = int(self.dim)

        # Time counter
        t_init = time()

        tol = self.tol
        maxit = self.maxit

        # TODO implement test_gamma
        # Initialization
        sol = x

        # Dual variables, one per dimension, initialized from the gradient of
        # a zero signal, and their projected values at the previous iteration.
        duals = self._tv_gradients(x * 0)
        previous = list(duals)

        told, prev_obj = 1., 0.

        # Largest of the weights of the considered dimensions (1 if unset).
        mt = self.kwargs.get(self._WEIGHT_KEYS[0], 1.)
        for key in self._WEIGHT_KEYS[1:dim]:
            mt = np.maximum(mt, self.kwargs.get(key, 1.))

        if self.verbosity in ['LOW', 'HIGH', 'ALL']:
            print("Proximal TV Operator")

        # Overwritten if the tolerance is reached before the last iteration.
        crit = "MAX_IT"
        niter = 0
        while niter <= maxit:
            # Current solution. Copies of the dual variables are handed to
            # the divergence operator, as the original implementation did.
            sol = x - T * op.div(*deepcopy(duals), **self.kwargs)

            #  Objective function value
            obj = 0.5 * np.power(np.linalg.norm(x[:] - sol[:]), 2) + \
                T * np.sum(self._eval(sol), axis=0)
            if obj == 0:
                # Happens for T = 0 or a signal without variation: the
                # current solution is optimal and the ratio is undefined.
                rel_obj = 0.
            else:
                rel_obj = np.abs(obj - prev_obj) / obj
            prev_obj = obj

            if self.verbosity in ['HIGH', 'ALL']:
                print("Iter: ", niter, " obj = ", obj, " rel_obj = ", rel_obj)

            # Stopping criterion
            if rel_obj < tol:
                crit = "TOL_EPS"
                break

            #  Update divergence vectors and project
            # The step is 1 / (4 * dim * T * mt^2), i.e. 4, 8, 12 and 16 in
            # the denominator for 1 to 4 dimensions.
            step = 1. / (4 * dim * T * mt**2)
            grads = self._tv_gradients(sol)
            duals = [d - step * g for d, g in zip(duals, grads)]

            if dim == 1:
                weights = np.maximum(1, np.abs(duals[0]))
            else:
                weights = np.maximum(1, np.sqrt(
                    sum(np.power(np.abs(d), 2) for d in duals)))

            # FISTA update
            # NOTE(review): the usual FISTA rule is sqrt(1 + 4 * told**2).
            # The expression is kept as it was to preserve the results.
            t = (1 + np.sqrt(4 * told**2)) / 2.
            momentum = (told - 1) / t

            projected = [d / weights for d in duals]
            duals = [p + momentum * (p - p_old)
                     for p, p_old in zip(projected, previous)]
            previous = projected

            told = t
            niter += 1

        t_end = time()
        exec_time = t_end - t_init

        if self.verbosity in ['HIGH', 'ALL']:
            print("Prox_TV: obj = {0}, rel_obj = {1}, {2}, iter = {3}".format(
                obj, rel_obj, crit, niter))
            print("exec_time = ", exec_time)
        return sol


class proj(func):
    r"""
    Base class which defines the attributes of the `proj` objects.

    See generic attributes descriptions of the
    :class:`pyunlocbox.functions.func` base class.

    Notes
    -----
    * All indicator functions (projections) evaluate to zero by definition.

    """

    def __init__(self, **kwargs):
        # Nothing specific to projections: only the generic attributes.
        super().__init__(**kwargs)

    def _eval(self, x):
        # The Matlab version returns a small delta (np.spacing(1.0), the
        # equivalent of the matlab eps = eps(1.0)) to avoid a division by 0
        # when evaluating the relative tolerance. Here the delta is added in
        # the solve function if the sum of the objective functions is zero,
        # so the indicator function simply evaluates to zero.
        return 0


class proj_positive(proj):
    r"""
    Projection on the positive octant (eval, prox).

    This function is the indicator function :math:`i_S(z)` of the set
    :math:`S = \left\{z \in \mathbb{R}^N \mid z \geq 0 \right\}`
    that is zero if :math:`z` is in the set and infinite otherwise.

    See generic attributes descriptions of the
    :class:`pyunlocbox.functions.proj` base class. Note that the constructor
    takes keyword-only parameters.

    Notes
    -----
    * The evaluation of this function is zero.
    * The proximal operator clips the negative entries to zero. It does not
      depend on the regularization parameter `T`.

    Examples
    --------
    >>> from pyunlocbox import functions
    >>> f = functions.proj_positive()
    >>> x = [-2.5, 1.5]
    >>> f.eval(x)
    0
    >>> f.prox(x, 0)
    array([0. , 1.5])

    """

    def __init__(self, **kwargs):
        # Keyword-only constructor: positional arguments are rejected so that
        # parameters cannot be passed in the wrong order.
        super().__init__(**kwargs)

    def _prox(self, x, T):
        lower, upper = 0, np.inf
        return np.clip(x, lower, upper)


class proj_spsd(proj):
    r"""
    Projection on symmetric positive semi-definite matrices (eval, prox).

    This function is the indicator function :math:`i_S(M)` of the set
    :math:`S = \left\{M \in \mathbb{R}^{N \times N}
    \mid M \succeq 0, M=M^T \right\}`
    that is zero if :math:`M` is in the set and infinite otherwise.

    See generic attributes descriptions of the
    :class:`pyunlocbox.functions.proj` base class. Note that the constructor
    takes keyword-only parameters.

    Notes
    -----
    * The evaluation of this function is zero.
    * The proximal operator symmetrizes the matrix (conjugate transpose for
      complex input), then sets the negative eigenvalues to zero. It does
      not depend on the regularization parameter `T`.

    Examples
    --------
    >>> from pyunlocbox import functions
    >>> f = functions.proj_spsd()
    >>> A = np.array([[0, -1] , [-1, 1]])
    >>> A = (A + A.T) / 2  # Symmetrize the matrix.
    >>> np.linalg.eig(A)[0]
    array([-0.61803399,  1.61803399])
    >>> f.eval(A)
    0
    >>> Aproj = f.prox(A, 0)
    >>> np.linalg.eig(Aproj)[0]
    array([0.        , 1.61803399])

    """
    def __init__(self, **kwargs):
        # Constructor takes keyword-only parameters to prevent user errors.
        super().__init__(**kwargs)

    def _prox(self, x, T):
        isreal = np.isreal(x).all()

        # 1. make it symmetric.
        sol = (x + np.conj(x.T)) / 2
        if isreal:
            # Drop the (zero) imaginary part so that the result is real.
            sol = np.real(sol)

        # 2. make it semi-positive.
        # The matrix is Hermitian by construction. The dedicated solver
        # returns real eigenvalues and orthonormal eigenvectors, which the
        # reconstruction below relies on, also for repeated eigenvalues.
        D, V = np.linalg.eigh(sol)
        D = np.clip(D, 0, np.inf)
        sol = V @ np.diag(D) @ np.conj(V.T)
        return sol


class proj_b2(proj):
    r"""
    Projection on the L2-ball (eval, prox).

    This function is the indicator function :math:`i_S(z)` of the set
    :math:`S= \left\{z \in \mathbb{R}^N \mid \|Az-y\|_2 \leq \epsilon \right\}`
    that is zero if :math:`z` is in the set and infinite otherwise.

    See generic attributes descriptions of the
    :class:`pyunlocbox.functions.proj` base class. Note that the constructor
    takes keyword-only parameters.

    Parameters
    ----------
    epsilon : float, optional
        The radius of the ball. Default is 1.
    method : {'FISTA', 'ISTA'}, optional
        The method used to solve the problem. It can be 'FISTA' or 'ISTA'.
        Default is 'FISTA'. Only used when `A` is not a tight frame.

    Notes
    -----
    * The `tol` parameter is defined as the tolerance for the projection on the
      L2-ball. The algorithm stops if :math:`\frac{\epsilon}{1+tol} \leq
      \|y-A(z)\|_2 \leq \frac{\epsilon}{1-tol}`.
    * The evaluation of this function is zero.
    * The L2-ball proximal operator evaluated at `x` is given by
      :math:`\operatorname{arg\,min}\limits_z \frac{1}{2} \|x-z\|_2^2 + i_S(z)`
      which has an identical solution as
      :math:`\operatorname{arg\,min}\limits_z \|x-z\|_2^2` such that
      :math:`\|A(z)-y\|_2 \leq \epsilon`. It is thus a projection of the vector
      `x` onto an L2-ball of radius `epsilon`.
    * When `A` is a tight frame the projection is computed in closed form,
      otherwise it is computed iteratively and stops after at most `maxit`
      iterations.

    See Also
    --------
    proj_lineq : use instead of ``epsilon=0``

    Examples
    --------
    >>> from pyunlocbox import functions
    >>> f = functions.proj_b2(y=[1, 1])
    >>> x = [3, 3]
    >>> f.eval(x)
    0
    >>> f.prox(x, 0)
    array([1.70710678, 1.70710678])

    """
    def __init__(self, epsilon=1, method='FISTA', **kwargs):
        # Constructor takes keyword-only parameters to prevent user errors.
        super().__init__(**kwargs)
        self.epsilon = epsilon
        self.method = method

    def _prox(self, x, T):

        crit = None  # Stopping criterion.
        niter = 0    # Number of iterations.

        # Tight frame.
        if self.tight:
            tmp1 = self.A(x) - self.y()
            with np.errstate(divide='ignore', invalid='ignore'):
                # Avoid 'division by zero' warning. The squared modulus makes
                # the norm correct for complex residuals too.
                scale = self.epsilon / np.sqrt(
                    np.sum(np.abs(tmp1)**2, axis=0))
            # Scaling. fmin ignores the NaN produced by 0 / 0 (epsilon = 0
            # and a null residual), in which case no scaling is needed.
            tmp2 = tmp1 * np.fmin(1, scale)
            sol = x + self.At(tmp2 - tmp1) / self.nu
            crit = 'TOL'

        # Non tight frame.
        else:

            # Initialization.
            sol = x
            u = np.zeros_like(self.y())
            if self.method == 'FISTA':
                v_last = u
                t_last = 1.
            elif self.method != 'ISTA':
                raise ValueError('The method should be either FISTA or ISTA.')

            # Tolerance around the L2-ball.
            epsilon_low = self.epsilon / (1. + self.tol)
            epsilon_up = self.epsilon / (1. - self.tol)

            # Check if we are already in the L2-ball.
            norm_res = np.linalg.norm(self.y() - self.A(sol), 2)
            if norm_res <= epsilon_up:
                crit = 'INBALL'

            # Projection onto the L2-ball
            while not crit:

                niter += 1

                # Residual.
                res = self.A(sol) - self.y()
                norm_res = np.linalg.norm(res, 2)

                if self.verbosity == 'HIGH':
                    print('    proj_b2 iteration {:3d}: epsilon = {:.2e}, '
                          '||y-A(z)||_2 = {:.2e}'.format(niter, self.epsilon,
                                                         norm_res))

                # Scaling for projection. Not done in place so that an
                # integer residual can be combined with a float variable.
                res = res + u * self.nu
                norm_proj = np.linalg.norm(res, 2)

                ratio = min(1, self.epsilon / norm_proj)
                v = 1. / self.nu * (res - res * ratio)

                if self.method == 'FISTA':
                    t = (1. + np.sqrt(1. + 4. * t_last**2.)) / 2.  # Time step.
                    u = v + (t_last - 1.) / t * (v - v_last)
                    v_last = v
                    t_last = t
                else:
                    u = v

                # Current estimation.
                sol = x - self.At(u)

                # Stopping criterion. It uses the norm of the residual
                # computed at the beginning of the iteration.
                if norm_res >= epsilon_low and norm_res <= epsilon_up:
                    crit = 'TOL'
                elif niter >= self.maxit:
                    crit = 'MAXIT'

            if self.verbosity in ['LOW', 'HIGH']:
                norm_res = np.linalg.norm(self.y() - self.A(sol), 2)
                print('    proj_b2: epsilon = {:.2e}, ||y-A(z)||_2 = {:.2e}, '
                      '{}, niter = {}'.format(self.epsilon, norm_res, crit,
                                              niter))

        return sol


class proj_lineq(proj):
    r"""
    Projection on the plane satisfying the linear equality Az = y (eval, prox).

    This function is the indicator function :math:`i_S(z)` of the set
    :math:`S = \left\{z \in \mathbb{R}^N \mid Az = y \right\}`
    that is zero if :math:`z` is in the set and infinite otherwise.

    The proximal operator is
    :math:`\operatorname{arg\,min}_z \| z - x \|_2 \text{ s.t. } Az = y`.

    See generic attributes descriptions of the
    :class:`pyunlocbox.functions.proj` base class. Note that the constructor
    takes keyword-only parameters.

    Parameters
    ----------
    A : callable or array_like, optional
        Linear operator of the constraint. It is forwarded unchanged to the
        :class:`pyunlocbox.functions.proj` constructor.
    pinvA : callable or array_like, optional
        Pseudo-inverse of `A`, either as a callable or as an object exposing a
        ``dot`` method (e.g. a numpy array). When omitted and `A` is a matrix,
        it is computed with :func:`numpy.linalg.pinv`.

    Raises
    ------
    ValueError
        If `A` is a callable and `pinvA` is not provided.

    Notes
    -----
    * A parameter `pinvA`, the pseudo-inverse of `A`, must be provided if the
      parameter `A` is provided as an operator/callable (not a matrix).
    * If neither `A` nor `pinvA` is given, `pinvA` defaults to the identity
      and a message is printed to warn the user.
    * The evaluation of this function is zero.

    See Also
    --------
    proj_b2 : quadratic case

    Examples
    --------
    >>> from pyunlocbox import functions
    >>> import numpy as np
    >>> x = np.array([0, 0])
    >>> A = np.array([[1, 1]])
    >>> pinvA = np.linalg.pinv(A)
    >>> y = np.array([1])
    >>> f = functions.proj_lineq(A=A, pinvA=pinvA, y=y)
    >>> sol = f.prox(x, 0)
    >>> sol
    array([0.5, 0.5])
    >>> np.abs(A.dot(sol) - y) < 1e-15
    array([ True])

    """
    def __init__(self, A=None, pinvA=None, **kwargs):
        # Constructor takes keyword-only parameters to prevent user errors.
        super(proj_lineq, self).__init__(A=A, **kwargs)

        if pinvA is not None:
            # User-supplied pseudo-inverse: keep callables as they are and
            # wrap matrices so that self.pinvA is always an operator.
            if callable(pinvA):
                self.pinvA = pinvA
            else:
                self.pinvA = lambda x: pinvA.dot(x)
        elif A is None:
            # Nothing was specified: fall back to the identity and warn.
            print("Are you sure about the parameters? "
                  "The projection will return y.")
            self.pinvA = lambda x: x
        elif callable(A):
            # The pseudo-inverse of an arbitrary operator cannot be derived.
            raise ValueError("Provide A as a numpy array or provide pinvA.")
        else:
            # Transform matrix form to operator form.
            self._pinvA = np.linalg.pinv(A)
            self.pinvA = lambda x: self._pinvA.dot(x)

    def _prox(self, x, T):
        # Applying the projection formula x - pinv(A) (A x - y).
        # (for now, only the non scalable version)
        # The step size T is unused: the projection does not depend on it.
        residue = self.A(x) - self.y()
        return x - self.pinvA(residue)


class structured_sparsity(func):
    r"""
    Structured sparsity (eval, prox).

    The structured sparsity term that is defined in the work of
    Jenatton et al. 2011 `Proximal methods for hierarchical sparse coding
    <https://hal.inria.fr/inria-00516723>`_.

    .. math:: \Omega(x) = \lambda \cdot \sum_{g \in G} w_g \cdot \|x_g\|_2

    See generic attributes descriptions of the
    :class:`pyunlocbox.functions.func` base class.

    Parameters
    ----------
    lambda_ : float, optional
        The scaling factor of the function that corresponds to :math:`\lambda`.
        Must be a non-negative number. Default is 1.
    groups : list of lists of integers, optional
        Each element encodes the indices of the vector belonging to a single
        group. Corresponds to :math:`G`. Default is a single empty group.
    weights : array_like, optional
        Weight associated to each group. Corresponds to :math:`w_g`. Must have
        the same length as :math:`G`. Default is a single zero weight.

    Raises
    ------
    ValueError
        If `lambda_` is negative or if `weights` and `groups` have different
        lengths.
    TypeError
        If `groups` is not a list.

    Notes
    -----
    The proximal operator processes the groups sequentially, in the order
    they are given, each group being shrunk by
    :math:`\lambda \cdot T \cdot w_g`. Each group sees the result of the
    groups processed before it.

    Examples
    --------
    >>> from pyunlocbox import functions
    >>> groups = [[0, 1], [3, 2, 4]]
    >>> weights = [2, 1]
    >>> f = functions.structured_sparsity(10, groups, weights)
    >>> x = [2, 2.5, -0.5, 0.3, 0.01]
    >>> f.eval(x)
    69.86305169905782
    >>> f.prox(x, 0.1)
    array([0.7506099 , 0.93826238, 0.        , 0.        , 0.        ])

    """

    def __init__(self, lambda_=1, groups=None, weights=None, **kwargs):
        super(structured_sparsity, self).__init__(**kwargs)

        if lambda_ < 0:
            raise ValueError('The scaling factor must be non-negative.')
        self.lambda_ = lambda_

        # None sentinels avoid sharing one mutable default list between all
        # instances; the effective defaults are unchanged.
        if groups is None:
            groups = [[]]
        if weights is None:
            weights = [0]

        if not isinstance(groups, list):
            raise TypeError('The groups must be defined as a list of lists.')
        self.groups = groups

        if len(weights) != len(groups):
            raise ValueError('Length of weights must be equal to number of '
                             'groups.')
        self.weights = weights

    def _eval(self, x):
        # Weighted sum of the L2-norms of the groups, scaled by lambda_.
        costs = [w * np.linalg.norm(x[g])
                 for g, w in zip(self.groups, self.weights)]
        return self.lambda_ * np.sum(costs)

    def _prox(self, x, T):
        gamma = self.lambda_ * T

        # Work on a copy so that the input is left untouched.
        v = np.array(x, copy=True, subok=True)
        if not np.issubdtype(v.dtype, np.inexact):
            # Integer (or boolean) data cannot hold the shrunk values and
            # would make the in-place update below fail; promote to float.
            v = v.astype(float)

        for g, w in zip(self.groups, self.weights):
            xn = np.linalg.norm(v[g])
            r = gamma * w
            if xn > r:
                # Group soft-thresholding: shrink the group norm by r.
                v[g] -= v[g] * r / xn
            else:
                # The whole group falls below the threshold.
                v[g] = 0
        return v