# Source code for deepinv.optim.fixed_point

import torch
import torch.nn as nn
import warnings
from tqdm import tqdm


class FixedPoint(nn.Module):
    r"""
    Fixed-point iterations module.

    This module implements the fixed-point iteration algorithm given a specific fixed-point iterator
    (e.g. proximal gradient iteration, the ADMM iteration, see :meth:`deepinv.optim.optim_iterators`),
    that is for :math:`k=1,2,...`

    .. math::
        \qquad (x_{k+1}, u_{k+1}) = \operatorname{FixedPoint}(x_k, u_k, f, g, A, y, ...) \hspace{2cm} (1)

    where :math:`f` is the data-fidelity term, :math:`g` is the prior, :math:`A` is the physics model,
    :math:`y` is the data.

    :Examples:

        This example shows how to use the :class:`FixedPoint` class to solve the problem
        :math:`\min_x 0.5*||Ax-y||_2^2 + \lambda*||x||_1` with the PGD algorithm, where A is the
        identity operator, :math:`\lambda = 1` and :math:`y = [2, 2]`.

        >>> import deepinv as dinv
        >>> # Create the measurement operator A
        >>> A = torch.tensor([[1, 0], [0, 1]], dtype=torch.float64)
        >>> A_forward = lambda v: A @ v
        >>> A_adjoint = lambda v: A.transpose(0, 1) @ v
        >>> # Define the physics model associated to this operator
        >>> physics = dinv.physics.LinearPhysics(A=A_forward, A_adjoint=A_adjoint)
        >>> # Define the measurement y
        >>> y = torch.tensor([2, 2], dtype=torch.float64)
        >>> # Define the data fidelity term
        >>> data_fidelity = dinv.optim.data_fidelity.L2()
        >>> # Define the prior term
        >>> prior = dinv.optim.prior.L1Prior()
        >>> # Define the parameters of the algorithm
        >>> params_algo = {"g_param": 1.0, "stepsize": 1.0, "lambda": 1.0, "beta": 1.0}
        >>> # Choose the iterator associated to the PGD algorithm
        >>> iterator = dinv.optim.optim_iterators.PGDIteration()
        >>> # Iterate the iterator
        >>> x_init = torch.tensor([2, 2], dtype=torch.float64)  # Define initialisation of the algorithm
        >>> X = {"est": (x_init ,), "cost": []}  # Iterates are stored in a dictionary of the form {'est': (x,z), 'cost': F}
        >>> max_iter = 50
        >>> for it in range(max_iter):
        ...     X = iterator(X, data_fidelity, prior, params_algo, y, physics)
        >>> # Return the solution
        >>> X["est"][0]
        tensor([1., 1.], dtype=torch.float64)

    :param deepinv.optim.optim_iterators.optim_iterator iterator: function that takes as input the current
        iterate, as well as parameters of the optimization problem (prior, measurements, etc.)
    :param function update_params_fn: function that returns the parameters to be used at each iteration.
        Called with the iteration index. Default: ``None``.
    :param function update_data_fidelity_fn: function that returns the data-fidelity term to be used at
        each iteration. Called with the iteration index. Default: ``None``.
    :param function update_prior_fn: function that returns the prior to be used at each iteration.
        Called with the iteration index. Default: ``None``.
    :param function init_iterate_fn: function that returns the initial iterate. Default: ``None``.
    :param function init_metrics_fn: function that returns the initial metrics. Default: ``None``.
    :param function update_metrics_fn: function called as ``update_metrics_fn(metrics, X_prev, X, x_gt=x_gt)``
        after each accepted iteration, returning the updated metrics. Default: ``None``.
    :param function check_iteration_fn: function that performs a check on the last iteration and returns a
        bool indicating if we can proceed to next iteration. Default: ``None``.
    :param function check_conv_fn: function that checks the convergence after each iteration, returns a bool
        indicating if convergence has been reached. Default: ``None``.
    :param int max_iter: maximum number of iterations. Default: ``50``.
    :param bool early_stop: if True, the algorithm stops when the convergence criterion is reached.
        Default: ``True``.
    :param bool anderson_acceleration: if True, the Anderson acceleration is used. Default: ``False``.
    :param int history_size: size of the history used for the Anderson acceleration. Default: ``5``.
    :param float beta_anderson_acc: momentum of the Anderson acceleration step. Default: ``1.0``.
    :param float eps_anderson_acc: regularization parameter of the Anderson acceleration step.
        Default: ``1e-4``.
    :param bool verbose: the progress bar is only shown when both ``verbose`` and ``show_progress_bar``
        are ``True``. Default: ``False``.
    :param bool show_progress_bar: the progress bar is only shown when both ``verbose`` and
        ``show_progress_bar`` are ``True``. Default: ``False``.
    """

    def __init__(
        self,
        iterator=None,
        update_params_fn=None,
        update_data_fidelity_fn=None,
        update_prior_fn=None,
        init_iterate_fn=None,
        init_metrics_fn=None,
        update_metrics_fn=None,
        check_iteration_fn=None,
        check_conv_fn=None,
        max_iter=50,
        early_stop=True,
        anderson_acceleration=False,
        history_size=5,
        beta_anderson_acc=1.0,
        eps_anderson_acc=1e-4,
        verbose=False,
        show_progress_bar=False,
    ):
        super().__init__()
        self.iterator = iterator
        self.max_iter = max_iter
        self.early_stop = early_stop
        self.update_params_fn = update_params_fn
        self.update_data_fidelity_fn = update_data_fidelity_fn
        self.update_prior_fn = update_prior_fn
        self.init_iterate_fn = init_iterate_fn
        self.init_metrics_fn = init_metrics_fn
        self.update_metrics_fn = update_metrics_fn
        self.check_conv_fn = check_conv_fn
        self.check_iteration_fn = check_iteration_fn
        self.anderson_acceleration = anderson_acceleration
        self.history_size = history_size
        self.beta_anderson_acc = beta_anderson_acc
        self.eps_anderson_acc = eps_anderson_acc
        self.verbose = verbose
        self.show_progress_bar = show_progress_bar

        # Early stopping is meaningless without a convergence criterion:
        # warn the user and fall back to running all ``max_iter`` iterations.
        if self.check_conv_fn is None and self.early_stop:
            warnings.warn(
                "early_stop is set to True but no check_conv_fn has been defined."
            )
            self.early_stop = False

    def init_anderson_acceleration(self, X):
        r"""
        Initialize the Anderson acceleration algorithm.

        Code inspired from `this tutorial <http://implicit-layers-tutorial.org/deep_equilibrium_models/>`_.

        The primal iterate ``X["est"][0]`` is treated as batch-first; all trailing dimensions are
        flattened, so iterates of any rank (not only 4D images) are supported.

        :param dict X: initial iterate.
        :return: tuple ``(x_hist, T_hist, H, q)`` of zero-initialised buffers, with the constant
            entries of the linear system ``H p = q`` already filled in.
        """
        x = X["est"][0]
        b = x.shape[0]
        # Same flattening as in ``anderson_acceleration_step``, so both always agree on the width.
        n = x.reshape(b, -1).shape[1]
        x_hist = torch.zeros(
            b, self.history_size, n, dtype=x.dtype, device=x.device
        )  # history of iterates.
        T_hist = torch.zeros(
            b, self.history_size, n, dtype=x.dtype, device=x.device
        )  # history of T(x_k) with T the fixed point operator.
        H = torch.zeros(
            b,
            self.history_size + 1,
            self.history_size + 1,
            dtype=x.dtype,
            device=x.device,
        )  # H in the Anderson acceleration linear system Hp = q .
        # First row / column (except the corner) are ones: they encode the
        # constraint that the combination weights sum to one.
        H[:, 0, 1:] = H[:, 1:, 0] = 1.0
        q = torch.zeros(
            b, self.history_size + 1, 1, dtype=x.dtype, device=x.device
        )  # q in the Anderson acceleration linear system Hp = q .
        q[:, 0] = 1
        return x_hist, T_hist, H, q

    def anderson_acceleration_step(
        self,
        it,
        X_prev,
        TX_prev,
        x_hist,
        T_hist,
        H,
        q,
        cur_data_fidelity,
        cur_prior,
        cur_params,
        *args,
    ):
        r"""
        Anderson acceleration step.

        Code inspired from `this tutorial <http://implicit-layers-tutorial.org/deep_equilibrium_models/>`_.

        The buffers ``x_hist``, ``T_hist`` and ``H`` are updated in place.

        :param int it: current iteration.
        :param dict X_prev: previous iterate.
        :param dict TX_prev: output of the fixed-point operator evaluated at X_prev
        :param torch.Tensor x_hist: history of last ``history_size`` iterates.
        :param torch.Tensor T_hist: history of T evaluation at the last ``history_size`` iterates,
            where T is the fixed-point operator.
        :param torch.Tensor H: H in the Anderson acceleration linear system Hp = q .
        :param torch.Tensor q: q in the Anderson acceleration linear system Hp = q .
        :param deepinv.optim.DataFidelity cur_data_fidelity: Instance of the DataFidelity class defining the
            current data_fidelity.
        :param deepinv.optim.prior cur_prior: Instance of the Prior class defining the current prior.
        :param dict cur_params: Dictionary containing the current parameters of the algorithm.
        :param args: arguments for the iterator.
        :return: dict ``{"est": ..., "cost": ...}`` where the first entry of ``est`` is the accelerated
            iterate (remaining entries are taken from ``TX_prev``) and ``cost`` is ``F_fn`` evaluated at
            it when the iterator has a cost, ``None`` otherwise.
        """
        x_prev = X_prev["est"][0]  # previous iterate x
        Tx_prev = TX_prev["est"][0]  # fixed-point operator output T(x)
        b = x_prev.shape[0]  # batchsize

        # The history buffers are circular: slot ``it % history_size`` is overwritten.
        slot = it % self.history_size
        x_hist[:, slot] = x_prev.reshape(b, -1)  # prepare history of x
        T_hist[:, slot] = Tx_prev.reshape(b, -1)  # prepare history of Tx

        m = min(it + 1, self.history_size)  # number of valid history entries
        G = T_hist[:, :m] - x_hist[:, :m]  # residuals T(x_i) - x_i
        H[:, 1 : m + 1, 1 : m + 1] = (
            torch.bmm(G, G.transpose(1, 2))
            + self.eps_anderson_acc
            * torch.eye(m, dtype=Tx_prev.dtype, device=Tx_prev.device)[None]
        )
        p = torch.linalg.solve(H[:, : m + 1, : m + 1], q[:, : m + 1])[
            :, 1 : m + 1, 0
        ]  # solve the linear system H p = q.
        x = (
            self.beta_anderson_acc * (p[:, None] @ T_hist[:, :m])[:, 0]
            + (1 - self.beta_anderson_acc) * (p[:, None] @ x_hist[:, :m])[:, 0]
        )  # Anderson acceleration step.
        # ``reshape`` rather than ``view``: does not depend on the memory layout of ``x``.
        x = x.reshape(x_prev.shape)
        F = (
            self.iterator.F_fn(x, cur_data_fidelity, cur_prior, cur_params, *args)
            if self.iterator.has_cost
            else None
        )
        est = list(TX_prev["est"])
        est[0] = x
        return {"est": est, "cost": F}

    def forward(self, *args, compute_metrics=False, x_gt=None, **kwargs):
        r"""
        Loops over the fixed-point iterator as (1) and returns the fixed point.

        The iterates are stored in a dictionary of the form ``X = {'est': (x_k, u_k), 'cost': F_k}`` where:

        * ``est`` is a tuple containing the current primal and auxiliary iterates,
        * ``cost`` is the value of the cost function at the current iterate.

        Since the prior and parameters (stepsize, regularisation parameter, etc.) can change at each
        iteration, the prior and parameters are updated before each call to the iterator.

        Metrics are only updated, and convergence only checked, for iterations accepted by
        ``check_iteration_fn``. Metrics returned by ``init_metrics_fn`` are kept as they are when no
        ``update_metrics_fn`` is provided.

        :param bool compute_metrics: if ``True``, the metrics are computed along the iterations.
            Default: ``False``.
        :param torch.Tensor x_gt: ground truth solution. Default: ``None``.
        :param args: optional arguments for the iterator. Commonly (y,physics) where ``y`` (torch.Tensor y)
            is the measurement and ``physics`` (deepinv.physics) is the physics model.
        :param kwargs: optional keyword arguments for the iterator.
        :return tuple: ``(x,metrics)`` with ``x`` the fixed-point solution (dict) and ``metrics`` the metrics
            computed along the iterations if ``compute_metrics`` is ``True`` or ``None`` otherwise.
        """
        X = (
            self.init_iterate_fn(*args, F_fn=self.iterator.F_fn)
            if self.init_iterate_fn
            else None
        )
        metrics = (
            self.init_metrics_fn(X, x_gt=x_gt)
            if self.init_metrics_fn and compute_metrics
            else None
        )
        self.check_iteration = True

        if self.anderson_acceleration:
            self.x_hist, self.T_hist, self.H, self.q = self.init_anderson_acceleration(
                X
            )

        for it in tqdm(
            range(self.max_iter),
            disable=(not self.verbose or not self.show_progress_bar),
        ):
            X_prev = X
            X = self.single_iteration(X, it, *args, **kwargs)

            # A rejected iteration leaves X unchanged: neither record metrics
            # nor test convergence on it (X == X_prev would look converged).
            if not self.check_iteration:
                continue

            if self.update_metrics_fn and compute_metrics:
                metrics = self.update_metrics_fn(metrics, X_prev, X, x_gt=x_gt)

            if (
                self.early_stop
                and self.check_conv_fn is not None
                and it > 1
                and self.check_conv_fn(it, X_prev, X)
            ):
                break

        return X, metrics

    def single_iteration(self, X, it, *args, **kwargs):
        r"""
        Performs one fixed-point iteration, optionally followed by an Anderson acceleration step.

        The result of ``check_iteration_fn`` (``True`` when it is not provided) is stored in
        ``self.check_iteration``.

        :param dict X: current iterate.
        :param int it: iteration index, passed to the ``update_*_fn`` callbacks.
        :param args: optional arguments for the iterator.
        :param kwargs: optional keyword arguments for the iterator.
        :return: the new iterate if the iteration is accepted, the unchanged input iterate otherwise.
        """
        cur_params = self.update_params_fn(it) if self.update_params_fn else None
        cur_data_fidelity = (
            self.update_data_fidelity_fn(it) if self.update_data_fidelity_fn else None
        )
        cur_prior = self.update_prior_fn(it) if self.update_prior_fn else None

        X_prev = X
        X = self.iterator(
            X_prev, cur_data_fidelity, cur_prior, cur_params, *args, **kwargs
        )
        if self.anderson_acceleration:
            X = self.anderson_acceleration_step(
                it,
                X_prev,
                X,
                self.x_hist,
                self.T_hist,
                self.H,
                self.q,
                cur_data_fidelity,
                cur_prior,
                cur_params,
                *args,
            )
        self.check_iteration = (
            self.check_iteration_fn(X_prev, X) if self.check_iteration_fn else True
        )
        return X if self.check_iteration else X_prev