Source code for pathsim.optim.anderson

########################################################################################
##
##                               ANDERSON ACCELERATION 
##                                (optim/anderson.py)
##
########################################################################################

# IMPORTS ==============================================================================

import numpy as np

from collections import deque

from scipy.linalg import lu_factor, lu_solve

from .numerical import num_jac

from .._constants import (
    TOLERANCE,
    OPT_RESTART,
    OPT_HISTORY,
    SOL_TOLERANCE_FPI,
    SOL_ITERATIONS_MAX
    )


# CLASS ================================================================================


[docs]
class Anderson:
    """Anderson acceleration for fixed-point iteration.

    Solves nonlinear equations in fixed-point form :math:`x = g(x)` by
    computing the next iterate as a linear combination of previous iterates
    whose coefficients minimise the least-squares residual.

    .. math::

        x_{k+1} = \\sum_{i=0}^{m_k} \\alpha_i^{(k)}\\, g(x_{k-m_k+i})
        \\quad\\text{with}\\quad
        \\alpha^{(k)} = \\arg\\min \\bigl\\|\\sum_i \\alpha_i\\, r_{k-m_k+i}\\bigr\\|

    where :math:`r_k = g(x_k) - x_k` and :math:`m_k \\le m` is the current
    buffer depth.

    In PathSim this class is the inner fixed-point solver used by the
    simulation engine to resolve algebraic loops (cycles in the block
    diagram). Each loop-closing ``ConnectionBooster`` owns an ``Anderson``
    instance that accelerates convergence of the fixed-point iteration
    over the loop. The buffer depth ``m`` controls how many previous
    iterates are retained; larger values improve convergence on difficult
    loops at the cost of a small least-squares solve per iteration.

    Parameters
    ----------
    m : int
        buffer depth (number of stored iterates)
    restart : bool
        if True, clear the buffer once it reaches depth ``m``

    References
    ----------
    .. [1] Anderson, D. G. (1965). "Iterative Procedures for Nonlinear
           Integral Equations". Journal of the ACM, 12(4), 547--560.
           :doi:`10.1145/321296.321305`
    .. [2] Walker, H. F., & Ni, P. (2011). "Anderson Acceleration for
           Fixed-Point Iterations". SIAM Journal on Numerical Analysis,
           49(4), 1715--1735. :doi:`10.1137/10078356X`
    """

    def __init__(self, m=OPT_HISTORY, restart=OPT_RESTART):

        #length of buffer for next estimate
        self.m = m

        #restart after buffer length is reached?
        self.restart = restart

        #rolling difference buffers
        self.dx_buffer = deque(maxlen=self.m)
        self.dr_buffer = deque(maxlen=self.m)

        #prvious values
        self.x_prev = None
        self.r_prev = None


    def __bool__(self):
        return True


    def __len__(self):
        return len(self.dx_buffer[0]) if self.dx_buffer else 0



[docs]
    def solve(self, func, x0, iterations_max=100, tolerance=1e-6):
        """Solve the function 'func' with initial 
        value 'x0' up to a certain tolerance.

        Note
        ----
        This method is for testing purposes only and 
        not used in the simulation loop.
        
        Parameters
        ----------
        func : callable
            function to solve
        x0 : numeric
            starting value for solution
        iterations_max : int
            maximum number of solver iterations
        tolerance : float
            convergence condition

        Returns
        -------
        x : numeric
            solution
        res : float
            residual
        i : int
            iteration count
        """

        _x = x0.copy()
        for i in range(iterations_max):
            _x, _res = self.step(_x, func(_x)+_x)
            if _res < tolerance:
                return _x, _res, i

        raise RuntimeError(f"did not converge in {iterations_max} steps")




[docs]
    def reset(self):
        """reset the anderson accelerator"""

        #clear difference buffers
        self.dx_buffer.clear()
        self.dr_buffer.clear()

        #clear previous values
        self.x_prev = None
        self.r_prev = None




[docs]
    def step(self, x, g):
        """Perform one iteration on the fixed-point solution.
    
        Parameters
        ----------
        x : float, array
            current solution
        g : float, array
            current evaluation of g(x)
        
        Returns
        -------
        x : float, array
            new solution
        res : float
            residual norm, fixed point error
        """

        #make numeric if value
        _x = np.asarray(x).flatten()
        _g = np.asarray(g).flatten()

        #residual (this gets minimized)
        _res = _g - _x
        
        #fallback to regular fpi if 'm == 0'
        if self.m == 0:
            return _g, np.linalg.norm(_res)
    
        #if no buffer, regular fixed-point update
        if self.x_prev is None:

            #save values for next iteration
            self.x_prev = _x
            self.r_prev = _res

            return _g, np.linalg.norm(_res)

        #append to difference buffer
        self.dx_buffer.append(_x - self.x_prev)
        self.dr_buffer.append(_res - self.r_prev)
        
        #save values for next iteration
        self.x_prev = _x
        self.r_prev = _res

        #if buffer size 'm' reached, restart
        if self.restart and len(self.dx_buffer) >= self.m:
            self.reset()
            return _g, np.linalg.norm(_res)

        #get difference matrices 
        dX = np.vstack(self.dx_buffer)
        dR = np.vstack(self.dr_buffer)

        #exit for scalar values (size-1 arrays after flatten)
        if _res.size == 1:

            #flatten to 1D for dot products
            dR_flat = dR.flatten()
            dX_flat = dX.flatten()

            #delta squared norm
            dR2 = np.dot(dR_flat, dR_flat)

            #catch division by zero
            if dR2 <= TOLERANCE:
                return _g, abs(_res[0])

            #new solution and residual
            return _x - _res[0] * np.dot(dR_flat, dX_flat) / dR2, abs(_res[0])

        #compute coefficients from least squares problem
        C, *_ = np.linalg.lstsq(dR.T, _res, rcond=None)

        #new solution and residual norm
        return _x - C @ dX, np.linalg.norm(_res)






[docs]
class NewtonAnderson(Anderson):
    """Hybrid Newton--Anderson fixed-point solver.

    Extends :class:`Anderson` by prepending a Newton step when a Jacobian
    of :math:`g` is available.  The Newton step

    .. math::

        \\tilde{x} = x - (J_g - I)^{-1}\\,(g(x) - x)

    provides a quadratically convergent initial correction; the subsequent
    Anderson mixing step then stabilises the iteration and damps
    oscillations.

    In PathSim this solver is used inside every implicit ODE integration
    engine (BDF, DIRK, ESDIRK).  When a block provides a local Jacobian
    (e.g. ``ODE`` or ``LTI`` blocks), the Newton pre-step yields much
    faster convergence of the implicit update equation, reducing the
    number of fixed-point iterations per timestep.  Without a Jacobian the
    solver falls back to pure Anderson acceleration.

    References
    ----------
    .. [1] Anderson, D. G. (1965). "Iterative Procedures for Nonlinear
           Integral Equations". Journal of the ACM, 12(4), 547--560.
           :doi:`10.1145/321296.321305`
    .. [2] Walker, H. F., & Ni, P. (2011). "Anderson Acceleration for
           Fixed-Point Iterations". SIAM Journal on Numerical Analysis,
           49(4), 1715--1735. :doi:`10.1137/10078356X`
    """

    def __init__(self, m=OPT_HISTORY, restart=OPT_RESTART):
        super().__init__(m, restart)

        #cached LU factorization of the Newton matrix and the matrix it
        #factorizes, reused across iterations / stages while it is unchanged
        self._lu = None
        self._A = None



[docs]
    def reset(self):
        """Reset the anderson accelerator and the cached Newton factorization"""
        super().reset()
        self._lu = None
        self._A = None




[docs]
    def solve(self, func, x0, jac=None, iterations_max=100, tolerance=1e-6):
        """Solve the function 'func' with initial value 
        'x0' up to a certain tolerance.

        Parameters
        ----------
        func : callable
            function to solve
        x0 : numeric
            starting value for solution
        jac : callable
            jacobian of 'func'
        iterations_max : int
            maximum number of solver iterations
        tolerance : float
            convergence condition

        Note
        ----
        This method is for testing purposes only and 
        not used in the simulation loop.

        Returns
        -------
        x : numeric
            solution
        res : float
            residual
        i : int
            iteration count
        """

        _x = x0.copy()
        for i in range(iterations_max):
            _x, _res = self.step(_x, func(_x)+_x, None if jac is None else jac(_x))
            if _res < tolerance:
                return _x, _res, i

        raise RuntimeError(f"did not converge in {iterations_max} steps")



    def _newton(self, x, g, jac):
        """Newton step on solution, where 'f=g-x' is the 
        residual and 'jac' is the jacobian of 'g'.

        Parameters
        ----------
        x : float, array
            current solution
        g : float, array
            current evaluation of g(x)
        jac : array
            evaluation of jacobian of 'g'

        Returns
        -------
        x : float, array
            new solution
        res : float
            residual norm
        """

        #preprocess formats
        _x = np.asarray(x).flatten()
        _g = np.asarray(g).flatten()

        _jac = np.asarray(jac)

        #compute residual
        _res = _g - _x

        #early exit for scalar or purely vectorial values
        if _res.size == 1 or np.ndim(_jac) == 1:
            
            return _x - _res / (_jac - 1.0), np.linalg.norm(_res)

        #vectorial values (newton raphson), Newton matrix 'jac - I'
        _A = _jac - np.eye(len(_res))

        #reuse the cached factorization while the Newton matrix is unchanged
        #(constant jacobian across iterations / stages), refactor otherwise
        if self._A is not None and _A.shape == self._A.shape \
            and np.array_equal(_A, self._A):
            _lu = self._lu
        else:
            _lu = lu_factor(_A)
            self._A, self._lu = _A.copy(), _lu

        return _x - lu_solve(_lu, _res), np.linalg.norm(_res)



[docs]
    def step(self, x, g, jac=None):
        """Perform one iteration on the fixed-point solution. 
        
        If the jacobian of g 'jac' is provided, a newton step 
        is performed previous to anderson acceleration.
            
        Parameters
        ----------
        x : float, array
            current solution
        g : float, array
            current evaluation of g(x)
        jac : array
            evaluation of jacobian of 'g'

        Returns
        -------
        x : float, array
            new solution
        res : float
            residual norm
        """

        #newton step if jacobian available
        if jac is None: 

            #regular anderson step with residual
            return super().step(x, g)
        else: 
            #newton step with residual
            _x, res_norm = self._newton(x, g, jac)

            #anderson step with no residual
            y, _ = super().step(_x, g)

            return y, res_norm





# ROOT SOLVING ========================================================================

def _inf_norm(residual, x):
    """Infinity norm of the residual at 'x'."""
    return np.linalg.norm(np.atleast_1d(residual(x)), np.inf)



[docs]
def solve_root(opt, residual, x0, jac=None,
               tolerance=SOL_TOLERANCE_FPI, iterations_max=SOL_ITERATIONS_MAX,
               line_search_max=20):
    """Solve the square nonlinear system :math:`F(x) = 0` by Anderson accelerated
    damped Newton iteration.

    Each iteration takes a Newton direction :math:`\\Delta x = J^{-1} F`,
    damps it with a backtracking line search on the residual norm so the step
    stays in the basin of the current root, and then accelerates the resulting
    iterate with the Anderson optimizer

    .. math::

        \\tilde{x}_{k+1} = x_k - \\alpha_k J^{-1} F(x_k), \\qquad
        x_{k+1} = \\mathrm{Anderson}(x_k, \\tilde{x}_{k+1})


    The Anderson step is applied to the (damped) Newton iterate rather than to
    the raw fixed-point map :math:`x + F(x)`, so the first iterate is already a
    proper Newton step and cold starts do not jump out of the root's basin. The
    accelerated iterate is kept only if it does not increase the residual,
    otherwise the plain Newton iterate is used, which makes the acceleration
    safe. The optimizer instance is the same Newton-Anderson type the implicit
    engines use, so the algebraic solves stay consistent with the solver stack.

    The optimizer is reset before the iteration; the initial value doubles as
    the warm-start.

    Parameters
    ----------
    opt : Anderson | NewtonAnderson
        Anderson optimizer instance used to accelerate the Newton iterates
    residual : callable
        residual function 'F(x)' of the square system
    x0 : float, array[float]
        initial value / warm-start for the solution
    jac : callable, None
        optional analytical Jacobian of 'residual', central finite differences
        are used as a fallback if 'None'
    tolerance : float
        convergence tolerance on the residual norm
    iterations_max : int
        maximum number of iterations
    line_search_max : int
        maximum number of backtracking line search steps per iteration

    Returns
    -------
    x : array[float]
        converged solution
    res : float
        residual norm at the last iteration
    iterations : int
        number of iterations used
    """

    #fresh optimizer state for this solve
    opt.reset()

    #working solution as a flat float array (warm-start from 'x0')
    _x = np.atleast_1d(x0).astype(float)
    _res, i = _inf_norm(residual, _x), 0

    for i in range(iterations_max):

        #converged -> early exit
        if _res < tolerance:
            break

        #newton direction (least squares fallback if the jacobian is singular)
        _F = np.atleast_1d(residual(_x))
        _J = np.atleast_2d(jac(_x) if jac is not None else num_jac(residual, _x))
        try:
            _dx = np.linalg.solve(_J, _F)
        except np.linalg.LinAlgError:
            _dx, *_ = np.linalg.lstsq(_J, _F, rcond=None)

        #backtracking line search keeps the step in the basin of the root
        _a, _xn, _rn = 1.0, _x - _dx, _inf_norm(residual, _x - _dx)
        for _ in range(line_search_max):
            _cand = _x - _a * _dx
            _rc = _inf_norm(residual, _cand)
            if _rc < (1.0 - 1e-4 * _a) * _res:
                _xn, _rn = _cand, _rc
                break
            _a *= 0.5

        #anderson acceleration of the damped newton iterate, kept only if it
        #does not increase the residual (safeguard against overshoot)
        _xa = np.atleast_1d(opt.step(_x, _xn)[0]).flatten()
        if _inf_norm(residual, _xa) <= _rn:
            _x, _res = _xa, _inf_norm(residual, _xa)
        else:
            _x, _res = _xn, _rn

    return _x, _res, i