PANOC-ALM/Doxygen/panoc-helpers_8hpp_source.html

#pragma once


#include <panoc-alm/inner/decl/panoc-stop-crit.hpp>

#include <panoc-alm/util/atomic_stop_signal.hpp>

#include <panoc-alm/util/problem.hpp>

#include <panoc-alm/util/solverstatus.hpp>


#include <stdexcept>


namespace pa::detail {


/// Calculate both ψ(x) and the vector ŷ that can later be used to compute ∇ψ.
///
/// With ζ = g(x) + Σ⁻¹y and d = ζ - Π(ζ, D), this evaluates
/// ψ(x) = f(x) + ½ dᵀΣd and stores ŷ = Σd.
///
/// @param p  Problem providing `f`, `g`, the constraint set `D` and the
///           number of constraints `m`.
/// @param x  Point at which ψ is evaluated.
/// @param y  Vector added to g(x) after scaling by Σ⁻¹.
/// @param Σ  Diagonal weights, passed as a vector.
/// @param ŷ  Output: overwritten by Σd. Left untouched when `p.m == 0`.
/// @return   ψ(x); simply f(x) when `p.m == 0`.
inline real_t calc_ψ_ŷ(const Problem &p, crvec x, crvec y, crvec Σ, rvec ŷ) {
    // Without general constraints, ψ reduces to the objective itself
    if (p.m == 0) /* [[unlikely]] */
        return p.f(x);

    // ŷ ← g(x)
    p.g(x, ŷ);
    // ŷ ← ζ = g(x) + Σ⁻¹y
    ŷ += Σ.asDiagonal().inverse() * y;
    // ŷ ← d = ζ - Π(ζ, D)
    ŷ = projecting_difference(ŷ, p.D);

    // Accumulate dᵀΣd while overwriting d by ŷ = Σd, one element at a time
    real_t quad_term = 0;
    for (unsigned i = 0; i < p.m; ++i) { // TODO: vectorize
        const real_t d_i = ŷ(i);
        const real_t σ_i = Σ(i);
        quad_term += d_i * σ_i * d_i;
        ŷ(i) = σ_i * d_i;
    }

    // ψ(x) = f(x) + ½ dᵀŷ
    return p.f(x) + 0.5 * quad_term;
}


/// Calculate ∇ψ(x) using ŷ: ∇ψ = ∇f(x) + ∇g(x) ŷ.
///
/// @param p       Problem providing `grad_f`, `grad_g_prod` and `m`.
/// @param x       Point at which the gradient is evaluated.
/// @param ŷ       Vector multiplied by ∇g(x); only used when `p.m != 0`.
/// @param grad_ψ  Output: receives ∇ψ(x).
/// @param work_n  Scratch vector that receives ∇g(x) ŷ; only written when
///                `p.m != 0`.
inline void calc_grad_ψ_from_ŷ(const Problem &p, crvec x, crvec ŷ,
                               rvec grad_ψ, rvec work_n) {
    // Start from the gradient of the objective
    p.grad_f(x, grad_ψ);

    // Nothing to add when there are no general constraints
    if (p.m == 0) /* [[unlikely]] */
        return;

    // Add the constraint contribution ∇g(x) ŷ
    p.grad_g_prod(x, ŷ, work_n);
    grad_ψ += work_n;
}


/// Calculate both ψ(x) and its gradient ∇ψ(x).
///
/// @param p       Problem description.
/// @param x       Point at which ψ and ∇ψ are evaluated.
/// @param y       Forwarded to `calc_ψ_ŷ`.
/// @param Σ       Forwarded to `calc_ψ_ŷ`.
/// @param grad_ψ  Output: receives ∇ψ(x).
/// @param work_n  Scratch vector handed to `calc_grad_ψ_from_ŷ`.
/// @param work_m  Scratch vector that carries ŷ between the two calls.
/// @return        ψ(x).
inline real_t calc_ψ_grad_ψ(const Problem &p, crvec x, crvec y, crvec Σ,
                            rvec grad_ψ, rvec work_n, rvec work_m) {
    // First pass: ψ(x) = f(x) + ½ dᵀŷ, leaving ŷ in work_m
    const real_t ψ = calc_ψ_ŷ(p, x, y, Σ, /* in ⟹ out */ work_m);
    // Second pass: ∇ψ = ∇f(x) + ∇g(x) ŷ, reusing the ŷ in work_m
    calc_grad_ψ_from_ŷ(p, x, work_m, /* in ⟹ out */ grad_ψ, work_n);
    return ψ;
}


inline void calc_grad_ψ(const Problem &p,

                        crvec x,

                        crvec y,

                        crvec Σ,

                        rvec grad_ψ,

                        rvec work_n,

                        rvec work_m

) {

    if (p.m == 0) /* [[unlikely]] */

        return p.grad_f(x, grad_ψ);


    // g(x)

    p.g(x, work_m);

    // ζ = g(x) + Σ⁻¹y

    work_m += (y.array() / Σ.array()).matrix();

    // d = ζ - Π(ζ, D)

    work_m = projecting_difference(work_m, p.D);

    // ŷ = Σ d

    work_m = Σ.asDiagonal() * work_m;


    // ∇ψ = ∇f(x) + ∇g(x) ŷ

    p.grad_f(x, grad_ψ);

    p.grad_g_prod(x, work_m, work_n);

    grad_ψ += work_n;

}


/// Calculate the error between ẑ and g(x̂), with ẑ = Π(g(x̂) + Σ⁻¹y, D).
///
/// @param p      Problem providing `g` and the constraint set `D`.
/// @param x̂      Point at which the constraints are evaluated.
/// @param y      Vector added to g(x̂) after scaling by Σ⁻¹.
/// @param Σ      Diagonal weights, passed as a vector.
/// @param err_z  Output: receives g(x̂) - ẑ.
inline void calc_err_z(const Problem &p, crvec x̂, crvec y, crvec Σ,
                       rvec err_z) {
    // err_z ← g(x̂)
    p.g(x̂, err_z);
    // ζ = g(x̂) + Σ⁻¹y,  ẑ = Π(ζ, D),  err_z ← g(x̂) - ẑ
    // TODO: catastrophic cancellation?
    err_z -= project(err_z + Σ.asDiagonal().inverse() * y, p.D);
}


inline auto

projected_gradient_step(const Box &C,

                        real_t γ,

                        crvec x,

                        crvec grad_ψ

) {

    using binary_real_f = real_t (*)(real_t, real_t);

    return (-γ * grad_ψ)

        .binaryExpr(C.lowerbound - x, binary_real_f(std::fmax))

        .binaryExpr(C.upperbound - x, binary_real_f(std::fmin));

}


/// Compute the projected gradient step p and the resulting point x̂ = x + p.
///
/// @param prob    Problem whose box `C` the step is projected onto.
/// @param γ       Step size.
/// @param x       Current point.
/// @param grad_ψ  Gradient at x.
/// @param x̂       Output: x + p.
/// @param p       Output: the projected gradient step.
inline void calc_x̂(const Problem &prob, real_t γ, crvec x, crvec grad_ψ,
                   rvec x̂, rvec p) {
    // Evaluate the lazy step expression straight into p ...
    p = projected_gradient_step(prob.C, γ, x, grad_ψ);
    // ... and apply it to the current point
    x̂ = x + p;
}


/// Tell whether `calc_error_stop_crit` reads its `grad_̂ψₖ` argument for the
/// given stopping criterion.
///
/// @param crit  Stopping criterion to query.
/// @return      `true` for ApproxKKT, ApproxKKT2 and Ipopt, `false` for all
///              other enumerators.
/// @throws std::out_of_range if `crit` is not a valid enumerator.
inline bool stop_crit_requires_grad_̂ψₖ(PANOCStopCrit crit) {
    switch (crit) {
        // Criteria whose error formula contains grad_̂ψₖ
        case PANOCStopCrit::ApproxKKT:
        case PANOCStopCrit::ApproxKKT2:
        case PANOCStopCrit::Ipopt: return true;
        // Criteria that only need pₖ, γ and/or grad_ψₖ
        case PANOCStopCrit::ProjGradNorm:
        case PANOCStopCrit::ProjGradNorm2:
        case PANOCStopCrit::ProjGradUnitNorm:
        case PANOCStopCrit::ProjGradUnitNorm2:
        case PANOCStopCrit::FPRNorm:
        case PANOCStopCrit::FPRNorm2: return false;
    }
    throw std::out_of_range("Invalid PANOCStopCrit");
}


/// Compute the ε from the stopping criterion, see PANOCStopCrit.
///
/// @param C         Box used by the projected-gradient based criteria.
/// @param crit      Stopping criterion to evaluate.
/// @param pₖ        Step vector.
/// @param γ         Step size.
/// @param xₖ        Current iterate.
/// @param x̂ₖ        Second point; only read by the Ipopt criterion.
/// @param ŷₖ        Multiplier vector; only read by the Ipopt criterion.
/// @param grad_ψₖ   Gradient associated with xₖ.
/// @param grad_̂ψₖ   Gradient associated with x̂ₖ; only read by the
///                  ApproxKKT, ApproxKKT2 and Ipopt criteria.
/// @return          The error measure for the selected criterion.
/// @throws std::out_of_range if `crit` is not a valid enumerator.
inline real_t calc_error_stop_crit(const Box &C, PANOCStopCrit crit, crvec pₖ,
                                   real_t γ, crvec xₖ, crvec x̂ₖ, crvec ŷₖ,
                                   crvec grad_ψₖ, crvec grad_̂ψₖ) {
    switch (crit) {
        case PANOCStopCrit::ApproxKKT:
        case PANOCStopCrit::ApproxKKT2: {
            // The parentheses around (1 / γ) and around the gradient
            // difference are important to prevent catastrophic cancellation
            // when the step is small
            auto kkt_residual = (1 / γ) * pₖ + (grad_ψₖ - grad_̂ψₖ);
            return crit == PANOCStopCrit::ApproxKKT
                       ? vec_util::norm_inf(kkt_residual)
                       : kkt_residual.norm();
        }
        case PANOCStopCrit::ProjGradNorm:
        case PANOCStopCrit::ProjGradNorm2: {
            return crit == PANOCStopCrit::ProjGradNorm
                       ? vec_util::norm_inf(pₖ)
                       : pₖ.norm();
        }
        case PANOCStopCrit::ProjGradUnitNorm:
        case PANOCStopCrit::ProjGradUnitNorm2: {
            // The lazy step expression is consumed within the same full
            // expression as the call that creates it
            return crit == PANOCStopCrit::ProjGradUnitNorm
                       ? vec_util::norm_inf(
                             projected_gradient_step(C, 1, xₖ, grad_ψₖ))
                       : projected_gradient_step(C, 1, xₖ, grad_ψₖ).norm();
        }
        case PANOCStopCrit::FPRNorm:
        case PANOCStopCrit::FPRNorm2: {
            return crit == PANOCStopCrit::FPRNorm
                       ? vec_util::norm_inf(pₖ) / γ
                       : pₖ.norm() / γ;
        }
        case PANOCStopCrit::Ipopt: {
            // Unscaled error: ∞-norm of the unit projected gradient step
            // taken from x̂ₖ
            auto unscaled =
                vec_util::norm_inf(projected_gradient_step(C, 1, x̂ₖ, grad_̂ψₖ));
            auto count = 2 * (ŷₖ.size() + x̂ₖ.size());
            // Nothing to average over: return the unscaled error
            if (count == 0)
                return unscaled;
            // 1-norms used in the scaling factor
            auto box_mult =
                vec_util::norm_1(projecting_difference(x̂ₖ - grad_̂ψₖ, C));
            auto constr_mult   = vec_util::norm_1(ŷₖ);
            const real_t s_max = 100;
            // Scaling factor, never smaller than one
            real_t scale =
                std::max(s_max, (box_mult + constr_mult) / count) / s_max;
            return unscaled / scale;
        }
    }
    throw std::out_of_range("Invalid PANOCStopCrit");
}


/// Increase the estimate of the Lipschitz constant of the objective gradient
/// and decrease the step size until the quadratic upper bound
///     ψ(x̂ₖ) - ψ(xₖ) ≤ ∇ψ(xₖ)ᵀpₖ + ½ Lₖ ‖pₖ‖² + margin
/// holds, or until doubling Lₖ would exceed `L_max`.
///
/// On entry, `ψx̂ₖ`, `norm_sq_pₖ` and `grad_ψₖᵀpₖ` must already hold the
/// values for the current `γₖ`: they are read before they are first written.
///
/// @param problem             Problem description.
/// @param rounding_tolerance  Relative tolerance; the margin is
///                            (1 + |ψₖ|) · rounding_tolerance.
/// @param L_max               Upper limit for Lₖ.
/// @param xₖ                  Current iterate.
/// @param ψₖ                  ψ(xₖ).
/// @param grad_ψₖ             ∇ψ(xₖ).
/// @param y                   Forwarded to `calc_ψ_ŷ`.
/// @param Σ                   Forwarded to `calc_ψ_ŷ`.
/// @param x̂ₖ                  In/out: recomputed for each new step size.
/// @param pₖ                  In/out: recomputed for each new step size.
/// @param ŷx̂ₖ                 In/out: ŷ(x̂ₖ), recomputed for each new step size.
/// @param ψx̂ₖ                 In/out: ψ(x̂ₖ).
/// @param norm_sq_pₖ          In/out: ‖pₖ‖².
/// @param grad_ψₖᵀpₖ          In/out: ∇ψ(xₖ)ᵀpₖ.
/// @param Lₖ                  In/out: Lipschitz estimate, doubled per iteration.
/// @param γₖ                  In/out: step size, halved per iteration.
/// @return                    The value `γₖ` had on entry.
inline real_t descent_lemma(const Problem &problem, real_t rounding_tolerance,
                            real_t L_max, crvec xₖ, real_t ψₖ, crvec grad_ψₖ,
                            crvec y, crvec Σ, rvec x̂ₖ, rvec pₖ, rvec ŷx̂ₖ,
                            real_t &ψx̂ₖ, real_t &norm_sq_pₖ,
                            real_t &grad_ψₖᵀpₖ, real_t &Lₖ, real_t &γₖ) {
    const real_t γ_on_entry = γₖ;
    const real_t margin     = (1 + std::abs(ψₖ)) * rounding_tolerance;

    // Keep going while the upper bound is violated and Lₖ may still be
    // doubled without exceeding L_max
    while ((ψx̂ₖ - ψₖ > grad_ψₖᵀpₖ + 0.5 * Lₖ * norm_sq_pₖ + margin) &&
           (Lₖ * 2 <= L_max)) {
        Lₖ *= 2;
        γₖ /= 2;

        // Calculate x̂ₖ and pₖ (with new step size)
        calc_x̂(problem, γₖ, xₖ, grad_ψₖ, /* in ⟹ out */ x̂ₖ, pₖ);
        // Calculate ∇ψ(xₖ)ᵀpₖ and ‖pₖ‖²
        grad_ψₖᵀpₖ = grad_ψₖ.dot(pₖ);
        norm_sq_pₖ = pₖ.squaredNorm();

        // Calculate ψ(x̂ₖ) and ŷ(x̂ₖ)
        ψx̂ₖ = calc_ψ_ŷ(problem, x̂ₖ, y, Σ, /* in ⟹ out */ ŷx̂ₖ);
    }
    return γ_on_entry;
}


/// Check all stop conditions (required tolerance reached, out of time,
/// maximum number of iterations reached, non-finite error, no progress,
/// interrupted by the user) and return the corresponding status.
///
/// When several conditions hold at once, the first one in this order wins:
/// Converged, MaxTime, MaxIter, NotFinite, NoProgress, Interrupted.
///
/// @param params        Parameters providing `max_time`, `max_iter` and
///                      `max_no_progress`.
/// @param time_elapsed  Time spent so far, compared to `params.max_time`.
/// @param iteration     Current iteration counter.
/// @param stop_signal   Signal queried through `stop_requested()`.
/// @param ε             Required tolerance.
/// @param εₖ            Current error; a NaN never counts as converged
///                      because the comparison `εₖ <= ε` is false.
/// @param no_progress   Counter compared to `params.max_no_progress`.
/// @return              The status of the first condition that holds, or
///                      `SolverStatus::Unknown` if none does.
template <class ParamsT, class DurationT>
inline SolverStatus check_all_stop_conditions(
    const ParamsT &params, DurationT time_elapsed, unsigned iteration,
    const AtomicStopSignal &stop_signal, real_t ε, real_t εₖ,
    unsigned no_progress) {

    // Evaluate every condition up front, independently of the others
    const bool converged   = εₖ <= ε;
    const bool out_of_time = time_elapsed > params.max_time;
    // `>=` rather than `==`, so that a counter that is already past the
    // limit is still reported as MaxIter
    const bool out_of_iter     = iteration >= params.max_iter;
    const bool not_finite      = not std::isfinite(εₖ);
    const bool max_no_progress = no_progress > params.max_no_progress;
    const bool interrupted     = stop_signal.stop_requested();

    if (converged)
        return SolverStatus::Converged;
    if (out_of_time)
        return SolverStatus::MaxTime;
    if (out_of_iter)
        return SolverStatus::MaxIter;
    if (not_finite)
        return SolverStatus::NotFinite;
    if (max_no_progress)
        return SolverStatus::NoProgress;
    if (interrupted)
        return SolverStatus::Interrupted;
    return SolverStatus::Unknown;
}


inline void calc_augmented_lagrangian_hessian(

    const Problem &problem,

    crvec xₖ,

    crvec ŷxₖ,

    crvec y,

    crvec Σ,

    rvec g,

    mat &H,

    rvec work_n) {


    // Compute the Hessian of the Lagrangian

    problem.hess_L(xₖ, ŷxₖ, H);

    // Compute the Hessian of the augmented Lagrangian

    problem.g(xₖ, g);

    for (vec::Index i = 0; i < problem.m; ++i) {

        real_t ζ = g(i) + y(i) / Σ(i);

        bool inactive =

            problem.D.lowerbound(i) < ζ && ζ < problem.D.upperbound(i);

        if (not inactive) {

            problem.grad_gi(xₖ, i, work_n);

            H += work_n * Σ(i) * work_n.transpose();

        }

    }

}


inline void calc_augmented_lagrangian_hessian_prod_fd(

    const Problem &problem,

    crvec xₖ,

    crvec y,

    crvec Σ,

    crvec grad_ψ,

    crvec v,

    rvec Hv,

    rvec work_n1,

    rvec work_n2,

    rvec work_m) {


    real_t cbrt_ε = std::cbrt(std::numeric_limits<real_t>::epsilon());

    real_t h      = cbrt_ε * (1 + xₖ.norm());

    rvec xₖh      = work_n1;

    xₖh           = xₖ + h * v;

    calc_grad_ψ(problem, xₖh, y, Σ, Hv, work_n2, work_m);

    Hv -= grad_ψ;

    Hv /= h;

}


/// Estimate the Lipschitz constant of the gradient ∇ψ using finite
/// differences, and compute ψ(xₖ) and ∇ψ(xₖ) along the way.
///
/// The perturbation is h = max(|xₖ · ε|, δ) element-wise, and the estimate is
/// ‖∇ψ(xₖ + h) - ∇ψ(xₖ)‖ / ‖h‖, clamped to [L_min, L_max].
///
/// @param problem  Problem description.
/// @param xₖ       Point around which the estimate is made.
/// @param y        Forwarded to the ψ/∇ψ evaluations.
/// @param Σ        Forwarded to the ψ/∇ψ evaluations.
/// @param ε        Relative size of the perturbation.
/// @param δ        Lower bound on each element of the perturbation.
/// @param L_min    Lower clamp for the result.
/// @param L_max    Upper clamp for the result.
/// @param ψ        Output: ψ(xₖ).
/// @param grad_ψ   Output: ∇ψ(xₖ).
/// @param work_n1  Scratch: first holds xₖ + h, then reused as workspace.
/// @param work_n2  Scratch: holds ∇ψ(xₖ + h).
/// @param work_n3  Scratch vector.
/// @param work_m   Scratch vector.
/// @return         The clamped Lipschitz estimate.
inline real_t initial_lipschitz_estimate(
    const Problem &problem, crvec xₖ, crvec y, crvec Σ, real_t ε, real_t δ,
    real_t L_min, real_t L_max, real_t &ψ, rvec grad_ψ, rvec work_n1,
    rvec work_n2, rvec work_n3, rvec work_m) {

    // Lazy perturbation expression; evaluated wherever it is used below
    auto h  = (xₖ * ε).cwiseAbs().cwiseMax(δ);
    work_n1 = xₖ + h;
    const real_t norm_h = h.norm();

    // Calculate ∇ψ(x₀ + h)
    calc_grad_ψ(problem, work_n1, y, Σ, /* in ⟹ out */ work_n2, work_n3,
                work_m);
    // Calculate ψ(xₖ), ∇ψ(x₀); work_n1 is free to be reused from here on
    ψ = calc_ψ_grad_ψ(problem, xₖ, y, Σ, /* in ⟹ out */ grad_ψ, work_n1,
                      work_m);

    // Estimate Lipschitz constant using finite differences
    const real_t L_estimate = (work_n2 - grad_ψ).norm() / norm_h;
    return std::clamp(L_estimate, L_min, L_max);
}


/// Estimate the Lipschitz constant of the gradient ∇ψ using finite
/// differences, and compute ∇ψ(xₖ) along the way (ψ itself is not computed).
///
/// The perturbation is h = max(|xₖ · ε|, δ) element-wise, and the estimate is
/// ‖∇ψ(xₖ + h) - ∇ψ(xₖ)‖ / ‖h‖, clamped to [L_min, L_max].
///
/// @param problem  Problem description.
/// @param xₖ       Point around which the estimate is made.
/// @param y        Forwarded to `calc_grad_ψ`.
/// @param Σ        Forwarded to `calc_grad_ψ`.
/// @param ε        Relative size of the perturbation.
/// @param δ        Lower bound on each element of the perturbation.
/// @param L_min    Lower clamp for the result.
/// @param L_max    Upper clamp for the result.
/// @param grad_ψ   Output: ∇ψ(xₖ).
/// @param work_n1  Scratch: first holds xₖ + h, then reused as workspace.
/// @param work_n2  Scratch: holds ∇ψ(xₖ + h).
/// @param work_n3  Scratch vector.
/// @param work_m   Scratch vector.
/// @return         The clamped Lipschitz estimate.
inline real_t initial_lipschitz_estimate(
    const Problem &problem, crvec xₖ, crvec y, crvec Σ, real_t ε, real_t δ,
    real_t L_min, real_t L_max, rvec grad_ψ, rvec work_n1, rvec work_n2,
    rvec work_n3, rvec work_m) {

    // Lazy perturbation expression; evaluated wherever it is used below
    auto h  = (xₖ * ε).cwiseAbs().cwiseMax(δ);
    work_n1 = xₖ + h;
    const real_t norm_h = h.norm();

    // Calculate ∇ψ(x₀ + h)
    calc_grad_ψ(problem, work_n1, y, Σ, /* in ⟹ out */ work_n2, work_n3,
                work_m);
    // Calculate ∇ψ(x₀); work_n1 is free to be reused from here on
    calc_grad_ψ(problem, xₖ, y, Σ, /* in ⟹ out */ grad_ψ, work_n1, work_m);

    // Estimate Lipschitz constant using finite differences
    const real_t L_estimate = (work_n2 - grad_ψ).norm() / norm_h;
    return std::clamp(L_estimate, L_min, L_max);
}


} // namespace pa::detail

atomic_stop_signal.hpp

pa::AtomicStopSignal
Definition: atomic_stop_signal.hpp:7

pa::AtomicStopSignal::stop_requested
bool stop_requested() const
Definition: atomic_stop_signal.hpp:16

problem.hpp

bicycle-obstacle-avoidance-mpc.prob
prob
Definition: bicycle-obstacle-avoidance-mpc.py:38

codegen-rosenbrock.y
y
Definition: codegen-rosenbrock.py:9

codegen-rosenbrock.g
int g
Definition: codegen-rosenbrock.py:17

codegen-rosenbrock.x
x
Definition: codegen-rosenbrock.py:8

getting-started.p
p
Definition: getting-started.py:11

main.problem
problem
Definition: main.py:16

main.H
H
Definition: main.py:8

pa::detail
Definition: alm-helpers.hpp:6

pa::detail::stop_crit_requires_grad_̂ψₖ
bool stop_crit_requires_grad_̂ψₖ(PANOCStopCrit crit)
Definition: panoc-helpers.hpp:153

pa::detail::calc_err_z
void calc_err_z(const Problem &p, crvec x̂, crvec y, crvec Σ, rvec err_z)
Calculate the error between ẑ and g(x).
Definition: panoc-helpers.hpp:107

pa::detail::calc_augmented_lagrangian_hessian_prod_fd
void calc_augmented_lagrangian_hessian_prod_fd(const Problem &problem, crvec xₖ, crvec y, crvec Σ, crvec grad_ψ, crvec v, rvec Hv, rvec work_n1, rvec work_n2, rvec work_m)
Compute the Hessian matrix of the augmented Lagrangian function multiplied by the given vector, using finite differences.
Definition: panoc-helpers.hpp:379

pa::detail::calc_grad_ψ
void calc_grad_ψ(const Problem &p, crvec x, crvec y, crvec Σ, rvec grad_ψ, rvec work_n, rvec work_m)
Calculate the gradient ∇ψ(x).
Definition: panoc-helpers.hpp:79

pa::detail::calc_ψ_ŷ
real_t calc_ψ_ŷ(const Problem &p, crvec x, crvec y, crvec Σ, rvec ŷ)
Calculate both ψ(x) and the vector ŷ that can later be used to compute ∇ψ.
Definition: panoc-helpers.hpp:16

pa::detail::projected_gradient_step
auto projected_gradient_step(const Box &C, real_t γ, crvec x, crvec grad_ψ)
Projected gradient step.
Definition: panoc-helpers.hpp:131

pa::detail::calc_grad_ψ_from_ŷ
void calc_grad_ψ_from_ŷ(const Problem &p, crvec x, crvec ŷ, rvec grad_ψ, rvec work_n)
Calculate ∇ψ(x) using ŷ.
Definition: panoc-helpers.hpp:44

pa::detail::initial_lipschitz_estimate
real_t initial_lipschitz_estimate(const Problem &problem, crvec xₖ, crvec y, crvec Σ, real_t ε, real_t δ, real_t L_min, real_t L_max, real_t &ψ, rvec grad_ψ, rvec work_n1, rvec work_n2, rvec work_n3, rvec work_m)
Estimate the Lipschitz constant of the gradient $\nabla\psi$ using finite differences.
Definition: panoc-helpers.hpp:412

pa::detail::check_all_stop_conditions
SolverStatus check_all_stop_conditions(const ParamsT &params, DurationT time_elapsed, unsigned iteration, const AtomicStopSignal &stop_signal, real_t ε, real_t εₖ, unsigned no_progress)
Check all stop conditions (required tolerance reached, out of time, maximum number of iterations exceeded, non-finite error, no progress, interrupted by the user).
Definition: panoc-helpers.hpp:307

pa::detail::calc_ψ_grad_ψ
real_t calc_ψ_grad_ψ(const Problem &p, crvec x, crvec y, crvec Σ, rvec grad_ψ, rvec work_n, rvec work_m)
Calculate both ψ(x) and its gradient ∇ψ(x).
Definition: panoc-helpers.hpp:62

pa::detail::calc_x̂
void calc_x̂(const Problem &prob, real_t γ, crvec x, crvec grad_ψ, rvec x̂, rvec p)
Definition: panoc-helpers.hpp:142

pa::detail::descent_lemma
real_t descent_lemma(const Problem &problem, real_t rounding_tolerance, real_t L_max, crvec xₖ, real_t ψₖ, crvec grad_ψₖ, crvec y, crvec Σ, rvec x̂ₖ, rvec pₖ, rvec ŷx̂ₖ, real_t &ψx̂ₖ, real_t &norm_sq_pₖ, real_t &grad_ψₖᵀpₖ, real_t &Lₖ, real_t &γₖ)
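Increase the estimate of the Lipschitz constant of the objective gradient and decrease the step size until the quadratic upper bound (descent lemma) is satisfied or the estimate can no longer be doubled without exceeding L_max.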
Definition: panoc-helpers.hpp:242

pa::detail::calc_error_stop_crit
real_t calc_error_stop_crit(const Box &C, PANOCStopCrit crit, crvec pₖ, real_t γ, crvec xₖ, crvec x̂ₖ, crvec ŷₖ, crvec grad_ψₖ, crvec grad_̂ψₖ)
Compute the ε from the stopping criterion, see PANOCStopCrit.
Definition: panoc-helpers.hpp:169

pa::detail::calc_augmented_lagrangian_hessian
void calc_augmented_lagrangian_hessian(const Problem &problem, crvec xₖ, crvec ŷxₖ, crvec y, crvec Σ, rvec g, mat &H, rvec work_n)
Compute the Hessian matrix of the augmented Lagrangian function.
Definition: panoc-helpers.hpp:342

pa::vec_util::norm_1
real_t norm_1(const Vec &v)
Get the 1-norm of the given vector.
Definition: vec.hpp:49

pa::vec_util::norm_inf
real_t norm_inf(const Vec &v)
Get the maximum or infinity-norm of the given vector.
Definition: vec.hpp:42

pa::PANOCStopCrit
PANOCStopCrit
Definition: panoc-stop-crit.hpp:8

pa::PANOCStopCrit::ProjGradUnitNorm
@ ProjGradUnitNorm
∞-norm of the projected gradient with unit step size: $\varepsilon = \left\| \Pi_C\!\left(x^k - \nabla\psi(x^k)\right) - x^k \right\|_\infty$

pa::PANOCStopCrit::ProjGradNorm
@ ProjGradNorm
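∞-norm of the projected gradient with step size γ: $\varepsilon = \left\| p^k \right\|_\infty$, where $p^k = \Pi_C\!\left(x^k - \gamma \nabla\psi(x^k)\right) - x^k$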

pa::PANOCStopCrit::Ipopt
@ Ipopt
The stopping criterion used by Ipopt, see https://link.springer.com/article/10.1007/s10107-004-0559-y...

pa::PANOCStopCrit::FPRNorm2
@ FPRNorm2
2-norm of fixed point residual: $\varepsilon = \gamma^{-1} \left\| p^k \right\|_2$

pa::PANOCStopCrit::ProjGradNorm2
@ ProjGradNorm2
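2-norm of the projected gradient with step size γ: $\varepsilon = \left\| p^k \right\|_2$, where $p^k = \Pi_C\!\left(x^k - \gamma \nabla\psi(x^k)\right) - x^k$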

pa::PANOCStopCrit::ApproxKKT
@ ApproxKKT
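Find an ε-approximate KKT point in the ∞-norm: $\varepsilon = \left\| \gamma^{-1} p^k + \left(\nabla\psi(x^k) - \nabla\psi(\hat x^k)\right) \right\|_\infty$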

pa::PANOCStopCrit::FPRNorm
@ FPRNorm
∞-norm of fixed point residual: $\varepsilon = \gamma^{-1} \left\| p^k \right\|_\infty$

pa::PANOCStopCrit::ApproxKKT2
@ ApproxKKT2
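Find an ε-approximate KKT point in the 2-norm: $\varepsilon = \left\| \gamma^{-1} p^k + \left(\nabla\psi(x^k) - \nabla\psi(\hat x^k)\right) \right\|_2$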

pa::PANOCStopCrit::ProjGradUnitNorm2
@ ProjGradUnitNorm2
2-norm of the projected gradient with unit step size: $\varepsilon = \left\| \Pi_C\!\left(x^k - \nabla\psi(x^k)\right) - x^k \right\|_2$

pa::crvec
Eigen::Ref< const vec > crvec
Default type for immutable references to vectors.
Definition: vec.hpp:18

pa::project
auto project(const Vec &v, const Box &box)
Project a vector onto a box.
Definition: box.hpp:15

pa::SolverStatus
SolverStatus
Exit status of a numerical solver such as ALM or PANOC.
Definition: solverstatus.hpp:7

pa::SolverStatus::Interrupted
@ Interrupted
Solver was interrupted by the user.

pa::SolverStatus::Unknown
@ Unknown
Initial value.

pa::SolverStatus::MaxTime
@ MaxTime
Maximum allowed execution time exceeded.

pa::SolverStatus::NoProgress
@ NoProgress
No progress was made in the last iteration.

pa::SolverStatus::MaxIter
@ MaxIter
Maximum number of iterations exceeded.

pa::SolverStatus::Converged
@ Converged
Converged and reached given tolerance.

pa::SolverStatus::NotFinite
@ NotFinite
Intermediate results were infinite or not-a-number.

pa::mat
realmat mat
Default type for matrices.
Definition: vec.hpp:20

pa::real_t
double real_t
Default floating point type.
Definition: vec.hpp:8

pa::projecting_difference
auto projecting_difference(const Vec &v, const Box &box)
Get the difference between the given vector and its projection.
Definition: box.hpp:28

pa::rvec
Eigen::Ref< vec > rvec
Default type for mutable references to vectors.
Definition: vec.hpp:16

pa::Box
Definition: box.hpp:7

panocpy.test.params
params
Definition: test.py:275

panocpy.test.L
int L
Definition: test.py:49

panocpy.test.Σ
int Σ
Definition: test.py:72

panocpy.test.err_z
err_z
Definition: test.py:78

panocpy.test.n
int n
Definition: test.py:40

panocpy.test.ε
int ε
Definition: test.py:73

panocpy.test.C
C
Definition: test.py:262

panocpy.test.v
v
Definition: test.py:44

panoc-stop-crit.hpp

solverstatus.hpp

pa::Problem
Problem description for minimization problems.
Definition: include/panoc-alm/util/problem.hpp:26