Source code for kona.algorithms.util.merit

import sys

class MeritFunction(object):
    """
    Base class for all merit functions.

    Attributes
    ----------
    primal_factory : VectorFactory
        Generator for new primal vectors.
    state_factory : VectorFactory
        Generator for new state vectors.
    out_file : file
        File stream for writing data.
    _allocated : boolean
        Flag to track whether merit function memory has been allocated.

    Parameters
    ----------
    primal_factory : VectorFactory
    state_factory : VectorFactory
    optns : dict, optional
    out_file : file, optional
    """
    def __init__(self, primal_factory, state_factory,
                 optns=None, out_file=sys.stdout):
        # NOTE: the default for ``optns`` was a mutable dict ({}); use the
        # None sentinel instead to avoid the shared-default-argument pitfall.
        # The base class does not read ``optns``, so this is fully
        # backward compatible for subclasses that forward it positionally.
        self.primal_factory = primal_factory
        self.state_factory = state_factory
        self.out_file = out_file
        self._allocated = False

    def reset(self, search_dir, x_start, u_start, p_dot_grad=None):
        """
        Reset the merit function at a new design and state point.

        If merit memory is not yet allocated, this function should also
        do that.

        Parameters
        ----------
        search_dir : DesignVector or CompositePrimalVector
            Search direction vector in the primal space.
        x_start : DesignVector
            Initial primal vector.
        u_start : StateVector
            State vector corresponding to ``x_start``.
        p_dot_grad : float, optional
            Value of :math:`\\langle p, \\nabla f \\rangle` at ``x_start``.
        """
        raise NotImplementedError # pragma: no cover

    def eval_func(self, alpha):
        """
        Evaluate merit function value at ``alpha``

        Parameters
        ----------
        alpha : float

        Returns
        -------
        float : Value of merit function ``alpha``.
        """
        raise NotImplementedError # pragma: no cover

    def eval_grad(self, alpha):
        """
        Evaluate merit function gradient
        :math:`\\langle p, \\nabla f \\rangle` at the given ``alpha``

        .. note::

            This method can either ``pass`` or ``return 0`` for
            gradient-free merit functions.

        Parameters
        ----------
        alpha : float

        Returns
        -------
        float : Value of :math:`\\langle p, \\nabla f \\rangle` at ``alpha``.
        """
        return 0 # pragma: no cover
class ObjectiveMerit(MeritFunction):
    """
    Merit function for line searches applied to the raw objective.

    Other, more complicated merit functions can be derived from this.

    Attributes
    ----------
    last_func_alpha : float
        Last value of alpha for which objective value is evaluated.
    last_grad_alpha : float
        Last value of alpha for which objective grad is evaluated.
    func_val : float
        Value of the objective at ``last_func_alpha``.
    p_dot_grad : float
        Value of :math:`\\langle p, \\nabla f \\rangle` at ``last_grad_alpha``.
    x_start : DesignVector
        Initial position of the primal variables, where :math:`\\alpha = 0`.
    x_trial : DesignVector
        Trial position of the primal variables at a new alpha.
    u_trial : StateVector
        Trial position of the state variables at a new alpha.
    search_dir : DesignVector
        The search direction vector.
    state_work : StateVector
        Work vector for state operations.
    adjoint_work : StateVector
        Work vector for adjoint operations.
    primal_work : DesignVector
        Work vector for primal operations.
    """

    def __init__(self, primal_factory, state_factory,
                 optns={}, out_file=sys.stdout):
        super(ObjectiveMerit, self).__init__(primal_factory, state_factory,
                                             optns, out_file)
        # reserve the vectors that reset() will generate lazily
        self.primal_factory.request_num_vectors(4)
        self.state_factory.request_num_vectors(3)

    def reset(self, search_dir, x_start, u_start, p_dot_grad):
        assert isinstance(search_dir, DesignVector)
        assert isinstance(x_start, DesignVector)
        assert isinstance(u_start, StateVector)
        # the first reset allocates all persistent work vectors
        if not self._allocated:
            self.x_start = self.primal_factory.generate()
            self.x_trial = self.primal_factory.generate()
            self.search_dir = self.primal_factory.generate()
            self.primal_work = self.primal_factory.generate()
            self.u_trial = self.state_factory.generate()
            self.state_work = self.state_factory.generate()
            self.adjoint_work = self.state_factory.generate()
            self._allocated = True
        # capture the new line-search origin and direction
        self.x_start.equals(x_start)
        self.search_dir.equals(search_dir)
        self.func_val = objective_value(x_start, u_start)
        self.p_dot_grad = p_dot_grad
        self.last_func_alpha = 0.0
        self.last_grad_alpha = 0.0

    def eval_func(self, alpha):
        # return the cached value when alpha is numerically unchanged
        if abs(alpha - self.last_func_alpha) <= EPS:
            return self.func_val
        # step to the trial primal point: x_trial = x_start + alpha*p
        self.x_trial.equals_ax_p_by(
            1.0, self.x_start, alpha, self.search_dir)
        solved = self.u_trial.equals_primal_solution(self.x_trial)
        if solved:
            # raw objective at the converged trial point
            self.func_val = objective_value(self.x_trial, self.u_trial)
        else:
            # flag a failed state solve with NaN
            self.func_val = np.nan
        self.last_func_alpha = alpha
        return self.func_val

    def eval_grad(self, alpha):
        # return the cached value when alpha is numerically unchanged
        if abs(alpha - self.last_grad_alpha) <= EPS:
            return self.p_dot_grad
        # step to the trial point and solve for the state
        self.x_trial.equals_ax_p_by(
            1.0, self.x_start, alpha, self.search_dir)
        self.x_trial.enforce_bounds()
        self.u_trial.equals_primal_solution(self.x_trial)
        # direct contribution from the objective partial
        self.primal_work.equals_objective_partial(
            self.x_trial, self.u_trial)
        self.p_dot_grad = self.search_dir.inner(self.primal_work)
        # adjoint contribution from non-linear state changes
        self.adjoint_work.equals_objective_adjoint(
            self.x_trial, self.u_trial, self.state_work)
        drdx_jac = dRdX(self.x_trial, self.u_trial)
        drdx_jac.T.product(self.adjoint_work, self.primal_work)
        self.p_dot_grad += self.search_dir.inner(self.primal_work)
        self.last_grad_alpha = alpha
        return self.p_dot_grad
class L2QuadraticPenalty(MeritFunction):
    """
    A merit function with an L2 constraint norm penalty term, used for
    constrained RSNK problems.

    The merit function is defined as:

    .. math::
        \\mathcal{M}(x, s) = f(x, u(x))
        + \\frac{1}{2} \\mu || c_{eq}(x, u(x)) ||^2
        + \\frac{1}{2} \\mu || c_{in}(x, u(x)) - s ||^2
    """

    def __init__(self, primal_factory, state_factory=None,
                 eq_factory=None, ineq_factory=None,
                 optns={}, out_file=sys.stdout):
        # trigger the base class initialization
        super(L2QuadraticPenalty, self).__init__(
            primal_factory, state_factory, optns, out_file)
        # at least one kind of constraint must be present
        if eq_factory is None and ineq_factory is None:
            raise TypeError("L2QuadraticPenalty >> " +
                            "Must provide at least one dual factory!")
        self.eq_factory = eq_factory
        self.ineq_factory = ineq_factory
        # request all necessary vectors
        self.primal_factory.request_num_vectors(2)
        self.state_factory.request_num_vectors(3)
        if self.eq_factory is not None:
            self.eq_factory.request_num_vectors(1)
        if self.ineq_factory is not None:
            self.ineq_factory.request_num_vectors(3)

    def reset(self, kkt_start, u_start, search_dir, mu):
        # the first reset allocates all persistent work vectors
        if not self._allocated:
            self.design_work = self.primal_factory.generate()
            self.x_trial = self.primal_factory.generate()
            self.u_trial = self.state_factory.generate()
            self.state_work = self.state_factory.generate()
            self.adjoint_work = self.state_factory.generate()
            if self.eq_factory is not None:
                self.cnstr_eq = self.eq_factory.generate()
            else:
                self.cnstr_eq = None
            if self.ineq_factory is not None:
                self.cnstr_ineq = self.ineq_factory.generate()
                self.slack_trial = self.ineq_factory.generate()
                self.slack_work = self.ineq_factory.generate()
            else:
                self.cnstr_ineq = None
                self.slack_trial = None
                self.slack_work = None
            self._allocated = True
        # record the new line-search origin
        self.p_dot_grad = None
        self.mu = mu
        self.u_start = u_start
        if isinstance(kkt_start.primal, CompositePrimalVector):
            # design and slack variables travel together
            self.x_start = kkt_start.primal.design
            self.design_step = search_dir.primal.design
            self.slack_start = kkt_start.primal.slack
            self.slack_step = search_dir.primal.slack
        else:
            self.x_start = kkt_start.primal
            self.design_step = search_dir.primal
            self.slack_start = None
            self.slack_step = None
        # seed the trial point with the starting point
        self.x_trial.equals(self.x_start)
        self.u_trial.equals(self.u_start)
        # evaluate constraints at the starting point
        if self.cnstr_eq is not None:
            self.cnstr_eq.equals_constraints(self.x_trial, self.u_trial)
        if self.cnstr_ineq is not None:
            self.cnstr_ineq.equals_constraints(self.x_trial, self.u_trial)
            self.slack_trial.equals(self.slack_start)
            self.cnstr_ineq.minus(self.slack_trial)
        # merit value at alpha = 0
        self.func_val = self._penalized_value()
        self.last_func_alpha = 0.0

    def _penalized_value(self):
        # objective plus quadratic penalty terms at the current trial point
        total = objective_value(self.x_trial, self.u_trial)
        if self.cnstr_eq is not None:
            total += 0.5 * self.mu * (self.cnstr_eq.norm2 ** 2)
        if self.cnstr_ineq is not None:
            total += 0.5 * self.mu * (self.cnstr_ineq.norm2 ** 2)
        return total

    def eval_func(self, alpha):
        # return the cached value when alpha is numerically unchanged
        if abs(alpha - self.last_func_alpha) <= EPS:
            return self.func_val
        # compute the trial point
        self.x_trial.equals_ax_p_by(
            1., self.x_start, alpha, self.design_step)
        self.x_trial.enforce_bounds()
        self.u_trial.equals_primal_solution(self.x_trial)
        # evaluate constraints at the trial point
        if self.cnstr_eq is not None:
            self.cnstr_eq.equals_constraints(self.x_trial, self.u_trial)
        if self.cnstr_ineq is not None:
            self.cnstr_ineq.equals_constraints(self.x_trial, self.u_trial)
            self.slack_trial.equals_ax_p_by(
                1., self.slack_start, alpha, self.slack_step)
            self.cnstr_ineq.minus(self.slack_trial)
        # evaluate the merit function value
        self.func_val = self._penalized_value()
        self.last_func_alpha = alpha
        return self.func_val
class AugmentedLagrangian(L2QuadraticPenalty):
    """
    An augmented Lagrangian merit function for constrained RSNK problems.

    The augmented Lagrangian is defined as:

    .. math::
        \\hat{\\mathcal{L}}(x, s) = f(x, u(x)) +
        \\lambda_{eq}^T c_{eq}(x, u(x)) +
        \\lambda_{in}^T \\left[c_{in}(x, u(x)) - s\\right] +
        \\frac{1}{2} \\mu || c_{eq}(x, u(x)) ||^2 +
        \\frac{1}{2} \\mu || c_{in}(x, u(x)) - s ||^2

    Unlike the traditional augmented Lagrangian, the Kona version has the
    Lagrange multipliers and the slack variables frozen. This is done to
    make the merit function comparable to the predicted decrease produced
    by the FLECS solver.
    """
    def __init__(self, primal_factory, state_factory,
                 eq_factory=None, ineq_factory=None,
                 optns={}, out_file=sys.stdout):
        # initialize the parent merit function
        super(AugmentedLagrangian, self).__init__(
            primal_factory, state_factory, eq_factory, ineq_factory,
            optns, out_file)
        # when True, multipliers are held at their starting values during
        # the line search; otherwise they move along the dual step
        self.freeze_mults = get_opt(optns, False, 'freeze_mults')
        # request an additional dual vector
        if self.eq_factory is not None:
            self.eq_factory.request_num_vectors(1)
        if self.ineq_factory is not None:
            self.ineq_factory.request_num_vectors(1)
        # child allocation flag
        self._child_allocated = False

    def reset(self, kkt_start, u_start, search_dir, mu):
        # reset the parent merit function first -- this allocates and
        # evaluates the constraint vectors used below
        super(AugmentedLagrangian, self).reset(
            kkt_start, u_start, search_dir, mu)
        # if the internal vectors are not allocated, do it now
        if not self._child_allocated:
            if self.eq_factory is not None:
                self.mult_eq = self.eq_factory.generate()
            else:
                self.mult_eq = None
            if self.ineq_factory is not None:
                self.mult_ineq = self.ineq_factory.generate()
            else:
                # BUG FIX: this branch previously assigned self.mult_eq,
                # clobbering the equality multiplier and leaving
                # self.mult_ineq undefined for eq-only problems
                self.mult_ineq = None
            self._child_allocated = True
        # store references to dual start and dual step
        if self.cnstr_eq is None:
            # inequality constraints only
            self.mult_eq_start = None
            self.mult_eq_step = None
            self.mult_ineq_start = kkt_start.dual
            self.mult_ineq_step = search_dir.dual
        elif self.cnstr_ineq is None:
            # equality constraints only
            self.mult_eq_start = kkt_start.dual
            self.mult_eq_step = search_dir.dual
            self.mult_ineq_start = None
            self.mult_ineq_step = None
        else:
            # both kinds present -- the dual vector is composite
            self.mult_eq_start = kkt_start.dual.eq
            self.mult_eq_step = search_dir.dual.eq
            self.mult_ineq_start = kkt_start.dual.ineq
            self.mult_ineq_step = search_dir.dual.ineq
        # add multiplier terms to the function value
        if self.cnstr_eq is not None:
            self.mult_eq.equals(self.mult_eq_start)
            self.func_val += self.mult_eq.inner(self.cnstr_eq)
        if self.cnstr_ineq is not None:
            self.mult_ineq.equals(self.mult_ineq_start)
            self.func_val += self.mult_ineq.inner(self.cnstr_ineq)

    def eval_func(self, alpha):
        if abs(alpha - self.last_func_alpha) > EPS:
            # evaluate the parent merit function value
            self.func_val = super(AugmentedLagrangian, self).eval_func(alpha)
            # add the multiplier terms on top of the parent merit value
            # (a stray Python-2 debug `print` statement was removed here)
            if self.cnstr_eq is not None:
                if not self.freeze_mults:
                    self.mult_eq.equals_ax_p_by(
                        1., self.mult_eq_start, alpha, self.mult_eq_step)
                else:
                    self.mult_eq.equals(self.mult_eq_start)
                self.func_val += self.mult_eq.inner(self.cnstr_eq)
            if self.cnstr_ineq is not None:
                if not self.freeze_mults:
                    self.mult_ineq.equals_ax_p_by(
                        1., self.mult_ineq_start, alpha, self.mult_ineq_step)
                else:
                    self.mult_ineq.equals(self.mult_ineq_start)
                self.func_val += self.mult_ineq.inner(self.cnstr_ineq)
        return self.func_val
# imports here to prevent circular errors import numpy as np from kona.options import get_opt from kona.linalg.common import objective_value from kona.linalg.solvers.util import EPS from kona.linalg.vectors.common import * from kona.linalg.vectors.composite import CompositePrimalVector