gtsam/gtsam_unstable/linear/QPSolver.h

/*
 * QPSolver.h
 * @brief: A quadratic programming solver implements the active set method
 * @date: Apr 15, 2014
 * @author: thduynguyen
 */

#pragma once

#include <gtsam/linear/VectorValues.h>
#include <gtsam_unstable/linear/QP.h>

#include <vector>
#include <set>

namespace gtsam {

/// This struct holds the state of QPSolver at each iteration
struct QPState {
  VectorValues values;
  VectorValues duals;
  LinearInequalityFactorGraph workingSet;
  bool converged;

  /// default constructor
  QPState() :
      values(), duals(), workingSet(), converged(false) {
  }

  /// constructor with initial values
  QPState(const VectorValues& initialValues, const VectorValues& initialDuals,
      const LinearInequalityFactorGraph& initialWorkingSet, bool _converged) :
      values(initialValues), duals(initialDuals), workingSet(initialWorkingSet), converged(
          _converged) {
  }
};

/**
 * This class implements the active set method to solve quadratic programming problems
 * encoded in a GaussianFactorGraph with special mixed constrained noise models, in which
 * a negative sigma denotes an inequality <=0 constraint,
 * a zero sigma denotes an equality =0 constraint,
 * and a positive sigma denotes a normal Gaussian noise model.
 */
class QPSolver {

  const QP& qp_; //!< factor graphs of the QP problem, can't be modified!
  GaussianFactorGraph baseGraph_; //!< factor graphs of cost factors and linear equalities. The working set of inequalities will be added to this base graph in the process.
  VariableIndex costVariableIndex_, equalityVariableIndex_,
      inequalityVariableIndex_;
  FastSet<Key> constrainedKeys_; //!< all constrained keys, will become factors in the dual graph

public:
  /// Constructor
  QPSolver(const QP& qp);

  /// Find solution with the current working set
  VectorValues solveWithCurrentWorkingSet(
      const LinearInequalityFactorGraph& workingSet) const;

  /// @name Build the dual graph
  /// @{

  /// Collect the Jacobian terms for a dual factor
  template<typename FACTOR>
  std::vector<std::pair<Key, Matrix> > collectDualJacobians(Key key,
      const FactorGraph<FACTOR>& graph,
      const VariableIndex& variableIndex) const {
    std::vector<std::pair<Key, Matrix> > Aterms;
    if (variableIndex.find(key) != variableIndex.end()) {
      BOOST_FOREACH(size_t factorIx, variableIndex[key]){
      typename FACTOR::shared_ptr factor = graph.at(factorIx);
      if (!factor->active()) continue;
      Matrix Ai = factor->getA(factor->find(key)).transpose();
      Aterms.push_back(std::make_pair(factor->dualKey(), Ai));
    }
  }
    return Aterms;
  }

  /// Create a dual factor
  JacobianFactor::shared_ptr createDualFactor(Key key,
      const LinearInequalityFactorGraph& workingSet,
      const VectorValues& delta) const;

  /**
   * Build the dual graph to solve for the Lagrange multipliers.
   *
   * The Lagrangian function is:
   *        L(X,lambdas) = f(X) - \sum_k lambda_k * c_k(X),
   * where the unconstrained part is
   *        f(X) = 0.5*X'*G*X - X'*g + 0.5*f0
   * and the linear equality constraints are
   *        c1(X), c2(X), ..., cm(X)
   *
   * Take the derivative of L wrt X at the solution and set it to 0, we have
   *    \grad f(X) = \sum_k lambda_k * \grad c_k(X)   (*)
   *
   * For each set of rows of (*) corresponding to a variable xi involving in some constraints
   * we have:
   *    \grad f(xi) = \frac{\partial f}{\partial xi}' = \sum_j G_ij*xj - gi
   *    \grad c_k(xi) = \frac{\partial c_k}{\partial xi}'
   *
   * Note: If xi does not involve in any constraint, we have the trivial condition
   * \grad f(Xi) = 0, which should be satisfied as a usual condition for unconstrained variables.
   *
   * So each variable xi involving in some constraints becomes a linear factor A*lambdas - b = 0
   * on the constraints' lambda multipliers, as follows:
   *    - The jacobian term A_k for each lambda_k is \grad c_k(xi)
   *    - The constant term b is \grad f(xi), which can be computed from all unconstrained
   *    Hessian factors connecting to xi: \grad f(xi) = \sum_j G_ij*xj - gi
   */
  GaussianFactorGraph::shared_ptr buildDualGraph(
      const LinearInequalityFactorGraph& workingSet,
      const VectorValues& delta) const;

  /// @}

  /**
   * The goal of this function is to find currently active inequality constraints
   * that violate the condition to be active. The one that violates the condition
   * the most will be removed from the active set. See Nocedal06book, pg 469-471
   *
   * Find the BAD active inequality that pulls x strongest to the wrong direction
   * of its constraint (i.e. it is pulling towards >0, while its feasible region is <=0)
   *
   * For active inequality constraints (those that are enforced as equality constraints
   * in the current working set), we want lambda < 0.
   * This is because:
   *   - From the Lagrangian L = f - lambda*c, we know that the constraint force
   *     is (lambda * \grad c) = \grad f. Intuitively, to keep the solution x stay
   *     on the constraint surface, the constraint force has to balance out with
   *     other unconstrained forces that are pulling x towards the unconstrained
   *     minimum point. The other unconstrained forces are pulling x toward (-\grad f),
   *     hence the constraint force has to be exactly \grad f, so that the total
   *     force is 0.
   *   - We also know that  at the constraint surface c(x)=0, \grad c points towards + (>= 0),
   *     while we are solving for - (<=0) constraint.
   *   - We want the constraint force (lambda * \grad c) to pull x towards the - (<=0) direction
   *     i.e., the opposite direction of \grad c where the inequality constraint <=0 is satisfied.
   *     That means we want lambda < 0.
   *   - This is because when the constrained force pulls x towards the infeasible region (+),
   *     the unconstrained force is pulling x towards the opposite direction into
   *     the feasible region (again because the total force has to be 0 to make x stay still)
   *     So we can drop this constraint to have a lower error but feasible solution.
   *
   * In short, active inequality constraints with lambda > 0 are BAD, because they
   * violate the condition to be active.
   *
   * And we want to remove the worst one with the largest lambda from the active set.
   *
   */
  int identifyLeavingConstraint(const LinearInequalityFactorGraph& workingSet,
      const VectorValues& lambdas) const;

  /**
   * Compute step size alpha for the new solution x' = xk + alpha*p, where alpha \in [0,1]
   *
   *    @return a tuple of (alpha, factorIndex, sigmaIndex) where (factorIndex, sigmaIndex)
   *            is the constraint that has minimum alpha, or (-1,-1) if alpha = 1.
   *            This constraint will be added to the working set and become active
   *            in the next iteration
   */
  boost::tuple<double, int> computeStepSize(
      const LinearInequalityFactorGraph& workingSet, const VectorValues& xk,
      const VectorValues& p) const;

  /** Iterate 1 step, return a new state with a new workingSet and values */
  QPState iterate(const QPState& state) const;

  /**
   * Identify active constraints based on initial values.
   */
  LinearInequalityFactorGraph identifyActiveConstraints(
      const LinearInequalityFactorGraph& inequalities,
      const VectorValues& initialValues) const;

  /** Optimize with a provided initial values
   * For this version, it is the responsibility of the caller to provide
   * a feasible initial value.
   * @return a pair of <primal, dual> solutions
   */
  std::pair<VectorValues, VectorValues> optimize(
      const VectorValues& initialValues) const;

};

} /* namespace gtsam */
refactor QPSolver into its own class 2014-04-16 04:27:19 +08:00			`/*`
			`* QPSolver.h`
			`* @brief: A quadratic programming solver implements the active set method`
			`* @date: Apr 15, 2014`
			`* @author: thduynguyen`
			`*/`

			`#pragma once`

			`#include <gtsam/linear/VectorValues.h>`
refactor QPSolver inprogress... Compiled but tests failed. 2014-12-09 19:13:57 +08:00			`#include <gtsam_unstable/linear/QP.h>`
refactor QPSolver into its own class 2014-04-16 04:27:19 +08:00
Headers and standard formatting 2014-11-26 16:04:34 +08:00			`#include <vector>`
			`#include <set>`

refactor QPSolver into its own class 2014-04-16 04:27:19 +08:00			`namespace gtsam {`

refactor QPSolver inprogress... Compiled but tests failed. 2014-12-09 19:13:57 +08:00			`/// This struct holds the state of QPSolver at each iteration`
			`struct QPState {`
			`VectorValues values;`
			`VectorValues duals;`
			`LinearInequalityFactorGraph workingSet;`
			`bool converged;`

			`/// default constructor`
			`QPState() :`
			`values(), duals(), workingSet(), converged(false) {`
			`}`

			`/// constructor with initial values`
			`QPState(const VectorValues& initialValues, const VectorValues& initialDuals,`
			`const LinearInequalityFactorGraph& initialWorkingSet, bool _converged) :`
			`values(initialValues), duals(initialDuals), workingSet(initialWorkingSet), converged(`
			`_converged) {`
			`}`
			`};`

refactor QPSolver into its own class 2014-04-16 04:27:19 +08:00			`/**`
			`* This class implements the active set method to solve quadratic programming problems`
			`* encoded in a GaussianFactorGraph with special mixed constrained noise models, in which`
			`* a negative sigma denotes an inequality <=0 constraint,`
			`* a zero sigma denotes an equality =0 constraint,`
			`* and a positive sigma denotes a normal Gaussian noise model.`
			`*/`
			`class QPSolver {`
Simplified freeHessians_ using inner class 2014-11-27 17:47:45 +08:00
refactor QPSolver inprogress... Compiled but tests failed. 2014-12-09 19:13:57 +08:00			`const QP& qp_; //!< factor graphs of the QP problem, can't be modified!`
			`GaussianFactorGraph baseGraph_; //!< factor graphs of cost factors and linear equalities. The working set of inequalities will be added to this base graph in the process.`
			`VariableIndex costVariableIndex_, equalityVariableIndex_,`
			`inequalityVariableIndex_;`
			`FastSet<Key> constrainedKeys_; //!< all constrained keys, will become factors in the dual graph`
refactor QPSolver into its own class 2014-04-16 04:27:19 +08:00
			`public:`
			`/// Constructor`
refactor QPSolver inprogress... Compiled but tests failed. 2014-12-09 19:13:57 +08:00			`QPSolver(const QP& qp);`

			`/// Find solution with the current working set`
			`VectorValues solveWithCurrentWorkingSet(`
			`const LinearInequalityFactorGraph& workingSet) const;`

			`/// @name Build the dual graph`
			`/// @{`

			`/// Collect the Jacobian terms for a dual factor`
			`template<typename FACTOR>`
			`std::vector<std::pair<Key, Matrix> > collectDualJacobians(Key key,`
			`const FactorGraph<FACTOR>& graph,`
			`const VariableIndex& variableIndex) const {`
			`std::vector<std::pair<Key, Matrix> > Aterms;`
fix QPSolver unit tests 2014-12-10 05:27:11 +08:00			`if (variableIndex.find(key) != variableIndex.end()) {`
			`BOOST_FOREACH(size_t factorIx, variableIndex[key]){`
remove lpsolve 2014-12-17 00:27:20 +08:00			`typename FACTOR::shared_ptr factor = graph.at(factorIx);`
			`if (!factor->active()) continue;`
			`Matrix Ai = factor->getA(factor->find(key)).transpose();`
			`Aterms.push_back(std::make_pair(factor->dualKey(), Ai));`
refactor QPSolver inprogress... Compiled but tests failed. 2014-12-09 19:13:57 +08:00			`}`
remove lpsolve 2014-12-17 00:27:20 +08:00			`}`
refactor QPSolver inprogress... Compiled but tests failed. 2014-12-09 19:13:57 +08:00			`return Aterms;`
Headers and standard formatting 2014-11-26 16:04:34 +08:00			`}`
refactor QPSolver into its own class 2014-04-16 04:27:19 +08:00
refactor QPSolver inprogress... Compiled but tests failed. 2014-12-09 19:13:57 +08:00			`/// Create a dual factor`
			`JacobianFactor::shared_ptr createDualFactor(Key key,`
			`const LinearInequalityFactorGraph& workingSet,`
			`const VectorValues& delta) const;`
refactor QPSolver into its own class 2014-04-16 04:27:19 +08:00
			`/**`
			`* Build the dual graph to solve for the Lagrange multipliers.`
			`*`
			`* The Lagrangian function is:`
			`* L(X,lambdas) = f(X) - \sum_k lambda_k * c_k(X),`
			`* where the unconstrained part is`
			`* f(X) = 0.5X'GX - X'g + 0.5*f0`
			`* and the linear equality constraints are`
			`* c1(X), c2(X), ..., cm(X)`
			`*`
			`* Take the derivative of L wrt X at the solution and set it to 0, we have`
			`* \grad f(X) = \sum_k lambda_k * \grad c_k(X) (*)`
			`*`
			`* For each set of rows of (*) corresponding to a variable xi involving in some constraints`
			`* we have:`
			`* \grad f(xi) = \frac{\partial f}{\partial xi}' = \sum_j G_ij*xj - gi`
			`* \grad c_k(xi) = \frac{\partial c_k}{\partial xi}'`
			`*`
			`* Note: If xi does not involve in any constraint, we have the trivial condition`
			`* \grad f(Xi) = 0, which should be satisfied as a usual condition for unconstrained variables.`
			`*`
			`* So each variable xi involving in some constraints becomes a linear factor A*lambdas - b = 0`
			`* on the constraints' lambda multipliers, as follows:`
			`* - The jacobian term A_k for each lambda_k is \grad c_k(xi)`
			`* - The constant term b is \grad f(xi), which can be computed from all unconstrained`
			`* Hessian factors connecting to xi: \grad f(xi) = \sum_j G_ij*xj - gi`
			`*/`
refactor QPSolver inprogress... Compiled but tests failed. 2014-12-09 19:13:57 +08:00			`GaussianFactorGraph::shared_ptr buildDualGraph(`
			`const LinearInequalityFactorGraph& workingSet,`
			`const VectorValues& delta) const;`

			`/// @}`
refactor QPSolver into its own class 2014-04-16 04:27:19 +08:00
			`/**`
more informative comment 2014-11-27 07:53:45 +08:00			`* The goal of this function is to find currently active inequality constraints`
			`* that violate the condition to be active. The one that violates the condition`
			`* the most will be removed from the active set. See Nocedal06book, pg 469-471`
			`*`
Fixed up comments 2014-11-27 05:59:33 +08:00			`* Find the BAD active inequality that pulls x strongest to the wrong direction`
			`* of its constraint (i.e. it is pulling towards >0, while its feasible region is <=0)`
Headers and standard formatting 2014-11-26 16:04:34 +08:00			`*`
Fixed up comments 2014-11-27 05:59:33 +08:00			`* For active inequality constraints (those that are enforced as equality constraints`
			`* in the current working set), we want lambda < 0.`
Headers and standard formatting 2014-11-26 16:04:34 +08:00			`* This is because:`
Fixed up comments 2014-11-27 05:59:33 +08:00			`* - From the Lagrangian L = f - lambda*c, we know that the constraint force`
more informative comment 2014-11-27 07:53:45 +08:00			`* is (lambda * \grad c) = \grad f. Intuitively, to keep the solution x stay`
			`* on the constraint surface, the constraint force has to balance out with`
			`* other unconstrained forces that are pulling x towards the unconstrained`
			`* minimum point. The other unconstrained forces are pulling x toward (-\grad f),`
			`* hence the constraint force has to be exactly \grad f, so that the total`
			`* force is 0.`
			`* - We also know that at the constraint surface c(x)=0, \grad c points towards + (>= 0),`
			`* while we are solving for - (<=0) constraint.`
			`* - We want the constraint force (lambda * \grad c) to pull x towards the - (<=0) direction`
			`* i.e., the opposite direction of \grad c where the inequality constraint <=0 is satisfied.`
			`* That means we want lambda < 0.`
			`* - This is because when the constrained force pulls x towards the infeasible region (+),`
			`* the unconstrained force is pulling x towards the opposite direction into`
			`* the feasible region (again because the total force has to be 0 to make x stay still)`
			`* So we can drop this constraint to have a lower error but feasible solution.`
			`*`
			`* In short, active inequality constraints with lambda > 0 are BAD, because they`
			`* violate the condition to be active.`
Headers and standard formatting 2014-11-26 16:04:34 +08:00			`*`
more informative comment 2014-11-27 07:53:45 +08:00			`* And we want to remove the worst one with the largest lambda from the active set.`
Headers and standard formatting 2014-11-26 16:04:34 +08:00			`*`
			`*/`
remove lpsolve 2014-12-17 00:27:20 +08:00			`int identifyLeavingConstraint(const LinearInequalityFactorGraph& workingSet,`
Headers and standard formatting 2014-11-26 16:04:34 +08:00			`const VectorValues& lambdas) const;`
refactor QPSolver into its own class 2014-04-16 04:27:19 +08:00
			`/**`
			`* Compute step size alpha for the new solution x' = xk + alpha*p, where alpha \in [0,1]`
			`*`
			`* @return a tuple of (alpha, factorIndex, sigmaIndex) where (factorIndex, sigmaIndex)`
			`* is the constraint that has minimum alpha, or (-1,-1) if alpha = 1.`
			`* This constraint will be added to the working set and become active`
			`* in the next iteration`
			`*/`
refactor QPSolver to work with single-valued linear inequality factors. Unit tests passed. 2014-12-13 01:03:00 +08:00			`boost::tuple<double, int> computeStepSize(`
refactor QPSolver inprogress... Compiled but tests failed. 2014-12-09 19:13:57 +08:00			`const LinearInequalityFactorGraph& workingSet, const VectorValues& xk,`
Headers and standard formatting 2014-11-26 16:04:34 +08:00			`const VectorValues& p) const;`
refactor QPSolver into its own class 2014-04-16 04:27:19 +08:00
refactor QPSolver inprogress... Compiled but tests failed. 2014-12-09 19:13:57 +08:00			`/** Iterate 1 step, return a new state with a new workingSet and values */`
			`QPState iterate(const QPState& state) const;`
refactor QPSolver into its own class 2014-04-16 04:27:19 +08:00
fix QPSolver unit tests 2014-12-10 05:27:11 +08:00			`/**`
			`* Identify active constraints based on initial values.`
			`*/`
			`LinearInequalityFactorGraph identifyActiveConstraints(`
			`const LinearInequalityFactorGraph& inequalities,`
			`const VectorValues& initialValues) const;`

first unittest finding QP's feasible initial point works 2014-05-02 11:55:43 +08:00			`/** Optimize with a provided initial values`
			`* For this version, it is the responsibility of the caller to provide`
remove lpsolve 2014-12-17 00:27:20 +08:00			`* a feasible initial value.`
Support non positive definite Hessian factors while doing EliminatePreferCholesky with some constrained factors. Currently, when eliminating a constrained variable, EliminatePreferCholesky converts every other factors to JacobianFactor before doing the special QR factorization for constrained variables. Unfortunately, after a constrained nonlinear graph is linearized, new hessian factors from constraints, multiplied with the dual variable (-lambda*\hessian{c} terms in the Lagrangian objective function), might become negative definite, thus cannot be converted to JacobianFactors. Following EliminateCholesky, this version of EliminatePreferCholesky for constrained var gathers all unconstrained factors into a big joint HessianFactor before converting it into a JacobianFactor to be eliminiated by QR together with the other constrained factors. Of course, this might not solve the non-positive-definite problem entirely, because (1) the original hessian factors might be non-positive definite and (2) large strange value of lambdas might cause the joint factor non-positive definite [is this true?]. But at least, this will help in typical cases. 2014-05-04 06:04:37 +08:00			`* @return a pair of <primal, dual> solutions`
first unittest finding QP's feasible initial point works 2014-05-02 11:55:43 +08:00			`*/`
Headers and standard formatting 2014-11-26 16:04:34 +08:00			`std::pair<VectorValues, VectorValues> optimize(`
initials -> initialValues 2014-11-27 17:52:25 +08:00			`const VectorValues& initialValues) const;`
refactor QPSolver into its own class 2014-04-16 04:27:19 +08:00
			`};`

			`} /* namespace gtsam */`