mirror of
https://gitlab.com/libeigen/eigen.git
synced 2025-03-13 18:37:27 +08:00
389 lines
15 KiB
Plaintext
389 lines
15 KiB
Plaintext
/* Non-Negagive Least Squares Algorithm for Eigen.
|
|
*
|
|
* Copyright (C) 2021 Essex Edwards, <essex.edwards@gmail.com>
|
|
* Copyright (C) 2013 Hannes Matuschek, hannes.matuschek at uni-potsdam.de
|
|
*
|
|
* This Source Code Form is subject to the terms of the Mozilla
|
|
* Public License v. 2.0. If a copy of the MPL was not distributed
|
|
* with this file, You can obtain one at http://mozilla.org/MPL/2.0/.
|
|
*/
|
|
|
|
/** \defgroup nnls Non-Negative Least Squares (NNLS) Module
|
|
* This module provides a single class @c Eigen::NNLS implementing the NNLS algorithm.
|
|
* The algorithm is described in "SOLVING LEAST SQUARES PROBLEMS", by Charles L. Lawson and
|
|
* Richard J. Hanson, Prentice-Hall, 1974 and solves optimization problems of the form
|
|
*
|
|
* \f[ \min \left\Vert Ax-b\right\Vert_2^2\quad s.t.\, x\ge 0\,.\f]
|
|
*
|
|
* The algorithm solves the constrained least-squares problem above by iteratively improving
|
|
* an estimate of which constraints are active (elements of \f$x\f$ equal to zero)
|
|
* and which constraints are inactive (elements of \f$x\f$ greater than zero).
|
|
* Each iteration, an unconstrained linear least-squares problem solves for the
|
|
* components of \f$x\f$ in the (estimated) inactive set and the sets are updated.
|
|
* The unconstrained problem minimizes \f$\left\Vert A^Nx^N-b\right\Vert_2^2\f$,
|
|
* where \f$A^N\f$ is a matrix formed by selecting all columns of A which are
|
|
* in the inactive set \f$N\f$.
|
|
*
|
|
*/
|
|
|
|
#ifndef EIGEN_NNLS_H
|
|
#define EIGEN_NNLS_H
|
|
|
|
#include "../../Eigen/Core"
|
|
#include "../../Eigen/QR"
|
|
|
|
#include <limits>
|
|
|
|
namespace Eigen {
|
|
|
|
/** \ingroup nnls
|
|
* \class NNLS
|
|
* \brief Implementation of the Non-Negative Least Squares (NNLS) algorithm.
|
|
* \tparam MatrixType The type of the system matrix \f$A\f$.
|
|
*
|
|
* This class implements the NNLS algorithm as described in "SOLVING LEAST SQUARES PROBLEMS",
|
|
* Charles L. Lawson and Richard J. Hanson, Prentice-Hall, 1974. This algorithm solves a least
|
|
* squares problem iteratively and ensures that the solution is non-negative. I.e.
|
|
*
|
|
* \f[ \min \left\Vert Ax-b\right\Vert_2^2\quad s.t.\, x\ge 0 \f]
|
|
*
|
|
* The algorithm solves the constrained least-squares problem above by iteratively improving
|
|
* an estimate of which constraints are active (elements of \f$x\f$ equal to zero)
|
|
* and which constraints are inactive (elements of \f$x\f$ greater than zero).
|
|
* Each iteration, an unconstrained linear least-squares problem solves for the
|
|
* components of \f$x\f$ in the (estimated) inactive set and the sets are updated.
|
|
* The unconstrained problem minimizes \f$\left\Vert A^Nx^N-b\right\Vert_2^2\f$,
|
|
* where \f$A^N\f$ is a matrix formed by selecting all columns of A which are
|
|
* in the inactive set \f$N\f$.
|
|
*
|
|
* See <a href="https://en.wikipedia.org/wiki/Non-negative_least_squares">the
|
|
* wikipedia page on non-negative least squares</a> for more background information.
|
|
*
|
|
* \note Please note that it is possible to construct an NNLS problem for which the
|
|
* algorithm does not converge. In practice these cases are extremely rare.
|
|
*/
|
|
template <class MatrixType_>
|
|
class NNLS {
|
|
public:
|
|
typedef MatrixType_ MatrixType;
|
|
|
|
enum {
|
|
RowsAtCompileTime = MatrixType::RowsAtCompileTime,
|
|
ColsAtCompileTime = MatrixType::ColsAtCompileTime,
|
|
Options = MatrixType::Options,
|
|
MaxRowsAtCompileTime = MatrixType::MaxRowsAtCompileTime,
|
|
MaxColsAtCompileTime = MatrixType::MaxColsAtCompileTime
|
|
};
|
|
|
|
typedef typename MatrixType::Scalar Scalar;
|
|
typedef typename MatrixType::RealScalar RealScalar;
|
|
typedef typename MatrixType::Index Index;
|
|
|
|
/** Type of a row vector of the system matrix \f$A\f$. */
|
|
typedef Matrix<Scalar, ColsAtCompileTime, 1> SolutionVectorType;
|
|
/** Type of a column vector of the system matrix \f$A\f$. */
|
|
typedef Matrix<Scalar, RowsAtCompileTime, 1> RhsVectorType;
|
|
typedef Matrix<Index, ColsAtCompileTime, 1> IndicesType;
|
|
|
|
/** */
|
|
NNLS();
|
|
|
|
/** \brief Constructs a NNLS sovler and initializes it with the given system matrix @c A.
|
|
* \param A Specifies the system matrix.
|
|
* \param max_iter Specifies the maximum number of iterations to solve the system.
|
|
* \param tol Specifies the precision of the optimum.
|
|
* This is an absolute tolerance on the gradient of the Lagrangian, \f$A^T(Ax-b)-\lambda\f$
|
|
* (with Lagrange multipliers \f$\lambda\f$).
|
|
*/
|
|
NNLS(const MatrixType &A, Index max_iter = -1, Scalar tol = NumTraits<Scalar>::dummy_precision());
|
|
|
|
/** Initializes the solver with the matrix \a A for further solving NNLS problems.
|
|
*
|
|
* This function mostly initializes/computes the preconditioner. In the future
|
|
* we might, for instance, implement column reordering for faster matrix vector products.
|
|
*/
|
|
template <typename MatrixDerived>
|
|
NNLS<MatrixType> &compute(const EigenBase<MatrixDerived> &A);
|
|
|
|
/** \brief Solves the NNLS problem.
|
|
*
|
|
* The dimension of @c b must be equal to the number of rows of @c A, given to the constructor.
|
|
*
|
|
* \returns The approximate solution vector \f$ x \f$. Use info() to determine if the solve was a success or not.
|
|
* \sa info()
|
|
*/
|
|
const SolutionVectorType &solve(const RhsVectorType &b);
|
|
|
|
/** \brief Returns the solution if a problem was solved.
|
|
* If not, an uninitialized vector may be returned. */
|
|
const SolutionVectorType &x() const { return x_; }
|
|
|
|
/** \returns the tolerance threshold used by the stopping criteria.
|
|
* \sa setTolerance()
|
|
*/
|
|
Scalar tolerance() const { return tolerance_; }
|
|
|
|
/** Sets the tolerance threshold used by the stopping criteria.
|
|
*
|
|
* This is an absolute tolerance on the gradient of the Lagrangian, \f$A^T(Ax-b)-\lambda\f$
|
|
* (with Lagrange multipliers \f$\lambda\f$).
|
|
*/
|
|
NNLS<MatrixType> &setTolerance(const Scalar &tolerance) {
|
|
tolerance_ = tolerance;
|
|
return *this;
|
|
}
|
|
|
|
/** \returns the max number of iterations.
|
|
* It is either the value set by setMaxIterations or, by default, twice the number of columns of the matrix.
|
|
*/
|
|
Index maxIterations() const { return max_iter_ < 0 ? 2 * A_.cols() : max_iter_; }
|
|
|
|
/** Sets the max number of iterations.
|
|
* Default is twice the number of columns of the matrix.
|
|
* The algorithm requires at least k iterations to produce a solution vector with k non-zero entries.
|
|
*/
|
|
NNLS<MatrixType> &setMaxIterations(Index maxIters) {
|
|
max_iter_ = maxIters;
|
|
return *this;
|
|
}
|
|
|
|
/** \returns the number of iterations (least-squares solves) performed during the last solve */
|
|
Index iterations() const { return iterations_; }
|
|
|
|
/** \returns Success if the iterations converged, and an error values otherwise. */
|
|
ComputationInfo info() const { return info_; }
|
|
|
|
private:
|
|
/** \internal Adds the given index @c idx to the inactive set N and updates the QR decomposition of \f$A^N\f$. */
|
|
void moveToInactiveSet_(Index idx);
|
|
|
|
/** \internal Removes the given index idx from the inactive set N and updates the QR decomposition of \f$A^N\f$. */
|
|
void moveToActiveSet_(Index idx);
|
|
|
|
/** \internal Solves the least-squares problem \f$\left\Vert y-A^Nx\right\Vert_2^2\f$. */
|
|
void solveInactiveSet_(const RhsVectorType &b);
|
|
|
|
private:
|
|
typedef Matrix<Scalar, ColsAtCompileTime, ColsAtCompileTime> MatrixAtAType;
|
|
|
|
/** \internal Holds the maximum number of iterations for the NNLS algorithm.
|
|
* @c -1 means to use the default value. */
|
|
Index max_iter_;
|
|
/** \internal Holds the number of iterations. */
|
|
Index iterations_;
|
|
/** \internal Holds success/fail of the last solve. */
|
|
ComputationInfo info_;
|
|
/** \internal Size of the inactive set. */
|
|
Index numInactive_;
|
|
/** \internal Accuracy of the algorithm w.r.t the optimality of the solution (gradient). */
|
|
Scalar tolerance_;
|
|
/** \internal The system matrix, a copy of the one given to the constructor. */
|
|
MatrixType A_;
|
|
/** \internal Precomputed product \f$A^TA\f$. */
|
|
MatrixAtAType AtA_;
|
|
/** \internal Will hold the solution. */
|
|
SolutionVectorType x_;
|
|
/** \internal Will hold the current gradient.\f$A^Tb - A^TAx\f$ */
|
|
SolutionVectorType gradient_;
|
|
/** \internal Will hold the partial solution. */
|
|
SolutionVectorType y_;
|
|
/** \internal Precomputed product \f$A^Tb\f$. */
|
|
SolutionVectorType Atb_;
|
|
/** \internal Holds the current permutation partitioning the active and inactive sets.
|
|
* The first @c numInactive_ elements form the inactive set and the rest the active set. */
|
|
IndicesType index_sets_;
|
|
/** \internal QR decomposition to solve the (inactive) sub system (together with @c qrCoeffs_). */
|
|
MatrixType QR_;
|
|
/** \internal QR decomposition to solve the (inactive) sub system (together with @c QR_). */
|
|
SolutionVectorType qrCoeffs_;
|
|
/** \internal Some workspace for QR decomposition. */
|
|
SolutionVectorType tempSolutionVector_;
|
|
RhsVectorType tempRhsVector_;
|
|
};
|
|
|
|
/* ********************************************************************************************
|
|
* Implementation
|
|
* ******************************************************************************************** */
|
|
|
|
template <typename MatrixType>
|
|
NNLS<MatrixType>::NNLS()
|
|
: max_iter_(-1),
|
|
iterations_(0),
|
|
info_(ComputationInfo::InvalidInput),
|
|
numInactive_(0),
|
|
tolerance_(NumTraits<Scalar>::dummy_precision()) {}
|
|
|
|
template <typename MatrixType>
|
|
NNLS<MatrixType>::NNLS(const MatrixType &A, Index max_iter, Scalar tol) : max_iter_(max_iter), tolerance_(tol) {
|
|
compute(A);
|
|
}
|
|
|
|
template <typename MatrixType>
|
|
template <typename MatrixDerived>
|
|
NNLS<MatrixType> &NNLS<MatrixType>::compute(const EigenBase<MatrixDerived> &A) {
|
|
// Ensure Scalar type is real. The non-negativity constraint doesn't obviously extend to complex numbers.
|
|
EIGEN_STATIC_ASSERT(!NumTraits<Scalar>::IsComplex, NUMERIC_TYPE_MUST_BE_REAL);
|
|
|
|
// max_iter_: unchanged
|
|
iterations_ = 0;
|
|
info_ = ComputationInfo::Success;
|
|
numInactive_ = 0;
|
|
// tolerance: unchanged
|
|
A_ = A.derived();
|
|
AtA_.noalias() = A_.transpose() * A_;
|
|
x_.resize(A_.cols());
|
|
gradient_.resize(A_.cols());
|
|
y_.resize(A_.cols());
|
|
Atb_.resize(A_.cols());
|
|
index_sets_.resize(A_.cols());
|
|
QR_.resize(A_.rows(), A_.cols());
|
|
qrCoeffs_.resize(A_.cols());
|
|
tempSolutionVector_.resize(A_.cols());
|
|
tempRhsVector_.resize(A_.rows());
|
|
|
|
return *this;
|
|
}
|
|
|
|
template <typename MatrixType>
|
|
const typename NNLS<MatrixType>::SolutionVectorType &NNLS<MatrixType>::solve(const RhsVectorType &b) {
|
|
// Initialize solver
|
|
iterations_ = 0;
|
|
info_ = ComputationInfo::NumericalIssue;
|
|
x_.setZero();
|
|
|
|
index_sets_ = IndicesType::LinSpaced(A_.cols(), 0, A_.cols() - 1); // Identity permutation.
|
|
numInactive_ = 0;
|
|
|
|
// Precompute A^T*b
|
|
Atb_.noalias() = A_.transpose() * b;
|
|
|
|
const Index maxIterations = this->maxIterations();
|
|
|
|
// OUTER LOOP
|
|
while (true) {
|
|
// Early exit if all variables are inactive, which breaks 'maxCoeff' below.
|
|
if (A_.cols() == numInactive_) {
|
|
info_ = ComputationInfo::Success;
|
|
return x_;
|
|
}
|
|
|
|
// Find the maximum element of the gradient in the active set.
|
|
// If it is small or negative, then we have converged.
|
|
// Else, we move that variable to the inactive set.
|
|
gradient_.noalias() = Atb_ - AtA_ * x_;
|
|
|
|
const Index numActive = A_.cols() - numInactive_;
|
|
Index argmaxGradient = -1;
|
|
const Scalar maxGradient = gradient_(index_sets_.tail(numActive)).maxCoeff(&argmaxGradient);
|
|
argmaxGradient += numInactive_; // beacause tail() skipped the first numInactive_ elements
|
|
|
|
if (maxGradient < tolerance_) {
|
|
info_ = ComputationInfo::Success;
|
|
return x_;
|
|
}
|
|
|
|
moveToInactiveSet_(argmaxGradient);
|
|
|
|
// INNER LOOP
|
|
while (true) {
|
|
// Check if max. number of iterations is reached
|
|
if (iterations_ >= maxIterations) {
|
|
info_ = ComputationInfo::NoConvergence;
|
|
return x_;
|
|
}
|
|
|
|
// Solve least-squares problem in inactive set only,
|
|
// this step is rather trivial as moveToInactiveSet_ & moveToActiveSet_
|
|
// updates the QR decomposition of inactive columns A^N.
|
|
// solveInactiveSet_ puts the solution in y_
|
|
solveInactiveSet_(b);
|
|
++iterations_; // The solve is expensive, so that is what we count as an iteration.
|
|
|
|
// Check feasability...
|
|
bool feasible = true;
|
|
Scalar alpha = NumTraits<Scalar>::highest();
|
|
Index infeasibleIdx = -1; // Which variable became infeasible first.
|
|
for (Index i = 0; i < numInactive_; i++) {
|
|
Index idx = index_sets_[i];
|
|
if (y_(idx) < 0) {
|
|
// t should always be in [0,1].
|
|
Scalar t = -x_(idx) / (y_(idx) - x_(idx));
|
|
if (alpha > t) {
|
|
alpha = t;
|
|
infeasibleIdx = i;
|
|
feasible = false;
|
|
}
|
|
}
|
|
}
|
|
eigen_assert(feasible || 0 <= infeasibleIdx);
|
|
|
|
// If solution is feasible, exit to outer loop
|
|
if (feasible) {
|
|
x_ = y_;
|
|
break;
|
|
}
|
|
|
|
// Infeasible solution -> interpolate to feasible one
|
|
for (Index i = 0; i < numInactive_; i++) {
|
|
Index idx = index_sets_[i];
|
|
x_(idx) += alpha * (y_(idx) - x_(idx));
|
|
}
|
|
|
|
// Remove these indices from the inactive set and update QR decomposition
|
|
moveToActiveSet_(infeasibleIdx);
|
|
}
|
|
}
|
|
}
|
|
|
|
template <typename MatrixType>
|
|
void NNLS<MatrixType>::moveToInactiveSet_(Index idx) {
|
|
// Update permutation matrix:
|
|
std::swap(index_sets_(idx), index_sets_(numInactive_));
|
|
numInactive_++;
|
|
|
|
// Perform rank-1 update of the QR decomposition stored in QR_ & qrCoeff_
|
|
internal::householder_qr_inplace_update(QR_, qrCoeffs_, A_.col(index_sets_(numInactive_ - 1)), numInactive_ - 1,
|
|
tempSolutionVector_.data());
|
|
}
|
|
|
|
template <typename MatrixType>
|
|
void NNLS<MatrixType>::moveToActiveSet_(Index idx) {
|
|
// swap index with last inactive one & reduce number of inactive columns
|
|
std::swap(index_sets_(idx), index_sets_(numInactive_ - 1));
|
|
numInactive_--;
|
|
// Update QR decomposition starting from the removed index up to the end [idx, ..., numInactive_]
|
|
for (Index i = idx; i < numInactive_; i++) {
|
|
Index col = index_sets_(i);
|
|
internal::householder_qr_inplace_update(QR_, qrCoeffs_, A_.col(col), i, tempSolutionVector_.data());
|
|
}
|
|
}
|
|
|
|
template <typename MatrixType>
|
|
void NNLS<MatrixType>::solveInactiveSet_(const RhsVectorType &b) {
|
|
eigen_assert(numInactive_ > 0);
|
|
|
|
tempRhsVector_ = b;
|
|
|
|
// tmpRHS(0:numInactive_-1) := Q'*b
|
|
// tmpRHS(numInactive_:end) := useless stuff we would rather not compute at all.
|
|
tempRhsVector_.applyOnTheLeft(
|
|
householderSequence(QR_.leftCols(numInactive_), qrCoeffs_.head(numInactive_)).transpose());
|
|
|
|
// tempSol(0:numInactive_-1) := inv(R) * Q' * b
|
|
// = the least-squares solution for the inactive variables.
|
|
tempSolutionVector_.head(numInactive_) = //
|
|
QR_.topLeftCorner(numInactive_, numInactive_) //
|
|
.template triangularView<Upper>() //
|
|
.solve(tempRhsVector_.head(numInactive_)); //
|
|
|
|
// tempSol(numInactive_:end) := 0 = the value for the constrained variables.
|
|
tempSolutionVector_.tail(y_.size() - numInactive_).setZero();
|
|
|
|
// Back permute into original column order of A
|
|
y_.noalias() = index_sets_.asPermutation() * tempSolutionVector_.head(y_.size());
|
|
}
|
|
|
|
} // namespace Eigen
|
|
|
|
#endif // EIGEN_NNLS_H
|