Object/Programmer/_least_squares_8cpp_source.html

/* SPDX-License-Identifier: CC0-1.0 */

#include "jama/jama_svd.h"

#include "jama/jama_qr.h"


#include <armadillo>


#include "LeastSquares.h"

#include "IException.h"

#include "IString.h"


namespace Isis {


  /**
   * Creates a LeastSquares object bound to the given basis function.
   *
   * @param basis      Basis function whose coefficients are solved for. Only
   *                   its address is stored, so it must outlive this object.
   * @param sparse     When true, knowns are written straight into the sparse
   *                   design matrix instead of being kept in p_input.
   * @param sparseRows Row count used to size the sparse design matrix.
   * @param sparseCols Column count used to size the sparse design matrix,
   *                   the normal equations and the right-hand side.
   * @param jigsaw     When true (and sparse), the per-parameter correction
   *                   and weight vectors are allocated as well.
   *
   * @throws IException::Programmer if sparse is true and either dimension is
   *                                not a positive number.
   */
  LeastSquares::LeastSquares(Isis::BasisFunction &basis, bool sparse,
                             int sparseRows, int sparseCols, bool jigsaw) {
    p_jigsaw = jigsaw;
    p_basis = &basis;
    p_solved = false;
    p_sparse = sparse;
    p_sigma0 = 0.;

    p_sparseRows = sparseRows;
    p_sparseCols = sparseCols;

    // Give the bookkeeping members a defined starting value.  SolveSparse()
    // reads p_constrainedParameters when computing the degrees of freedom, and
    // SolveQRD() never assigns p_degreesOfFreedom, so neither may be left
    // uninitialized.
    p_constrainedParameters = 0;
    p_degreesOfFreedom = 0;

    // -1 means "no row filled yet"; FillSparseA() pre-increments it.
    p_currentFillRow = -1;

    if (p_sparse) {

      // make sure usable sparse nrows/ncols have been set (a negative size
      // would otherwise be converted to a huge unsigned matrix dimension)
      if (sparseRows <= 0  ||  sparseCols <= 0) {
        QString msg = "If solving using sparse matrices, you must enter the "
                      "number of rows/columns";
        throw IException(IException::Programmer, msg, _FILEINFO_);
      }

      p_sparseA.set_size(sparseRows, sparseCols);
      p_normals.set_size(sparseCols, sparseCols);
      p_ATb.resize(sparseCols, 1);
      p_xSparse.resize(sparseCols);

      if (p_jigsaw) {
        // running total of parameter corrections starts at zero
        p_epsilonsSparse.assign(sparseCols, 0.0);
        p_parameterWeights.resize(sparseCols);
      }
    }
  }


  /**
   * Destroys the LeastSquares object.  Nothing is released explicitly here;
   * the basis function is only referenced through p_basis and is not deleted.
   */
  LeastSquares::~LeastSquares() {}


  /**
   * Registers one known (observation) with the solver.
   *
   * @param data   Input variables for this known; its length must equal
   *               p_basis->Variables().
   * @param result Expected value for this known.
   * @param weight Weight of this known; its square root is stored.
   *
   * @throws IException::Programmer if data has the wrong number of elements.
   */
  void LeastSquares::AddKnown(const std::vector<double> &data, double result,
                              double weight) {
    const int suppliedCount = (int) data.size();
    if (suppliedCount != p_basis->Variables()) {
      QString msg = "Number of elements in data does not match basis [" +
                        p_basis->Name() + "] requirements";
      throw IException(IException::Programmer, msg, _FILEINFO_);
    }

    p_expected.push_back(result);

    // A unit weight is stored untouched; anything else is stored as its root.
    const double rootWeight = (weight == 1) ? weight : sqrt(weight);
    p_sqrtWeight.push_back(rootWeight);

    // The root weight must be stored before FillSparseA(), which reads it.
    if (!p_sparse) {
      p_input.push_back(data);
      return;
    }

    FillSparseA(data);
  }


  void LeastSquares::FillSparseA(const std::vector<double> &data) {


    p_basis->Expand(data);


    p_currentFillRow++;


    int ncolumns = (int)data.size();


    for(int c = 0;  c < ncolumns; c++) {

      p_sparseA(p_currentFillRow, c) = p_basis->Term(c) * p_sqrtWeight[p_currentFillRow];

    }

  }


  /**
   * Returns a copy of the input variables stored for the given row.
   *
   * @param row Zero-based index of the known; must be less than Rows().
   *
   * @return The input vector that was passed to AddKnown for that row.
   *
   * @throws IException::Programmer if row is negative or not less than Rows().
   */
  std::vector<double> LeastSquares::GetInput(int row) const {
    const bool withinRange = (row >= 0) && (row < Rows());
    if (!withinRange) {
      QString msg = "Index out of bounds [Given = " + toString(row) + "]";
      throw IException(IException::Programmer, msg, _FILEINFO_);
    }

    return p_input[row];
  }


  /**
   * Returns the expected value stored for the given row.
   *
   * The index is validated against p_expected itself.  Rows() counts p_input,
   * which AddKnown only fills in non-sparse mode, so checking against Rows()
   * rejected every index for a sparse solver even though p_expected holds the
   * values.  In non-sparse mode both vectors grow together, so the accepted
   * range there is unchanged.
   *
   * @param row Zero-based index of the known.
   *
   * @return The expected value that was passed to AddKnown for that row.
   *
   * @throws IException::Programmer if row is outside the stored expected
   *                                values.
   */
  double LeastSquares::GetExpected(int row) const {
    if ((row < 0) || (row >= (int)p_expected.size())) {
      QString msg = "Index out of bounds [Given = " + toString(row) + "]";
      throw IException(IException::Programmer, msg, _FILEINFO_);
    }

    return p_expected[row];
  }


  /**
   * Returns the number of knowns held in p_input.
   *
   * @return The size of p_input as an int.  AddKnown does not append to
   *         p_input in sparse mode.
   */
  int LeastSquares::Rows() const {
    const int storedRows = (int)p_input.size();
    return storedRows;
  }


  /**
   * Solves the system with the requested method after the knowns have been
   * registered.
   *
   * @param method SVD, QRD or SPARSE.
   *
   * @return The value returned by SolveSparse() for SPARSE, otherwise 0.
   *
   * @throws IException::Unknown if there is nothing to solve: zero sparse
   *                             rows for SPARSE, or zero stored rows for the
   *                             other methods.
   */
  int LeastSquares::Solve(Isis::LeastSquares::SolveMethod method) {

    // The sparse solver is sized up front; the dense solvers count p_input.
    const bool nothingToSolve = (method == SPARSE) ? (p_sparseRows == 0)
                                                   : (Rows() == 0);
    if (nothingToSolve) {
      p_solved = false;
      QString msg = "No solution available because no input data was provided";
      throw IException(IException::Unknown, msg, _FILEINFO_);
    }

    switch (method) {
      case SVD:
        SolveSVD();
        break;

      case QRD:
        SolveQRD();
        break;

      case SPARSE:
        return SolveSparse();

      default:
        break;
    }

    return 0;
  }


  /**
   * Solves the weighted system Ax=b with a singular value decomposition and
   * stores the coefficients in the basis function.
   *
   * On success the residuals, degrees of freedom and sigma0 are recomputed
   * from scratch, so the method can be called again (for example after
   * Weight() changed a weight) without earlier results leaking in.
   *
   * @throws IException::Unknown if fewer coefficients than required come out
   *                             of the decomposition.
   */
  void LeastSquares::SolveSVD() {

    const int numObservations = (int)p_input.size();
    const int numUnknowns = p_basis->Coefficients();

    // We are solving Ax=b ... start by creating A, one weighted row per known
    TNT::Array2D<double> A(numObservations, numUnknowns);
    for (int r = 0; r < A.dim1(); r++) {
      p_basis->Expand(p_input[r]);
      for (int c = 0; c < A.dim2(); c++) {
        A[r][c] = p_basis->Term(c) * p_sqrtWeight[r];
      }
    }

    // Use singular value decomposition to solve for the coefficients
    // A = [U][S][V']  where [U] is MxN, [S] is NxN, [V'] is NxN transpose
    // of [V].  We are solving for [A]x=b and need inverse of [A] such
    // that x = [invA]b. Since inverse may not exist we use the
    // pseudo-inverse [A+] from SVD which is [A+] = [V][invS][U']
    // Our coefficients are then x = [A+]b where b is the weighted p_expected.
    JAMA::SVD<double> svd(A);

    TNT::Array2D<double> V;
    svd.getV(V);

    // The inverse of S is 1 over each non-zero diagonal element of S
    TNT::Array2D<double> invS;
    svd.getS(invS);

    for (int i = 0; i < invS.dim1(); i++) {
      if (invS[i][i] != 0.0) invS[i][i] = 1.0 / invS[i][i];
    }

    // Transpose U
    TNT::Array2D<double> U;
    svd.getU(U);
    TNT::Array2D<double> transU(U.dim2(), U.dim1());

    for (int r = 0; r < U.dim1(); r++) {
      for (int c = 0; c < U.dim2(); c++) {
        transU[c][r] = U[r][c];
      }
    }

    // Now multiply everything together to get [A+]
    TNT::Array2D<double> VinvS = TNT::matmult(V, invS);
    TNT::Array2D<double> Aplus = TNT::matmult(VinvS, transU);

    // Using Aplus and our weighted b we can solve for the coefficients
    TNT::Array2D<double> b(p_expected.size(), 1);

    for (int r = 0; r < (int)p_expected.size(); r++) {
      b[r][0] = p_expected[r] * p_sqrtWeight[r];
    }

    TNT::Array2D<double> coefs = TNT::matmult(Aplus, b);

    // If the rank of the matrix is not large enough we don't
    // have enough coefficients for the solution
    if (coefs.dim1() < p_basis->Coefficients()) {
      QString msg = "Unable to solve least-squares using SVD method. No "
                    "solution available. Not enough knowns or knowns are "
                    "co-linear ... [Unknowns = "
                    + toString(p_basis->Coefficients()) + "] [Knowns = "
                    + toString(coefs.dim1()) + "]";
      throw IException(IException::Unknown, msg, _FILEINFO_);
    }

    // Set the coefficients in our basis equation
    std::vector<double> bcoefs;
    bcoefs.reserve(coefs.dim1());
    for (int i = 0; i < coefs.dim1(); i++) bcoefs.push_back(coefs[i][0]);

    p_basis->SetCoefficients(bcoefs);

    // Compute the errors.  Start from an empty residual vector and a zero sum
    // so a repeated solve does not append to, or read, earlier results.
    p_residuals.clear();
    p_residuals.reserve(p_input.size());
    double weightedSquaredSum = 0.0;

    for (int i = 0; i < (int)p_input.size(); i++) {
      const double residual = p_basis->Evaluate(p_input[i]) - p_expected[i];
      p_residuals.push_back(residual);
      weightedSquaredSum += residual*residual*p_sqrtWeight[i]*p_sqrtWeight[i];
    }

    // calculate degrees of freedom (or redundancy)
    // DOF = # observations + # constrained parameters - # unknown parameters
    // (this solver has no constrained parameters).  The previous expression,
    // Coefficients() - coefs.dim1(), could never be positive once the rank
    // check above had passed, so sigma0 was never normalized.
    p_degreesOfFreedom = numObservations - numUnknowns;

    if (p_degreesOfFreedom > 0) {
      weightedSquaredSum = weightedSquaredSum/(double)p_degreesOfFreedom;
    }

    p_sigma0 = sqrt(weightedSquaredSum);

    // All done
    p_solved = true;
  }


  /**
   * Solves the weighted system Ax=b with a QR decomposition and stores the
   * coefficients in the basis function.
   *
   * On success the residuals are recomputed from scratch, so the method can
   * be called again without appending to the residuals of an earlier solve.
   * This method does not update p_sigma0 or p_degreesOfFreedom.
   *
   * @throws IException::Unknown if the decomposition reports that the matrix
   *                             is not full rank.
   */
  void LeastSquares::SolveQRD() {

    // We are solving Ax=b ... start by creating an MxN matrix, A
    TNT::Array2D<double> A(p_input.size(), p_basis->Coefficients());
    for (int r = 0; r < A.dim1(); r++) {
      p_basis->Expand(p_input[r]);
      for (int c = 0; c < A.dim2(); c++) {
        A[r][c] = p_basis->Term(c) * p_sqrtWeight[r];
      }
    }

    // Use QR decomposition to solve for the coefficients
    // [A] = [Q][R]  where [Q] is MxN and orthogonal and  [R] is an NxN,
    // upper triangular matrix.  TNT provides the solve method that inverts
    // [Q] and backsolves [R] to get the coefficients in the vector x.
    // That is, we solve the system Rx = Q^T b
    JAMA::QR<double> qr(A);

    // Using A and our weighted b we can solve for the coefficients.
    // By construction the size of b is equal to M, so b is conformant.
    TNT::Array1D<double> b(p_expected.size());
    for (int r = 0; r < (int)p_expected.size(); r++) {
      b[r] = p_expected[r] * p_sqrtWeight[r];
    }

    // Check to make sure the matrix is full rank before solving
    // -- rectangular matrices must be full rank in order for the solve method
    //    to be successful
    int full = qr.isFullRank();
    if (full == 0) {
      QString msg = "Unable to solve-least squares using QR Decomposition. "
                    "The upper triangular R matrix is not full rank";
      throw IException(IException::Unknown, msg, _FILEINFO_);
    }

    TNT::Array1D<double> coefs = qr.solve(b);

    // Set the coefficients in our basis equation
    std::vector<double> bcoefs;
    bcoefs.reserve(coefs.dim1());
    for (int i = 0; i < coefs.dim1(); i++) {
      bcoefs.push_back(coefs[i]);
    }
    p_basis->SetCoefficients(bcoefs);

    // Compute the errors.  Start from an empty vector so a repeated solve
    // replaces, rather than extends, the residuals of the previous one.
    p_residuals.clear();
    p_residuals.reserve(p_input.size());
    for (int i = 0; i < (int)p_input.size(); i++) {
      double value = p_basis->Evaluate(p_input[i]);
      p_residuals.push_back(value - p_expected[i]);
    }

    // All done
    p_solved = true;
  }


  /**
   * Solves the system through the normal equations built from the sparse
   * design matrix, then stores the coefficients in the basis function and
   * recomputes the residuals, degrees of freedom and sigma0.
   *
   * When p_jigsaw is set, positive parameter weights are added to the
   * diagonal of the normal equations, the right-hand side is adjusted by the
   * accumulated corrections, and those corrections are updated with the new
   * solution and contribute to sigma0.
   *
   * @return Always 0.
   *
   * @throws IException::Unknown if fewer knowns were added than the matrix
   *                             has rows, or if the sparse solver fails.
   */
  int LeastSquares::SolveSparse() {

    // Every one of the p_sparseRows rows is read from p_expected and
    // p_sqrtWeight below, so all of them must have been supplied.
    if ((int)p_expected.size() < p_sparseRows  ||
        (int)p_sqrtWeight.size() < p_sparseRows) {
      QString msg = "No solution available because fewer knowns [" +
                    toString((int)p_expected.size()) +
                    "] were provided than sparse rows [" +
                    toString(p_sparseRows) + "]";
      throw IException(IException::Unknown, msg, _FILEINFO_);
    }

    // form "normal equations" matrix by multiplying ATA
    p_normals = p_sparseA.t()*p_sparseA;

    // Create the right-hand-side column vector 'b'
    arma::mat b(p_sparseRows, 1);

    // multiply each element of 'b' by its associated weight
    for (int r = 0; r < p_sparseRows; r++) {
      b(r,0) = p_expected[r] * p_sqrtWeight[r];
    }

    // form ATb
    p_ATb = p_sparseA.t()*b;

    // apply parameter weighting if Jigsaw (bundle adjustment)
    if (p_jigsaw) {
      for (int i = 0; i < p_sparseCols; i++) {
        double weight = p_parameterWeights[i];

        // only parameters with a positive weight are constrained
        if (weight <= 0.0)
          continue;

        p_normals(i, i) += weight;
        p_ATb(i, 0) -= p_epsilonsSparse[i]*weight;
      }
    }

    bool status = spsolve(p_xSparse, p_normals, p_ATb, "superlu");

    if (status == false) {
      QString msg = "Could not solve sparse least squares problem.";
      throw IException(IException::Unknown, msg, _FILEINFO_);
    }

    // Set the coefficients in our basis equation
    p_basis->SetCoefficients(arma::conv_to< std::vector<double> >::from(p_xSparse));

    // if Jigsaw (bundle adjustment)
    // add corrections into epsilon vector (keeping track of total corrections)
    if (p_jigsaw) {
      for (int i = 0; i < p_sparseCols; i++) {
        p_epsilonsSparse[i] += p_xSparse[i];
      }
    }

    // Compute the image coordinate residuals and sum into Sigma0
    // (note this is exactly what was being done before, but with less overhead - I think)
    // ultimately, we should not be using the A matrix but forming the normals
    // directly. Then we'll have to compute the residuals by back projection

    // The assignment replaces the whole vector, so no prior resize is needed.
    p_residuals = arma::conv_to< std::vector<double> >::from(p_sparseA*p_xSparse);
    p_sigma0 = 0.0;

    for (int i = 0; i < p_sparseRows; i++) {
      // undo the row weighting applied when the matrix was filled, then
      // subtract the expected value
      p_residuals[i] = p_residuals[i]/p_sqrtWeight[i];
      p_residuals[i] -= p_expected[i];
      p_sigma0 += p_residuals[i]*p_residuals[i]*p_sqrtWeight[i]*p_sqrtWeight[i];
    }

    // if Jigsaw (bundle adjustment)
    // add contribution to Sigma0 from constrained parameters
    if (p_jigsaw) {
      double constrained_vTPv = 0.0;

      for (int i = 0; i < p_sparseCols; i++) {
        double weight = p_parameterWeights[i];

        if (weight <= 0.0)
          continue;

        constrained_vTPv += p_epsilonsSparse[i]*p_epsilonsSparse[i]*weight;
      }
      p_sigma0 += constrained_vTPv;
    }

    // calculate degrees of freedom (or redundancy)
    // DOF = # observations + # constrained parameters - # unknown parameters
    p_degreesOfFreedom = p_sparseRows + p_constrainedParameters - p_sparseCols;

    // without redundancy the reference variance is fixed at 1
    if (p_degreesOfFreedom <= 0.0) {
      p_sigma0 = 1.0;
    }
    else {
      p_sigma0 = p_sigma0/(double)p_degreesOfFreedom;
    }

    p_sigma0 = sqrt(p_sigma0);

    // All done
    p_solved = true;
    return 0;
  }


  /**
   * Discards the registered knowns and any solution so the object can be
   * reused.  In sparse mode the design matrix, right-hand side and normal
   * equations are zeroed and the fill row is rewound; otherwise the stored
   * inputs are cleared.
   */
  void LeastSquares::Reset() {
    if (!p_sparse) {
      p_input.clear();
    }
    else {
      p_sparseA.zeros();
      p_ATb.zeros();
      p_normals.zeros();
      p_currentFillRow = -1;   // next FillSparseA() call writes row 0
    }

    // State shared by both storage modes
    p_sigma0 = 0.;
    p_residuals.clear();
    p_expected.clear();
    p_sqrtWeight.clear();
    p_solved = false;
  }


  /**
   * Evaluates the basis function on the given input once a solution exists.
   *
   * @param data Input variables forwarded to the basis function.
   *
   * @return The value returned by p_basis->Evaluate(data).
   *
   * @throws IException::Programmer if no solution has been computed yet.
   */
  double LeastSquares::Evaluate(const std::vector<double> &data) {
    if (p_solved) {
      return p_basis->Evaluate(data);
    }

    QString msg = "Unable to evaluate until a solution has been computed";
    throw IException(IException::Programmer, msg, _FILEINFO_);
  }


  /**
   * Returns a copy of the residuals computed by the last solve.
   *
   * @return The contents of p_residuals.
   *
   * @throws IException::Programmer if no solution has been computed yet.
   */
  std::vector<double> LeastSquares::Residuals() const {
    if (p_solved) {
      return p_residuals;
    }

    QString msg = "Unable to return residuals until a solution has been computed";
    throw IException(IException::Programmer, msg, _FILEINFO_);
  }


  /**
   * Returns the ith residual computed by the last solve.
   *
   * @param i Zero-based index into the residuals.
   *
   * @return The residual stored at index i.
   *
   * @throws IException::Programmer if no solution has been computed yet, or
   *                                if i is outside the stored residuals.
   */
  double LeastSquares::Residual(int i) const {
    if (!p_solved) {
      QString msg = "Unable to return residuals until a solution has been computed";
      throw IException(IException::Programmer, msg, _FILEINFO_);
    }

    // Same bounds handling as GetInput/GetExpected instead of an unchecked
    // vector access.
    if ((i < 0) || (i >= (int)p_residuals.size())) {
      QString msg = "Index out of bounds [Given = " + toString(i) + "]";
      throw IException(IException::Programmer, msg, _FILEINFO_);
    }

    return p_residuals[i];
  }


  void LeastSquares::Weight(int index, double weight) {

    if(weight == 1) {

      p_sqrtWeight[index] = weight;

    }

    else {

      p_sqrtWeight[index] = sqrt(weight);

    }

  }


} // end namespace isis

Isis::BasisFunction
Generic linear equation class.
Definition BasisFunction.h:48

Isis::IException
Isis exception class.
Definition IException.h:91

Isis::IException::Unknown
@ Unknown
A type of error that cannot be classified as any of the other error types.
Definition IException.h:118

Isis::IException::Programmer
@ Programmer
This error is for when a programmer made an API call that was illegal.
Definition IException.h:146

Isis::LeastSquares::p_xSparse
arma::mat p_xSparse
sparse solution matrix
Definition LeastSquares.h:151

Isis::LeastSquares::p_normals
arma::SpMat< double > p_normals
normal equations matrix 'N'
Definition LeastSquares.h:156

Isis::LeastSquares::GetExpected
double GetExpected(int row) const
This method returns the expected value at the given row.
Definition LeastSquares.cpp:173

Isis::LeastSquares::Weight
void Weight(int index, double weight)
Reset the weight for the ith known.
Definition LeastSquares.cpp:614

Isis::LeastSquares::p_sigma0
double p_sigma0
sigma nought - reference variance
Definition LeastSquares.h:170

Isis::LeastSquares::SolveSparse
int SolveSparse()
Solve using sparse class.
Definition LeastSquares.cpp:428

Isis::LeastSquares::p_sparseA
arma::SpMat< double > p_sparseA
design matrix 'A'
Definition LeastSquares.h:155

Isis::LeastSquares::p_parameterWeights
std::vector< double > p_parameterWeights
vector of parameter weights
Definition LeastSquares.h:153

Isis::LeastSquares::Residual
double Residual(int i) const
Returns the ith residual.
Definition LeastSquares.cpp:590

Isis::LeastSquares::p_solved
bool p_solved
Boolean value indicating solution is complete.
Definition LeastSquares.h:162

Isis::LeastSquares::Rows
int Rows() const
This method returns the number of rows in the matrix.
Definition LeastSquares.cpp:187

Isis::LeastSquares::p_basis
Isis::BasisFunction * p_basis
Pointer to the BasisFunction object.
Definition LeastSquares.h:183

Isis::LeastSquares::~LeastSquares
~LeastSquares()
Destroys the LeastSquares object.
Definition LeastSquares.cpp:62

Isis::LeastSquares::SolveMethod
SolveMethod
Definition LeastSquares.h:112

Isis::LeastSquares::SPARSE
@ SPARSE
Sparse.
Definition LeastSquares.h:114

Isis::LeastSquares::QRD
@ QRD
QR Decomposition.
Definition LeastSquares.h:113

Isis::LeastSquares::SVD
@ SVD
Singular Value Decomposition.
Definition LeastSquares.h:112

Isis::LeastSquares::Evaluate
double Evaluate(const std::vector< double > &input)
Invokes the BasisFunction Evaluate method.
Definition LeastSquares.cpp:553

Isis::LeastSquares::p_input
std::vector< std::vector< double > > p_input
A vector of the input variables to evaluate.
Definition LeastSquares.h:172

Isis::LeastSquares::p_constrainedParameters
int p_constrainedParameters
constrained parameters
Definition LeastSquares.h:167

Isis::LeastSquares::p_ATb
arma::mat p_ATb
right-hand side vector
Definition LeastSquares.h:157

Isis::LeastSquares::Solve
int Solve(Isis::LeastSquares::SolveMethod method=SVD)
After all the data has been registered through AddKnown, invoke this method to solve the system of eq...
Definition LeastSquares.cpp:205

Isis::LeastSquares::SolveQRD
void SolveQRD()
After all the data has been registered through AddKnown, invoke this method to solve the system of eq...
Definition LeastSquares.cpp:339

Isis::LeastSquares::p_epsilonsSparse
std::vector< double > p_epsilonsSparse
sparse vector of total parameter corrections
Definition LeastSquares.h:152

Isis::LeastSquares::SolveSVD
void SolveSVD()
After all the data has been registered through AddKnown, invoke this method to solve the system of eq...
Definition LeastSquares.cpp:236

Isis::LeastSquares::LeastSquares
LeastSquares(Isis::BasisFunction &basis, bool sparse=false, int sparseRows=0, int sparseCols=0, bool jigsaw=false)
Creates a LeastSquares Object.
Definition LeastSquares.cpp:23

Isis::LeastSquares::Residuals
std::vector< double > Residuals() const
Returns a vector of residuals (errors).
Definition LeastSquares.cpp:570

Isis::LeastSquares::FillSparseA
void FillSparseA(const std::vector< double > &data)
Invoke this method for each set of knowns for sparse solutions.
Definition LeastSquares.cpp:137

Isis::LeastSquares::p_sqrtWeight
std::vector< double > p_sqrtWeight
A vector of the square roots of the weights for each known value.
Definition LeastSquares.h:176

Isis::LeastSquares::p_residuals
std::vector< double > p_residuals
A vector of the residuals (or difference between expected and solved values).
Definition LeastSquares.h:179

Isis::LeastSquares::AddKnown
void AddKnown(const std::vector< double > &input, double expected, double weight=1.0)
Invoke this method for each set of knowns.
Definition LeastSquares.cpp:96

Isis::LeastSquares::p_expected
std::vector< double > p_expected
A vector of the expected values when solved.
Definition LeastSquares.h:174

Isis::LeastSquares::GetInput
std::vector< double > GetInput(int row) const
This method returns the data at the given row.
Definition LeastSquares.cpp:158

Isis::LeastSquares::p_degreesOfFreedom
int p_degreesOfFreedom
degrees of freedom (redundancy)
Definition LeastSquares.h:168

Isis
This is free and unencumbered software released into the public domain.
Definition Apollo.h:16

Isis::toString
QString toString(bool boolToConvert)
Global function to convert a boolean to a string.
Definition IString.cpp:211