LevenbergMarquardtMDMinimizer.cpp
// Mantid Repository : https://github.com/mantidproject/mantid
//
// Copyright © 2018 ISIS Rutherford Appleton Laboratory UKRI,
//   NScD Oak Ridge National Laboratory, European Spallation Source,
//   Institut Laue - Langevin & CSNS, Institute of High Energy Physics, CAS
// SPDX - License - Identifier: GPL - 3.0 +
//----------------------------------------------------------------------
// Includes
//----------------------------------------------------------------------
#include "MantidCurveFitting/FuncMinimizers/LevenbergMarquardtMDMinimizer.h"
#include "MantidCurveFitting/CostFunctions/CostFuncFitting.h"
#include "MantidCurveFitting/EigenMatrix.h"
#include "MantidCurveFitting/EigenVector.h"

#include "MantidAPI/FuncMinimizerFactory.h"
#include "MantidAPI/IFunction.h"

#include "MantidKernel/Logger.h"

#include <cmath>

namespace Mantid::CurveFitting::FuncMinimisers {
namespace {
/// static logger object
Kernel::Logger g_log("LevenbergMarquardMD");
} // namespace

// clang-format off
DECLARE_FUNCMINIMIZER(LevenbergMarquardtMDMinimizer, Levenberg-MarquardtMD)
// clang-format on
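// The macro above registers this class with the FuncMinimizerFactory; the second
// argument, Levenberg-MarquardtMD, is the name under which users select the minimizer.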

/// Constructor
LevenbergMarquardtMDMinimizer::LevenbergMarquardtMDMinimizer()
    : IFuncMinimizer(), m_tau(1e-6), m_mu(1e-6), m_nu(2.0), m_rho(1.0), m_F(0.0) {
  declareProperty("MuMax", 1e6, "Maximum value of mu - a stopping parameter in failure.");
  declareProperty("AbsError", 0.0001,
                  "Absolute error allowed for parameters - "
                  "a stopping parameter in success.");
  declareProperty("Verbose", false, "Make output more verbose.");
}

/// Initialize minimizer, i.e. pass a function to minimize.
void LevenbergMarquardtMDMinimizer::initialize(API::ICostFunction_sptr function, size_t /*maxIterations*/) {
  m_costFunction = std::dynamic_pointer_cast<CostFunctions::CostFuncFitting>(function);
  if (!m_costFunction) {
    throw std::invalid_argument("Levenberg-Marquardt minimizer works only with "
                                "functions which define the Hessian. Different function was given.");
  }
  m_mu = 0;
  m_nu = 2.0;
  m_rho = 1.0;
}

/// Do one iteration.
bool LevenbergMarquardtMDMinimizer::iterate(size_t /*iteration*/) {
  const bool verbose = getProperty("Verbose");
  const double muMax = getProperty("MuMax");
  const double absError = getProperty("AbsError");

  if (!m_costFunction) {
    throw std::runtime_error("Cost function isn't set up.");
  }
  size_t n = m_costFunction->nParams();

  if (n == 0) {
    m_errorString = "No parameters to fit.";
    return false;
  }

  if (m_mu > muMax) {
    m_errorString = "Failed to converge, maximum mu reached.";
    return false;
  }

  // calculate the first and second derivatives of the cost function.
  if (m_mu == 0.0 || m_rho > 0) {
    // calculate everything first time or
    // if last iteration was good
    m_F = m_costFunction->valDerivHessian();
  }
  // else if m_rho < 0 last iteration was bad: reuse m_der and m_hessian

  // Calculate damping to hessian
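  // m_tau only seeds the very first damping value; afterwards m_mu is adapted from the
  // gain ratio m_rho computed at the end of each iteration.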
  if (m_mu == 0) // first iteration or accidental zero
  {
    m_mu = m_tau;
    m_nu = 2.0;
  }

  if (verbose) {
    g_log.warning() << "===========================================================\n";
    g_log.warning() << "mu=" << m_mu << "\n\n";
  }

  if (m_D.empty()) {
    m_D.resize(n);
  }

  // copy the hessian
  EigenMatrix H(m_costFunction->getHessian());
  EigenVector dd(m_costFunction->getDeriv());

  // scaling factors
  std::vector<double> sf(n);

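  // Damp the Hessian diagonal: each H(i,i) gets m_mu * m_D[i] added, where m_D[i] tracks the
  // largest |derivative| seen so far for parameter i; sf[i], the square root of the damped
  // diagonal element, is used below to rescale the linear system.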
  for (size_t i = 0; i < n; ++i) {
    double d = fabs(dd.get(i));
    if (m_D[i] > d)
      d = m_D[i];
    m_D[i] = d;
    double tmp = H.get(i, i) + m_mu * d;
    H.set(i, i, tmp);
    sf[i] = sqrt(tmp);
    if (tmp == 0.0) {
      m_errorString = "Function doesn't depend on parameter " + m_costFunction->parameterName(i);
      return false;
    }
  }

  // apply scaling
  for (size_t i = 0; i < n; ++i) {
    double d = dd.get(i);
    dd.set(i, d / sf[i]);
    for (size_t j = i; j < n; ++j) {
      const double f = sf[i] * sf[j];
      double tmp = H.get(i, j);
      H.set(i, j, tmp / f);
      if (i != j) {
        tmp = H.get(j, i);
        H.set(j, i, tmp / f);
      }
    }
  }
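  // After this scaling the damped Hessian has ones on its diagonal
  // (H(i,j) -> H(i,j) / (sf[i] * sf[j])), which improves the conditioning of the solve below.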

  if (verbose && m_rho > 0) {
    g_log.warning() << "Hessian:\n" << H;
    g_log.warning() << "Right-hand side:\n";
    for (size_t j = 0; j < n; ++j) {
      g_log.warning() << dd.get(j) << ' ';
    }
    g_log.warning() << '\n';
    g_log.warning() << "Determinant=" << H.det() << '\n';
  }

  // Parameter corrections
  EigenVector dx(n);
  // To find dx solve the system of linear equations   H * dx == -m_der
  dd *= -1.0;
  try {
    H.solve(dd, dx);
  } catch (std::runtime_error &error) {
    m_errorString = error.what();
    return false;
  }

  if (verbose) {
    g_log.warning() << "\nScaling factors:\n";
    for (size_t j = 0; j < n; ++j) {
      g_log.warning() << sf[j] << ' ';
    }
    g_log.warning() << '\n';
    g_log.warning() << "Corrections:\n";
    for (size_t j = 0; j < n; ++j) {
      g_log.warning() << dx.get(j) << ' ';
    }
    g_log.warning() << "\n\n";
  }

  // restore scaling
  for (size_t i = 0; i < n; ++i) {
    double d = dx.get(i);
    dx.set(i, d / sf[i]);
    d = dd.get(i);
    dd.set(i, d * sf[i]);
  }
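  // dx now holds the corrections in the original (unscaled) parameter space,
  // and dd is back to the unscaled negative gradient.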

  // save previous state
  m_costFunction->push();
  // Update the parameters of the cost function.
  EigenVector parameters(n);
  m_costFunction->getParameters(parameters);
  parameters += dx;
  m_costFunction->setParameters(parameters);
  if (verbose) {
    for (size_t i = 0; i < n; ++i) {
      g_log.warning() << "Parameter(" << i << ")=" << parameters[i] << '\n';
    }
  }
  m_costFunction->getFittingFunction()->applyTies();

  // --- prepare for the next iteration --- //

  double dL;
  // der -> - der - 0.5 * hessian * dx

  EigenVector Trdx = m_costFunction->getHessian().tr() * dx;
  Trdx *= -0.5;
  dd += Trdx;
  // calculate the linear part of the change in cost function
  dL = dd.dot(dx);
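  // dL is the decrease predicted by the local quadratic model; it is used below
  // as the denominator of the gain ratio m_rho = (m_F - F1) / dL.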

  double F1 = m_costFunction->val();
  if (verbose) {
    g_log.warning() << '\n';
    g_log.warning() << "Old cost function " << m_F << '\n';
    g_log.warning() << "New cost function " << F1 << '\n';
    g_log.warning() << "Linear part " << dL << '\n';
  }

  // Try the stop condition
  if (m_rho >= 0) {
    EigenVector p(n);
    m_costFunction->getParameters(p);
    double dx_norm = dx.norm();
    if (dx_norm < absError) {
      if (verbose) {
        g_log.warning() << "Successful fit, parameters changed by less than " << absError << '\n';
      }
      return false;
    }
    if (m_rho == 0) {
      if (m_F != F1) {
        this->m_errorString = "Failed to converge, rho == 0";
      }
      if (verbose) {
        g_log.warning() << "Successful fit, cost function didn't change.\n";
      }
      return false;
    }
  }

  if (fabs(dL) == 0.0) {
    if (m_F == F1)
      m_rho = 1.0;
    else
      m_rho = 0;
  } else {
    m_rho = (m_F - F1) / dL;
    if (m_rho == 0) {
      return false;
    }
  }
  if (verbose) {
    g_log.warning() << "rho=" << m_rho << '\n';
  }

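  // Damping update: a good step (m_rho > 0) shrinks m_mu, multiplying it by a factor capped
  // at 1/3, and resets m_nu; a bad step multiplies m_mu by m_nu, doubles m_nu and reverts
  // the parameters to the saved state.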
  if (m_rho > 0) { // good progress, decrease m_mu but no more than by 1/3
    // rho = 1 - (2*rho - 1)^3
    m_rho = 2.0 * m_rho - 1.0;
    m_rho = 1.0 - m_rho * m_rho * m_rho;
    const double I3 = 1.0 / 3.0;
    if (m_rho > I3)
      m_rho = I3;
    if (m_rho < 0.0001)
      m_rho = 0.1;
    m_mu *= m_rho;
    m_nu = 2.0;
    m_F = F1;
    if (verbose) {
      g_log.warning() << "Good iteration, accept new parameters.\n";
      g_log.warning() << "rho=" << m_rho << '\n';
    }
    // drop saved state, accept new parameters
    m_costFunction->drop();
  } else { // bad iteration. increase m_mu and revert changes to parameters
    m_mu *= m_nu;
    m_nu *= 2.0;
    // undo parameter update
    m_costFunction->pop();
    m_F = m_costFunction->val();
    if (verbose) {
      g_log.warning() << "Bad iteration, increase mu and revert changes to parameters.\n";
    }
  }

  return true;
}

/// Return current value of the cost function.
double LevenbergMarquardtMDMinimizer::costFunctionVal() {
  if (!m_costFunction) {
    throw std::runtime_error("Cost function isn't set up.");
  }
  return m_costFunction->val();
}

} // namespace Mantid::CurveFitting::FuncMinimisers