2.7.0/html/GumbelMaxLikelihoodFitter_8h_source.html

 // --------------------------------------------------------------------------

 //                   OpenMS -- Open-Source Mass Spectrometry

 // --------------------------------------------------------------------------

 // Copyright The OpenMS Team -- Eberhard Karls University Tuebingen,

 // ETH Zurich, and Freie Universitaet Berlin 2002-2021.

 //

 // This software is released under a three-clause BSD license:

 //  * Redistributions of source code must retain the above copyright

 //    notice, this list of conditions and the following disclaimer.

 //  * Redistributions in binary form must reproduce the above copyright

 //    notice, this list of conditions and the following disclaimer in the

 //    documentation and/or other materials provided with the distribution.

 //  * Neither the name of any author or any participating institution

 //    may be used to endorse or promote products derived from this software

 //    without specific prior written permission.

 // For a full list of authors, refer to the file AUTHORS.

 // --------------------------------------------------------------------------

 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"

 // AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE

 // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE

 // ARE DISCLAIMED. IN NO EVENT SHALL ANY OF THE AUTHORS OR THE CONTRIBUTING

 // INSTITUTIONS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,

 // EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,

 // PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;

 // OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,

 // WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR

 // OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF

 // ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

 //

 // --------------------------------------------------------------------------

 // $Maintainer: Julianus Pfeuffer $

 // $Authors: Julianus Pfeuffer $

 // --------------------------------------------------------------------------

 //

 #pragma once


 #include <OpenMS/DATASTRUCTURES/String.h>
 #include <OpenMS/DATASTRUCTURES/DPosition.h>

 #include <unsupported/Eigen/NonLinearOptimization>

 #include <cmath>
 #include <vector>

 #ifdef GUMBEL_DISTRIBUTION_FITTER_VERBOSE
 #include <iostream>
 #include <sstream>
 #endif


 namespace OpenMS

 {

   namespace Math

   {

     class OPENMS_DLLAPI GumbelMaxLikelihoodFitter

     {


 public:


       /// Parameter pair (location a, scale b) describing a Gumbel distribution.
       struct GumbelDistributionFitResult
       {
         /// Builds a parameter set from location @p local_a and scale @p local_b.
         GumbelDistributionFitResult(double local_a, double local_b)
           : a{local_a}, b{local_b}
         {}

         /// Location parameter a.
         double a;
         /// Scale parameter b.
         double b;

         /// Only declared in this header. NOTE(review): judging by the name this presumably
         /// evaluates the log-density at @p x without the normalization term -- confirm
         /// against the out-of-line definition.
         double log_eval_no_normalize(double x) const;
       };


       /// Default constructor (only declared in this header).
       GumbelMaxLikelihoodFitter();

       /// Constructs a fitter from the parameter set @p init.
       /// NOTE(review): presumably @p init becomes the start parameters of the fit -- the definition is not visible here, confirm.
       GumbelMaxLikelihoodFitter(GumbelDistributionFitResult init);

       /// Destructor (virtual).
       virtual ~GumbelMaxLikelihoodFitter();


       /// Sets the Gumbel distribution start parameters a and b for the fitting.
       void setInitialParameters(const GumbelDistributionFitResult & result);


       /**
         @brief Generic functor base exposing the scalar type, the matrix types and the
                input/value dimensions of an objective function.

         NX and NY fix the number of inputs and values at compile time; with the default
         Eigen::Dynamic the counts passed to the two-argument constructor are used at run time.
       */
       template<typename ScalarT, int NX = Eigen::Dynamic, int NY = Eigen::Dynamic>
       struct Functor
       {
         using Scalar = ScalarT;

         enum
         {
           InputsAtCompileTime = NX,
           ValuesAtCompileTime = NY
         };

         using InputType = Eigen::Matrix<Scalar, InputsAtCompileTime, 1>;
         using ValueType = Eigen::Matrix<Scalar, ValuesAtCompileTime, 1>;
         using JacobianType = Eigen::Matrix<Scalar, ValuesAtCompileTime, InputsAtCompileTime>;

         /// Number of inputs reported by inputs().
         int m_inputs;
         /// Number of values reported by values().
         int m_values;

         /// Takes both counts from the compile-time template arguments.
         Functor() :
           m_inputs(InputsAtCompileTime),
           m_values(ValuesAtCompileTime)
         {
         }

         /// Takes both counts from the given run-time arguments.
         Functor(int inputs, int values) :
           m_inputs(inputs),
           m_values(values)
         {
         }

         int inputs() const
         {
           return m_inputs;
         }

         int values() const
         {
           return m_values;
         }
       };


       /**
         @brief Objective function for the fit: the negated weighted Gumbel log-likelihood
                of the referenced data.

         x(0) is the location; the absolute value of x(1) is used as the scale.
         The functor is declared with 2 inputs and 2 values, but only fvec(0) carries the
         objective -- fvec(1) is always set to 0.
         Only references to the data and weights are stored, so both vectors must outlive
         the functor.
       */
       struct GumbelDistributionFunctor : Functor<double>
       {
         GumbelDistributionFunctor(const std::vector<double>& data, const std::vector<double>& weights) :
           Functor<double>(2, 2),
           m_data(data),
           m_weights(weights)
         {
         }

         /// Evaluates the objective at @p x and stores it in @p fvec; always returns 0.
         int operator()(const Eigen::VectorXd &x, Eigen::VectorXd &fvec) const
         {
           const double sigma = fabs(x(1));
           const double logsigma = log(sigma);

           // Weighted log-likelihood. The weights are consumed in lock-step with the data,
           // so m_weights has to provide at least as many entries as m_data.
           double log_likelihood = 0.0;
           auto weight_it = m_weights.cbegin();
           for (const double value : m_data)
           {
             const double diff = (value - x(0)) / sigma;
             log_likelihood += *weight_it * (-logsigma - diff - exp(-diff));
             ++weight_it;
           }

           // The sign is flipped so that minimizing fvec(0) maximizes the likelihood.
           fvec(0) = -log_likelihood;
           fvec(1) = 0.0;
           return 0;
         }

         const std::vector<double>& m_data;
         const std::vector<double>& m_weights;
       };


       /**
         @brief Fits a Gumbel distribution to the data points @p x with per-point weights @p w.

         Minimizes the negated weighted log-likelihood (GumbelDistributionFunctor) with Eigen's
         Levenberg-Marquardt implementation and a numerically differentiated Jacobian, starting
         from init_param_. On success init_param_ is overwritten with the fitted parameters.

         @param x Data points.
         @param w Weights, w[i] belonging to x[i]. Must hold at least x.size() entries;
                  surplus entries are ignored.
         @return Fitted location a and scale b (b is returned as an absolute value).
         @throws Exception::UnableToFit if @p w has fewer entries than @p x, or if the optimizer
                 ends in one of the states NotStarted, Running or ImproperInputParameters.
       */
       GumbelDistributionFitResult fitWeighted(const std::vector<double> & x, const std::vector<double> & w)
       {
         // The functor walks the weights in lock-step with the data; with fewer weights than
         // data points it would read past the end of w.
         if (w.size() < x.size())
         {
           throw Exception::UnableToFit(__FILE__, __LINE__, OPENMS_PRETTY_FUNCTION, "UnableToFit-GumbelMaxLikelihoodFitter", "Could not fit the gumbel distribution to the data: fewer weights than data points");
         }

         // start the optimization from the currently stored parameters
         Eigen::VectorXd x_init(2);
         x_init(0) = init_param_.a;
         x_init(1) = init_param_.b;

         GumbelDistributionFunctor functor(x, w);
         Eigen::NumericalDiff<GumbelDistributionFunctor> numDiff(functor);
         Eigen::LevenbergMarquardt<Eigen::NumericalDiff<GumbelDistributionFunctor>, double> lm(numDiff);
         const Eigen::LevenbergMarquardtSpace::Status status = lm.minimize(x_init);

         //the states are poorly documented. after checking the source, we believe that
         //all states except NotStarted, Running and ImproperInputParameters are good
         //termination states.
         if (status <= Eigen::LevenbergMarquardtSpace::Status::ImproperInputParameters)
         {
           throw Exception::UnableToFit(__FILE__, __LINE__, OPENMS_PRETTY_FUNCTION, "UnableToFit-GumbelMaxLikelihoodFitter", "Could not fit the gumbel distribution to the data");
         }

         // The objective only ever uses |x(1)| as the scale, so the optimizer may stop at a
         // negative value; take the absolute value once and use it everywhere below.
         const double fitted_a = x_init(0);
         const double fitted_b = std::fabs(x_init(1));

         #ifdef GUMBEL_DISTRIBUTION_FITTER_VERBOSE
         // build a formula with the fitted parameters for gnuplot
         std::stringstream formula;
         formula << "f(x)=" << "(1/" << fitted_b << ") * " << "exp(( " << fitted_a << "- x)/" << fitted_b << ") * exp(-exp((" << fitted_a << " - x)/" << fitted_b << "))";
         std::cout << formula.str() << std::endl;
         #endif

         // remember the result so that it serves as the starting point of the next fit
         init_param_.a = fitted_a;
         init_param_.b = fitted_b;

         return {fitted_a, fitted_b};
       }


 protected:


       /// Start parameters of the optimization in fitWeighted(), which also overwrites them with the fitted values.
       GumbelDistributionFitResult init_param_;


 private:

       /// Copy constructor (private, not implemented).
       GumbelMaxLikelihoodFitter(const GumbelMaxLikelihoodFitter & rhs);

       /// Assignment operator (private, not implemented).
       GumbelMaxLikelihoodFitter & operator=(const GumbelMaxLikelihoodFitter & rhs);

     };

   }

 }


DPosition.h

String.h

OpenMS::Exception::UnableToFit
Exception used if an error occurred while fitting a model to a given dataset.
Definition: Exception.h:684

OpenMS::Math::GumbelMaxLikelihoodFitter
Implements a fitter for the Gumbel distribution.
Definition: GumbelMaxLikelihoodFitter.h:60

OpenMS::Math::GumbelMaxLikelihoodFitter::~GumbelMaxLikelihoodFitter
virtual ~GumbelMaxLikelihoodFitter()
Destructor.

OpenMS::Math::GumbelMaxLikelihoodFitter::operator=
GumbelMaxLikelihoodFitter & operator=(const GumbelMaxLikelihoodFitter &rhs)
assignment operator (not implemented)

OpenMS::Math::GumbelMaxLikelihoodFitter::GumbelMaxLikelihoodFitter
GumbelMaxLikelihoodFitter(const GumbelMaxLikelihoodFitter &rhs)
Copy constructor (not implemented)

OpenMS::Math::GumbelMaxLikelihoodFitter::fitWeighted
GumbelDistributionFitResult fitWeighted(const std::vector< double > &x, const std::vector< double > &w)
Fits a gumbel distribution to the given data x values. Fills a weighted histogram first and generates...
Definition: GumbelMaxLikelihoodFitter.h:152

OpenMS::Math::GumbelMaxLikelihoodFitter::init_param_
GumbelDistributionFitResult init_param_
Definition: GumbelMaxLikelihoodFitter.h:185

OpenMS::Math::GumbelMaxLikelihoodFitter::GumbelMaxLikelihoodFitter
GumbelMaxLikelihoodFitter(GumbelDistributionFitResult init)
Constructor taking an initial set of Gumbel distribution parameters.

OpenMS::Math::GumbelMaxLikelihoodFitter::GumbelMaxLikelihoodFitter
GumbelMaxLikelihoodFitter()
Default constructor.

OpenMS::Math::GumbelMaxLikelihoodFitter::setInitialParameters
void setInitialParameters(const GumbelDistributionFitResult &result)
Sets the Gumbel distribution start parameters a and b for the fitting.

OpenMS
Main OpenMS namespace.
Definition: FeatureDeconvolution.h:47

OpenMS::Math::GumbelMaxLikelihoodFitter::Functor
Definition: GumbelMaxLikelihoodFitter.h:94

OpenMS::Math::GumbelMaxLikelihoodFitter::Functor::Functor
Functor()
Definition: GumbelMaxLikelihoodFitter.h:106

OpenMS::Math::GumbelMaxLikelihoodFitter::Functor::InputType
Eigen::Matrix< Scalar, InputsAtCompileTime, 1 > InputType
Definition: GumbelMaxLikelihoodFitter.h:100

OpenMS::Math::GumbelMaxLikelihoodFitter::Functor::values
int values() const
Definition: GumbelMaxLikelihoodFitter.h:110

OpenMS::Math::GumbelMaxLikelihoodFitter::Functor::JacobianType
Eigen::Matrix< Scalar, ValuesAtCompileTime, InputsAtCompileTime > JacobianType
Definition: GumbelMaxLikelihoodFitter.h:102

OpenMS::Math::GumbelMaxLikelihoodFitter::Functor::ValueType
Eigen::Matrix< Scalar, ValuesAtCompileTime, 1 > ValueType
Definition: GumbelMaxLikelihoodFitter.h:101

OpenMS::Math::GumbelMaxLikelihoodFitter::Functor::m_inputs
int m_inputs
Definition: GumbelMaxLikelihoodFitter.h:104

OpenMS::Math::GumbelMaxLikelihoodFitter::Functor::Scalar
_Scalar Scalar
Definition: GumbelMaxLikelihoodFitter.h:95

OpenMS::Math::GumbelMaxLikelihoodFitter::Functor::Functor
Functor(int inputs, int values)
Definition: GumbelMaxLikelihoodFitter.h:107

OpenMS::Math::GumbelMaxLikelihoodFitter::Functor::inputs
int inputs() const
Definition: GumbelMaxLikelihoodFitter.h:109

OpenMS::Math::GumbelMaxLikelihoodFitter::GumbelDistributionFitResult
struct to represent the parameters of a gumbel distribution
Definition: GumbelMaxLikelihoodFitter.h:66

OpenMS::Math::GumbelMaxLikelihoodFitter::GumbelDistributionFitResult::a
double a
location parameter a
Definition: GumbelMaxLikelihoodFitter.h:74

OpenMS::Math::GumbelMaxLikelihoodFitter::GumbelDistributionFitResult::b
double b
scale parameter b
Definition: GumbelMaxLikelihoodFitter.h:76

OpenMS::Math::GumbelMaxLikelihoodFitter::GumbelDistributionFitResult::log_eval_no_normalize
double log_eval_no_normalize(double x) const

OpenMS::Math::GumbelMaxLikelihoodFitter::GumbelDistributionFitResult::GumbelDistributionFitResult
GumbelDistributionFitResult(double local_a, double local_b)
Definition: GumbelMaxLikelihoodFitter.h:67

OpenMS::Math::GumbelMaxLikelihoodFitter::GumbelDistributionFunctor
Definition: GumbelMaxLikelihoodFitter.h:115

OpenMS::Math::GumbelMaxLikelihoodFitter::GumbelDistributionFunctor::GumbelDistributionFunctor
GumbelDistributionFunctor(const std::vector< double > &data, const std::vector< double > &weights)
Definition: GumbelMaxLikelihoodFitter.h:117

OpenMS::Math::GumbelMaxLikelihoodFitter::GumbelDistributionFunctor::operator()
int operator()(const Eigen::VectorXd &x, Eigen::VectorXd &fvec) const
Definition: GumbelMaxLikelihoodFitter.h:123

OpenMS::Math::GumbelMaxLikelihoodFitter::GumbelDistributionFunctor::m_data
const std::vector< double > & m_data
Definition: GumbelMaxLikelihoodFitter.h:139

OpenMS::Math::GumbelMaxLikelihoodFitter::GumbelDistributionFunctor::m_weights
const std::vector< double > & m_weights
Definition: GumbelMaxLikelihoodFitter.h:140