d3/da6/_c_r_n_statistic_sample_8h_source.html

 /* Copyright 2014-2015 INSA-Lyon

  *

  * This file is part of libcrn.

  *

  * libcrn is free software: you can redistribute it and/or modify

  * it under the terms of the GNU Lesser General Public License as published by

  * the Free Software Foundation, either version 3 of the License, or

  * (at your option) any later version.

  *

  * libcrn is distributed in the hope that it will be useful,

  * but WITHOUT ANY WARRANTY; without even the implied warranty of

  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

  * GNU Lesser General Public License for more details.

  *

  * You should have received a copy of the GNU Lesser General Public License

  * along with libcrn.  If not, see <http://www.gnu.org/licenses/>.

  *

  * file: CRNStatisticSample.h

  * \author Jean DUONG, Yann LEYDIER

  */


 #ifndef CRNSTATISTICSAMPLE_HEADER

 #define CRNSTATISTICSAMPLE_HEADER


 #include <algorithm>
 #include <cmath>
 #include <iterator>
 #include <map>
 #include <numeric>
 #include <tuple>
 #include <vector>

 #include <CRNMath/CRNMath.h>


 namespace crn

 {

     class Histogram;

     class UnivariateGaussianMixture;

     class MultivariateGaussianMixture;


     /****************************************************************************/

     /*! \brief Returns the greatest element of a vector
      *
      * \param[in]	v	the values to scan; must not be empty because the iterator returned by std::max_element is dereferenced unconditionally
      * \return	a copy of the greatest element
      */
     template<typename T> inline T Max(const std::vector<T> &v)
     {
         const auto greatest = std::max_element(v.cbegin(), v.cend());
         return *greatest;
     }

     /*! \brief Returns the greatest element of a vector of vectors
      *
      * \param[in]	m	the rows to scan; m and each of its rows must be non-empty (front() and the row maximum are dereferenced without any check)
      * \return	a copy of the greatest element found over all rows
      */
     template<typename T> inline T Max(const std::vector<std::vector<T>> &m)
     {
         // Seed with the very first element, then compare against each row's own maximum.
         T best = m.front().front();
         for (auto row = m.begin(); row != m.end(); ++row)
         {
             const T candidate = *std::max_element(row->begin(), row->end());
             if (candidate > best)
                 best = candidate;
         }
         return best;
     }

     /*! \brief Returns the smallest element of a vector
      *
      * \param[in]	v	the values to scan; must not be empty because the iterator returned by std::min_element is dereferenced unconditionally
      * \return	a copy of the smallest element
      */
     template<typename T> inline T Min(const std::vector<T> &v)
     {
         const auto smallest = std::min_element(v.cbegin(), v.cend());
         return *smallest;
     }

     /*! \brief Returns the smallest element of a vector of vectors
      *
      * \param[in]	m	the rows to scan; m and each of its rows must be non-empty (front() and the row minimum are dereferenced without any check)
      * \return	a copy of the smallest element found over all rows
      */
     template<typename T> inline T Min(const std::vector<std::vector<T>> &m)
     {
         auto mi = m.front().front();
         for (const auto &row : m)
         {
             // The per-row extremum must be the row *minimum*; taking the row maximum
             // here would return the smallest row maximum instead of the global minimum.
             auto rmin = *std::min_element(row.begin(), row.end());
             if (rmin < mi) mi = rmin;
         }
         return mi;
     }

     /*! \brief Returns the smallest and the greatest elements of a vector
      *
      * \param[in]	v	the values to scan; must not be empty because both iterators returned by std::minmax_element are dereferenced
      * \return	a tuple holding the minimum first and the maximum second
      */
     template<typename T> inline std::tuple<T, T> MinMax(const std::vector<T> &v)
     {
         const auto extremes = std::minmax_element(v.begin(), v.end());
         return std::tuple<T, T>(*extremes.first, *extremes.second);
     }

     /*! \brief Returns the smallest and the greatest elements of a vector of vectors
      *
      * \param[in]	m	the rows to scan; m and each of its rows must be non-empty (front() and the row extrema are dereferenced without any check)
      * \return	a tuple holding the global minimum first and the global maximum second
      */
     template<typename T> inline std::tuple<T, T> MinMax(const std::vector<std::vector<T>> &m)
     {
         // Both bounds start from the first element and are tightened row by row.
         T lowest = m.front().front();
         T highest = m.front().front();
         for (auto row = m.begin(); row != m.end(); ++row)
         {
             const auto bounds = std::minmax_element(row->begin(), row->end());
             if (*bounds.first < lowest)
                 lowest = *bounds.first;
             if (*bounds.second > highest)
                 highest = *bounds.second;
         }
         return std::tuple<T, T>(lowest, highest);
     }

     /*! \brief Returns the index of a maximal element of a vector
      *
      * \param[in]	v	the values to scan
      * \return	the offset from the beginning of v of the iterator returned by std::max_element (0 for an empty vector, since begin and end then coincide)
      */
     template<typename T> inline size_t Argmax(const std::vector<T> &v)
     {
         const auto first = v.begin();
         const auto greatest = std::max_element(first, v.end());
         return size_t(std::distance(first, greatest));
     }

     /*! \brief Returns the index of a minimal element of a vector
      *
      * \param[in]	v	the values to scan
      * \return	the offset from the beginning of v of the iterator returned by std::min_element (0 for an empty vector, since begin and end then coincide)
      */
     template<typename T> inline size_t Argmin(const std::vector<T> &v)
     {
         const auto first = v.begin();
         const auto smallest = std::min_element(first, v.end());
         return size_t(std::distance(first, smallest));
     }

     /*! \brief Returns the index of the row holding a maximal value on a given column
      *
      * \param[in]	m	the rows to scan; must not be empty and every row must have more than col elements (no bounds check is made)
      * \param[in]	col	the index of the column to inspect
      * \return	the index of the first row whose value on column col is maximal
      */
     template<typename T> size_t ColumnArgmax(const std::vector<std::vector<T>> &m, size_t col)
     {
         // The running maximum must start from the inspected column of the first row,
         // not from column 0, otherwise a large m[0][0] hides the real maximum.
         auto ma = m.front()[col];
         auto index = size_t(0);
         for (size_t tmp = 1; tmp < m.size(); ++tmp)
             if (m[tmp][col] > ma)
             {
                 ma = m[tmp][col];
                 index = tmp;
             }
         return index;
     }

     /*! \brief Returns the index of the row holding a minimal value on a given column
      *
      * \param[in]	m	the rows to scan; must not be empty and every row must have more than col elements (no bounds check is made)
      * \param[in]	col	the index of the column to inspect
      * \return	the index of the first row whose value on column col is minimal
      */
     template<typename T> size_t ColumnArgmin(const std::vector<std::vector<T>> &m, size_t col)
     {
         // The running minimum must start from the inspected column of the first row,
         // not from column 0, otherwise a small m[0][0] hides the real minimum.
         auto mi = m.front()[col];
         auto index = size_t(0);
         for (size_t tmp = 1; tmp < m.size(); ++tmp)
             if (m[tmp][col] < mi)
             {
                 mi = m[tmp][col];
                 index = tmp;
             }
         return index;
     }


     /*! \brief Returns the mean value of a sample
      *
      * Declaration only; the definition is not part of this header.
      *
      * \param[in]	v	the sample values
      * \return	the mean value of the sample
      */
     double Mean(const std::vector<double> &v);

     template<typename ITER> typename std::iterator_traits<ITER>::value_type Mean(ITER be, ITER en)

     {

         using value_type = typename std::iterator_traits<ITER>::value_type;

         auto cumul = std::accumulate(be, en, SumType<value_type>(0));

         cumul /= SumType<value_type>(std::distance(be, en));

         return value_type(cumul);

     }

     /*! \brief Returns the mean of a range of values as a double
      *
      * The values are first summed in double precision. If that sum is infinite,
      * the mean is recomputed by dividing each value by the element count before
      * adding it, which keeps the partial sums smaller.
      *
      * \param[in]	be	iterator on the first value
      * \param[in]	en	iterator past the last value
      * \return	the mean of the values (an empty range divides 0.0 by 0.0)
      */
     template<typename ITER> double MeanAsDouble(ITER be, ITER en)
     {
         const auto count = double(std::distance(be, en));
         const auto total = std::accumulate(be, en, 0.0);

         // std::isinf is qualified: the unqualified name is not guaranteed to be
         // declared by <cmath>, and the rest of this header already uses std::isinf.
         if (!std::isinf(total))
             return total / count;

         // The plain sum overflowed: accumulate pre-divided terms instead.
         auto mean = 0.0;
         for (auto it = be; it != en; ++it)
             mean += double(*it) / count;
         return mean;
     }


     /*! \brief Returns the mean pattern of a sample
      *
      * Declaration only; the definition is not part of this header.
      *
      * \param[in]	m	the sample, one pattern per inner vector
      * \return	the mean pattern of the sample
      */
     std::vector<double> MeanPattern(const std::vector<std::vector<double>> &m);


     /*! \brief Returns the weighted mean pattern of a range of (pattern, weight) pairs
      *
      * Each element of the range exposes the pattern as `first` and its weight as
      * `second`. The dimension is taken from the first pattern; patterns with a
      * different size are ignored, both in the sum and in the total weight.
      * If any accumulated component is infinite, the mean is recomputed with each
      * weight divided by the total weight before accumulation.
      *
      * \param[in]	it_begin	iterator on the first (pattern, weight) pair
      * \param[in]	it_end	iterator past the last (pattern, weight) pair
      * \return	the weighted mean pattern, or an empty vector if the range is empty
      */
     template<typename ITER> std::vector<double> MeanPattern(ITER it_begin, ITER it_end)
     {
         // Nothing to average: it_begin must not be dereferenced on an empty range.
         if (it_begin == it_end)
             return std::vector<double>{};

         const auto dimension = it_begin->first.size();
         auto pattern = std::vector<double>(dimension, 0.0);
         auto cardinal = 0.0;

         // First attempt: plain weighted sum, normalised afterwards.
         for (auto it = it_begin; it != it_end; ++it)
         {
             const auto &pat = it->first;
             if (pat.size() != dimension)
                 continue;

             const auto weight = double(it->second);
             for (size_t k = 0; k < dimension; ++k)
                 pattern[k] += weight * pat[k];
             cardinal += weight;
         }

         const bool overflowed = std::any_of(pattern.begin(), pattern.end(),
                 [](double x) { return std::isinf(x); });

         if (!overflowed)
         {
             for (auto &component : pattern)
                 component /= cardinal;
             return pattern;
         }

         // At least one component overflowed: restart with pre-scaled weights.
         std::fill(pattern.begin(), pattern.end(), 0.0);
         for (auto it = it_begin; it != it_end; ++it)
         {
             const auto &pat = it->first;
             if (pat.size() != dimension)
                 continue;

             const auto scale = double(it->second) / cardinal;
             for (size_t k = 0; k < dimension; ++k)
                 pattern[k] += pat[k] * scale;
         }
         return pattern;
     }


     /*! \brief Returns the deviation of a sample
      *
      * Declaration only; the definition is not part of this header.
      *
      * \param[in]	v	the sample values
      * \return	the deviation of the sample
      */
     double StdDeviation(const std::vector<double> &v);

     /*! \brief Returns the variance of a sample
      *
      * Declaration only; the definition is not part of this header.
      *
      * \param[in]	v	the sample values
      * \return	the variance of the sample
      */
     double Variance(const std::vector<double> &v);

     /*! \brief Returns the covariance for a sample
      *
      * Declaration only; the definition is not part of this header.
      *
      * \param[in]	m	the sample, one pattern per inner vector
      * \return	the covariance matrix, as a vector of rows
      */
     std::vector<std::vector<double>> MakeCovariance(const std::vector<std::vector<double>> &m);


     /*! \brief Returns the weighted matrix of component products of a range of (pattern, weight) pairs
      *
      * Each element of the range exposes the pattern as `first` and its weight as
      * `second`. Entry (i, j) is the sum over the range of
      * pattern[i] * pattern[j] * weight, divided by the total weight. Only the
      * upper triangle is computed; the lower one is mirrored.
      *
      * NOTE(review): the products are not centred on the mean pattern, so the
      * result equals a covariance only when the patterns are already centred.
      * Confirm against the non-template overload.
      *
      * \param[in]	it_begin	iterator on the first (pattern, weight) pair
      * \param[in]	it_end	iterator past the last (pattern, weight) pair; every pattern must have at least as many components as the first one (no size check is made)
      * \return	a square symmetric matrix whose side is the size of the first pattern, or an empty matrix if the range is empty
      */
     template<typename ITER> std::vector<std::vector<double>> MakeCovariance(ITER it_begin, ITER it_end)
     {
         // Nothing to process: it_begin must not be dereferenced on an empty range.
         if (it_begin == it_end)
             return std::vector<std::vector<double>>{};

         const auto dim = it_begin->first.size();

         // Total weight of the sample.
         auto card = 0.0;
         for (auto it = it_begin; it != it_end; ++it)
             card += double(it->second);

         auto cov = std::vector<std::vector<double>>(dim, std::vector<double>(dim, 0.0));
         for (size_t i = 0; i < dim; ++i)
             for (auto j = i; j < dim; ++j)
             {
                 auto acc = 0.0;
                 for (auto it = it_begin; it != it_end; ++it)
                     acc += it->first[i] * it->first[j] * double(it->second);
                 acc /= card;

                 // The matrix is symmetric: fill both triangles at once.
                 cov[i][j] = acc;
                 cov[j][i] = acc;
             }

         return cov;
     }


     /*! \brief Returns the mean, variance and standard deviation of a sample
      *
      * Declaration only; the definition is not part of this header.
      *
      * \param[in]	v	the sample values
      * \return	a tuple (presumably in the order mean, variance, standard deviation, as in the template overload below — confirm in the definition)
      */
     std::tuple<double, double, double> MeanVarDev(const std::vector<double> &v);

     /*! \brief Returns the mean, variance and standard deviation of a range of (value, count) pairs
      *
      * Each element of the range exposes the value as `first` and its count as
      * `second`. Values and counts are converted to double before any arithmetic,
      * so that `value * count` is never evaluated in an integer type (overflow) or
      * in a mixed signed/unsigned type.
      *
      * The variance is first obtained as E[x^2] - E[x]^2. When the sums are
      * infinite, the computation falls back to terms divided by the total count,
      * then to the sum of squared deviations from the mean. A variance that rounds
      * to a negative value is clamped to 0 so that its square root is not NaN.
      *
      * \param[in]	it_begin	iterator on the first (value, count) pair
      * \param[in]	it_end	iterator past the last (value, count) pair
      * \return	a tuple (mean, variance, standard deviation); an empty range divides 0.0 by 0.0
      */
     template<typename ITER> std::tuple<double, double, double> MeanVarDev(ITER it_begin, ITER it_end)
     {
         // Weighted sum, weighted sum of squares and total count in a single pass.
         auto m = 0.0;
         auto m_2 = 0.0;
         auto s = 0.0;
         for (auto it = it_begin; it != it_end; ++it)
         {
             const auto val = double(it->first);
             const auto cnt = double(it->second);

             m += val * cnt;
             m_2 += val * val * cnt;
             s += cnt;
         }

         if (!std::isinf(m))
         {
             m /= s;
             m_2 /= s;
         }
         else // Sum too large: recompute with every term divided by the total count.
         {
             m = 0.0;
             m_2 = 0.0;
             for (auto it = it_begin; it != it_end; ++it)
             {
                 const auto val = double(it->first);
                 const auto cnt = double(it->second);

                 m += val * cnt / s;
                 m_2 += val * val * cnt / s;
             }
         }

         auto var = 0.0;
         if (!std::isinf(m_2))
         {
             // Konig-Huygens formula.
             var = m_2 - m * m;
         }
         else // Sum of squares too large: use squared deviations from the mean.
         {
             for (auto it = it_begin; it != it_end; ++it)
             {
                 const auto dev = double(it->first) - m;
                 var += dev * dev * double(it->second);
             }

             if (!std::isinf(var))
                 var /= s;
             else
             {
                 var = 0.0;
                 for (auto it = it_begin; it != it_end; ++it)
                 {
                     const auto dev = double(it->first) - m;
                     var += dev * dev * double(it->second) / s;
                 }
             }
         }

         // Cancellation can leave a tiny negative variance; sqrt of it would be NaN.
         if (var < 0.0)
             var = 0.0;

         return std::make_tuple(m, var, std::sqrt(var));
     }


     /*! \brief Returns quantile values of a sample
      *
      * Declaration only; the definition is not part of this header.
      *
      * \param[in]	v	the sample values
      * \param[in]	q	presumably the number of quantiles requested — confirm in the definition
      * \param[in]	sort_flag	defaults to true; presumably tells whether the sample must be sorted first — confirm in the definition
      * \return	the quantile values
      */
     std::vector<double> Quantiles(const std::vector<double> &v, size_t q, bool sort_flag = true);


     /*! \brief Returns the median value of a vector
      *
      * The value returned is the element that would sit at index size() / 2 if the
      * vector were sorted (the upper of the two middle elements for an even size).
      * The input is left untouched: the selection is done on a copy.
      *
      * \param[in]	v	the values; must not be empty because the selected position is dereferenced unconditionally
      * \return	a copy of the element of rank size() / 2
      */
     template<typename T> T MedianValue(const std::vector<T> &v)
     {
         auto work = v;
         const auto offset = static_cast<typename std::vector<T>::difference_type>(work.size() / 2);
         const auto mid = work.begin() + offset;

         // Only one order statistic is needed, so a partial selection replaces a full sort.
         std::nth_element(work.begin(), mid, work.end());
         return *mid;
     }


     /*! \brief Tests if all the values of a vector are equal
      *
      * \param[in]	v	the values to compare
      * \return	true if every element compares equal (operator==) to the first one, which is also the case for an empty vector; false otherwise
      */
     template<typename T> inline bool AllEqual(const std::vector<T> &v)
     {
         for (const T &elem : v)
         {
             if (!(elem == v.front()))
                 return false;
         }
         return true;
     }

     /*! \brief Tests if all the values of a vector of vectors are equal
      *
      * \param[in]	m	the rows to compare; m and its first row must be non-empty since the reference value is read with front().front()
      * \return	false as soon as one element differs (operator!=) from the very first one, true otherwise
      */
     template<typename T> inline bool AllEqual(const std::vector<std::vector<T>> &m)
     {
         const T reference = m.front().front();
         for (auto row = m.begin(); row != m.end(); ++row)
         {
             for (const T &x : *row)
             {
                 if (x != reference)
                     return false;
             }
         }
         return true;
     }


     /*! \brief Builds a histogram of a sample with a requested number of bins
      *
      * Declaration only; the definition is not part of this header.
      *
      * \param[in]	v	the sample values
      * \param[in]	nb_bins	presumably the number of bins of the histogram — confirm in the definition
      * \return	the histogram
      */
     Histogram MakeHistogram(const std::vector<double> &v, size_t nb_bins);

     /*! \brief Returns count histogram (#bins = sqrt(pop))
      * \param[in]	v	the sample values
      * \return	the histogram
      */
     Histogram MakeHistogramSquareRoot(const std::vector<double> &v);

     /*! \brief Returns count histogram (#bins = 1 + log_2(pop))
      * \param[in]	v	the sample values
      * \return	the histogram
      */
     Histogram MakeHistogramSturges(const std::vector<double> &v);

     /*! \brief Returns count histogram (#bins = 2n^(1/3))
      * \param[in]	v	the sample values
      * \return	the histogram
      */
     Histogram MakeHistogramRice(const std::vector<double> &v);

     /*! \brief Returns count histogram (bin width = 3.5 * stddev / pop^(1/3))
      * \param[in]	v	the sample values
      * \return	the histogram
      */
     Histogram MakeHistogramScott(const std::vector<double> &v);

     /*! \brief Returns count histogram (bin width = 2 * IQR(v) / pop^(1/3))
      * \param[in]	v	the sample values
      * \param[in]	sort_flag	defaults to true; presumably tells whether the sample must be sorted before the quantiles are taken — confirm in the definition
      * \return	the histogram
      */
     Histogram MakeHistogramFreedmanDiaconis(const std::vector<double> &v, bool sort_flag = true);


     /*! \brief Returns a Gaussian mixture model modeling a univariate sample
      *
      * Declaration only; the definition is not part of this header.
      *
      * \param[in]	v	the sample values
      * \param[in]	nb_seeds	defaults to 2; presumably the number of components of the mixture — confirm in the definition
      * \return	the mixture model
      */
     UnivariateGaussianMixture MakeGaussianMixtureModel(const std::vector<double> &v, size_t nb_seeds = 2);

     /*! \brief Multivariate overload of MakeGaussianMixtureModel
      *
      * Declaration only; the definition is not part of this header.
      *
      * \param[in]	patterns	the sample, one pattern per inner vector
      * \param[in]	nb_seeds	defaults to 2; presumably the number of components of the mixture — confirm in the definition
      * \return	the mixture model
      */
     MultivariateGaussianMixture MakeGaussianMixtureModel(const std::vector<std::vector<double>> &patterns, size_t nb_seeds = 2);


 }


 #endif


crn::MedianValue
T MedianValue(const std::vector< T > &v)
Median value.
Definition: CRNStatisticSample.h:340

crn::SumType
typename TypeInfo< T >::SumType SumType
Definition: CRNType.h:185

CRNMath.h

crn::Argmin
size_t Argmin(const std::vector< T > &v)
Return index of a minimal.
Definition: CRNStatisticSample.h:104

crn::ColumnArgmax
size_t ColumnArgmax(const std::vector< std::vector< T >> &m, size_t col)
Return index of a maximal on a column.
Definition: CRNStatisticSample.h:106

crn::Variance
double Variance(const std::vector< double > &v)
Return variance of sample.
Definition: CRNStatisticSample.cpp:104

crn::MeanPattern
std::vector< double > MeanPattern(const std::vector< std::vector< double >> &m)
Return mean pattern of sample.
Definition: CRNStatisticSample.cpp:60

crn::ColumnArgmin
size_t ColumnArgmin(const std::vector< std::vector< T >> &m, size_t col)
Return index of a minimal on a column.
Definition: CRNStatisticSample.h:119

crn::Max
const T & Max(const T &a, const T &b)
Returns the max of two values.
Definition: CRNMath.h:47

crn::MakeHistogramSquareRoot
Histogram MakeHistogramSquareRoot(const std::vector< double > &v)
Returns count histogram (#bins = sqrt(pop) )
Definition: CRNStatisticSample.cpp:275

crn::Quantiles
std::vector< double > Quantiles(const std::vector< double > &v, size_t q, bool sort_flag=true)
Return quantile values of sample.
Definition: CRNStatisticSample.cpp:216

crn::AllEqual
bool AllEqual(const std::vector< T > &v)
Test if all data values are equal.
Definition: CRNStatisticSample.h:348

crn::MakeHistogramSturges
Histogram MakeHistogramSturges(const std::vector< double > &v)
Returns count histogram (#bins = 1+log_2(pop) )
Definition: CRNStatisticSample.cpp:284

crn::MakeCovariance
std::vector< std::vector< double > > MakeCovariance(const std::vector< std::vector< double >> &m)
Return covariance for sample.
Definition: CRNStatisticSample.cpp:129

crn::Argmax
size_t Argmax(const std::vector< T > &v)
Return index of a maximal.
Definition: CRNStatisticSample.h:102

crn::MeanAsDouble
double MeanAsDouble(ITER be, ITER en)
Return mean value of sample as a double value.
Definition: CRNStatisticSample.h:155

crn::Mean
double Mean(const std::vector< double > &v)
Return mean value of sample.
Definition: CRNStatisticSample.cpp:40

crn::Sqr
constexpr SumType< T > Sqr(const T &v) noexcept(noexcept(v *v))
Returns the square of a value.
Definition: CRNMath.h:61

crn::StdDeviation
double StdDeviation(const std::vector< double > &v)
Return deviation of sample.
Definition: CRNStatisticSample.cpp:95

crn::MakeGaussianMixtureModel
UnivariateGaussianMixture MakeGaussianMixtureModel(const std::vector< double > &v, size_t nb_seeds=2)
Return Gaussian mixture model modeling current (univariate) sample.
Definition: CRNStatisticSample.cpp:326

crn::Min
const T & Min(const T &a, const T &b)
Returns the min of two values.
Definition: CRNMath.h:49

crn::MinMax
std::pair< T, T > MinMax(const Image< T > &img, CMP cmp=CMP{})
Returns min and max pixel values.
Definition: CRNImage.hpp:1447

crn::MakeHistogramScott
Histogram MakeHistogramScott(const std::vector< double > &v)
Returns count histogram (bin width = 3.5 * stddev / pop^(1/3))
Definition: CRNStatisticSample.cpp:302

crn::MakeHistogramRice
Histogram MakeHistogramRice(const std::vector< double > &v)
Returns count histogram (#bins = 2n^(1/3) )
Definition: CRNStatisticSample.cpp:293

crn::MakeHistogramFreedmanDiaconis
Histogram MakeHistogramFreedmanDiaconis(const std::vector< double > &v, bool sort_flag=true)
Returns count histogram (bin width = 2 * IQR(v) / pop^(1/3))
Definition: CRNStatisticSample.cpp:313

crn::MeanVarDev
std::tuple< double, double, double > MeanVarDev(const std::vector< double > &v)
Return mean, variance and standard deviation of sample.
Definition: CRNStatisticSample.cpp:152

crn::MakeHistogram
Histogram MakeHistogram(const Image< T > &img, typename std::enable_if< std::is_arithmetic< T >::value >::type *dummy=nullptr)
Definition: CRNImageGray.h:64