// -*- mode: c++; c-indent-level: 4; c++-member-init-indent: 8; comment-column: 35; -*- //----------------------------------------------------------------------------- // eoStat.h // (c) Marc Schoenauer, Maarten Keijzer and GeNeura Team, 2000 // (c) 2010 Thales group /* This library is free software; you can redistribute it and/or modify it under the terms of the GNU Lesser General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. This library is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public License for more details. You should have received a copy of the GNU Lesser General Public License along with this library; if not, write to the Free Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA Contact: http://eodev.sourceforge.net Authors: todos@geneura.ugr.es, http://geneura.ugr.es Marc.Schoenauer@polytechnique.fr mkeijzer@dhi.dk Johann Dréo */ //----------------------------------------------------------------------------- #ifndef _eoStat_h #define _eoStat_h #include #include // accumulate #include "../eoFunctor.h" #include "eoParam.h" #include "../eoPop.h" #include "eoMonitor.h" //#include "eoCheckPoint.h" #include "eoLogger.h" /** @defgroup Stats Statistics computation * * Compute various statistics on a population. * * Objects of those classes are generally called by an eoCheckPoint * to compute statistics about the population at a given generation. * As they inherit from eoValueParam, they can be printed drectly, * for instance by an eoMonitor. * * @see eoCheckPoint * @see eoMonitor * * @ingroup Utilities * @{ */ /** Base class for all statistics that need to be calculated over the (unsorted) population (I guess it is not really necessary? MS. Depstd::ends, there might be reasons to have a stat that is not an eoValueParam, but maybe I'm just kidding myself, MK) */ template class eoStatBase : public eoUF&, void> { public: virtual void lastCall(const eoPop&) {} virtual std::string className(void) const { return "eoStatBase"; } }; template class eoCheckPoint; /** The actual class that will be used as base for all statistics that need to be calculated over the (unsorted) population It is an eoStatBase AND an eoValueParam so it can be used in Monitors. */ template class eoStat : public eoValueParam, public eoStatBase { public: typedef EOT EOType; eoStat(T _value, std::string _description) : eoValueParam(_value, _description) {} virtual std::string className(void) const { return "eoStat"; } eoStat& addTo(eoCheckPoint& cp) { cp.add(*this); return *this; } eoStat& addTo(eoMonitor& mon) { mon.add(*this); return *this; } }; /** Base class for statistics calculated over a sorted snapshot of the population */ template class eoSortedStatBase : public eoUF&, void> { public: virtual void lastCall(const std::vector&) {} virtual std::string className(void) const { return "eoSortedStatBase"; } }; /** The actual class that will be used as base for all statistics that need to be calculated over the sorted population It's an eoSortedStatBase AND an eoValueParam so it can be used in Monitors. */ template class eoSortedStat : public eoSortedStatBase, public eoValueParam { public : typedef EOT EOType; eoSortedStat(ParamType _value, std::string _desc) : eoValueParam(_value, _desc) {} virtual std::string className(void) const { return "eoSortedStat"; } eoSortedStat& addTo(eoCheckPoint& cp) { cp.add(*this); return *this; } eoSortedStat& addTo(eoMonitor& mon) { mon.add(*this); return *this; } }; /** Average fitness of a population. Fitness can be: - double - eoMinimizingFitness or eoMaximizingFitness The average of each objective is evaluated. ( For eoScalarFitnessAssembled user eoAssembledFitnessStat classes.) */ #if defined(_MSC_VER) && (_MSC_VER < 1300) template class eoAverageStat : public eoStat #else template class eoAverageStat : public eoStat #endif { public : using eoStat::value; typedef typename EOT::Fitness Fitness; eoAverageStat(std::string _description = "Average Fitness") : eoStat(Fitness(), _description) {} static Fitness sumFitness(double _sum, const EOT& _eot){ _sum += _eot.fitness(); return _sum; } eoAverageStat(double _value, std::string _desc) : eoStat(_value, _desc) {} virtual void operator()(const eoPop& _pop){ doit(_pop, Fitness()); // specializations for scalar and std::vector } virtual std::string className(void) const { return "eoAverageStat"; } private : // Default behavior template void doit(const eoPop& _pop, T) { Fitness v = std::accumulate(_pop.begin(), _pop.end(), Fitness(0.0), eoAverageStat::sumFitness); value() = v / _pop.size(); } }; /** Average fitness + Std. dev. of a population, fitness HAVE TO BE to be scalar. */ template // FIXME find a way to use generic Fitness types instead of scala fitness here : // class eoSecondMomentStats : public eoStat > // Here, I failed to find a way to overload eoValueParam::getValue and setValue, // because there is no way to use the partial specializations located in eoParam.h // Indeed, eoValueParam is templatized on a ValueType, but the getValue signature does not // contain this type. // Thus, in order to use partial specializations the user would have to specify getValue(), // which is not the case in most of the existing code. // Overloading getValue in this class does not seems to work, the call falls to eoValueParam::getValue // and fails on the output stream. class eoSecondMomentStats : public eoStat > { public : // typedef typename EOT::Fitness FitT; typedef double FitT; using eoStat >::value; typedef std::pair SquarePair; eoSecondMomentStats(std::string _description = "Average & Stdev") : eoStat(std::make_pair(0.0,0.0), _description) {} static SquarePair sumOfSquares(SquarePair _sq, const EOT& _eo) { FitT fitness = _eo.fitness(); _sq.first += fitness; _sq.second += fitness * fitness; return _sq; } virtual void operator()(const eoPop& _pop) { SquarePair result = std::accumulate(_pop.begin(), _pop.end(), std::make_pair(0.0, 0.0), eoSecondMomentStats::sumOfSquares); double n = _pop.size(); value().first = result.first / n; // average value().second = sqrt( (result.second - n * value().first * value().first) / (n - 1.0)); // stdev } virtual std::string className(void) const { return "eoSecondMomentStats"; } }; /** The n_th element fitness in the population (see eoBestFitnessStat) */ #if defined(_MSC_VER) && (_MSC_VER < 1300) template class eoNthElementFitnessStat : public eoSortedStat #else template class eoNthElementFitnessStat : public eoSortedStat #endif { public : using eoSortedStat::value; typedef typename EOT::Fitness Fitness; eoNthElementFitnessStat(unsigned _whichElement, std::string _description = "nth element fitness") : eoSortedStat(Fitness(), _description), whichElement(_whichElement) {} virtual void operator()(const std::vector& _pop) { if (whichElement > _pop.size()) throw eoException("fitness requested of element outside of pop"); doit(_pop, Fitness()); } virtual std::string className(void) const { return "eoNthElementFitnessStat"; } private : /* Very old code... struct CmpFitness { CmpFitness(unsigned _whichElement, bool _maxim) : whichElement(_whichElement), maxim(_maxim) {} bool operator()(const EOT* a, const EOT* b) { if (maxim) return a->fitness()[whichElement] > b->fitness()[whichElement]; return a->fitness()[whichElement] < b->fitness()[whichElement]; } unsigned whichElement; bool maxim; }; */ // for everything else template void doit(const std::vector& _pop, T) { value() = _pop[whichElement]->fitness(); } unsigned whichElement; }; /* Actually, you shouldn't need to sort the population to get the best fitness MS - 17/11/00 But then again, if another stat needs sorted fitness anyway, getting the best out would be very fast. MK - 09/01/03 template class eoBestFitnessStat : public eoStat { public : typedef typename EOT::Fitness Fitness; eoBestFitnessStat(std::string _description = "Best Fitness") : eoStat(Fitness(), _description) {} virtual void operator()(const eoPop& _pop) { value() = _pop.nth_element_fitness(0); } }; */ /** Best fitness of a population. Fitness can be: - double - eoMinimizingFitness or eoMaximizingFitness ( For eoScalarFitnessAssembled look at eoAssembledFitnessStat ) */ #if defined(_MSC_VER) && (_MSC_VER < 1300) template class eoBestFitnessStat : public eoStat #else template class eoBestFitnessStat : public eoStat #endif { public: using eoStat::value; typedef typename EOT::Fitness Fitness; eoBestFitnessStat(std::string _description = "Best ") : eoStat(Fitness(), _description) {} void operator()(const eoPop& _pop) { doit(_pop, Fitness() ); // specializations for scalar and std::vector } virtual std::string className(void) const { return "eoBestFitnessStat"; } private : /* Very old code... struct CmpFitness { CmpFitness(unsigned _which, bool _maxim) : which(_which), maxim(_maxim) {} bool operator()(const EOT& a, const EOT& b) { if (maxim) return a.fitness()[which] < b.fitness()[which]; return a.fitness()[which] > b.fitness()[which]; } unsigned which; bool maxim; }; */ // default template void doit(const eoPop& _pop, T) { // find the largest elements value() = _pop.best_element().fitness(); } }; /** @example t-eoSSGA.cpp */ /** Keep the best individual found so far */ template class eoBestIndividualStat : public eoStat { public: using eoStat::value; eoBestIndividualStat(std::string _description = "BestIndiv ") : eoStat( EOT(), _description ) {} void operator()(const eoPop& pop) { EOT best = pop.best_element(); // on the first call, value() is invalid if( value().invalid() ) { // thus we cannot compare it to something else value() = best; } else { // keep the best individual found so far if( best.fitness() > value().fitness() ) { value() = best; } } } virtual std::string className(void) const { return "eoBestIndividualStat"; } }; template class eoDistanceStat : public eoStat { public: using eoStat::value; eoDistanceStat(std::string _name = "distance") : eoStat(0.0, _name) {} template double distance(T a, T b) { T res = a-b; return res < 0? -res : res; } double distance(bool a, bool b) { return (a==b)? 0 : 1; } void operator()(const eoPop& _pop) { double& v = value(); v = 0.0; for (unsigned i = 0; i < _pop.size(); ++i) { for (unsigned j = 0; j < _pop.size(); ++j) { for (unsigned k = 0; k < _pop[i].size(); ++k) { v += distance(_pop[i][k], _pop[j][k]); } } } double sz = _pop.size(); v /= sz * sz * _pop[0].size(); } virtual std::string className(void) const { return "eoDistanceStat"; } }; /* template class eoStdevStat : public eoStat { public : typedef typename eoSecondMomentStats::SquarePair SquarePair; eoStdevStat(std::string _description = "Stdev") : eoStat(0.0, _description) {} virtual void operator()(const eoPop& _pop) { SquarePair result = std::accumulate(pop.begin(), pop.end(), std::make_pair(0.0, 0.0), eoSecondMomentStats::sumOfSquares); double n = pop.size(); value() = sqrt( (result.second - (result.first / n)) / (n - 1.0)); // stdev } }; */ //! A robust measure of the mass (generally used to compute the median). Do not alter the given pop. template class eoNthElementStat : public eoStat< EOT, typename EOT::Fitness > { protected: int _nth; double _ratio; public: using eoStat::value; eoNthElementStat( int nth = 0, std::string description = "NthElement") : eoStat( 0.0, description ), _nth(nth), _ratio(-1.0) { assert( _nth >= 0 ); } eoNthElementStat( double ratio = 0.5, std::string description = "Median" ) : eoStat( 0.0, description ), _nth(-1), _ratio(ratio) { assert( _ratio >= 0 ); } virtual void operator()( const eoPop & _pop ) { unsigned int nth; if( _nth == -1 ) { // asked for a ratio assert( _ratio >= 0 && _ratio <= 1 ); nth = static_cast( std::floor(_pop.size() * _ratio) ); } else { assert( _ratio == -1 ); // asked for a position assert( _nth >= 0 ); nth = static_cast(_nth); } assert( nth < _pop.size() ); if( _pop.size() == 0 ) { //FIXME how to implement value() = 0 ? eo::log << eo::warnings << "Called " << className() << " on an empty pop, value unchanged" << std::endl; } else { eoPop pop = _pop; // copy, thus no sorting of the original pop std::nth_element( pop.begin(), pop.begin()+nth, pop.end() ); value() = pop[nth].fitness(); } } virtual std::string className(void) const { return "eoNthElementStat"; } }; /** @example t-eoIQRStat.cpp */ //! A robust measure of dispersion (also called midspread or middle fifty) that is the difference between the third and the first quartile. template class eoInterquartileRangeStat : public eoStat< EOT, typename EOT::Fitness > { public: using eoStat::value; eoInterquartileRangeStat( std::string description = "IQR" ) : eoStat( 0.0, description ) {} virtual void operator()( const eoPop & _pop ) { if( _pop.size() == 0 ) { //FIXME how to implement value() = 0 ? eo::log << eo::warnings << "Called " << className() << " on an empty pop, value unchanged" << std::endl; } else { eoPop pop = _pop; unsigned int quartile = pop.size()/4; std::nth_element( pop.begin(), pop.begin()+quartile*1, pop.end() ); typename EOT::Fitness Q1 = pop[quartile].fitness(); std::nth_element( pop.begin(), pop.begin()+quartile*3, pop.end() ); typename EOT::Fitness Q3 = pop[quartile*3].fitness(); value() = Q3 - Q1; } } virtual std::string className(void) const { return "eoInterquartileRangeStat"; } }; /** @example t-eoIQRStat.cpp */ /** Compute the average size of indivudals over the population * * Obviously, will work only on representations that implement the (standard) "size()" method, * like any STL container. */ template class eoAverageSizeStat : public eoStat< EOT, double> { public: using eoStat::value; eoAverageSizeStat( std::string description = "Av.Size" ) : eoStat( 0.0, description ) {} // 0 by default virtual void operator()( const eoPop & pop ) { size_t pop_size = pop.size(); std::vector sizes; sizes.reserve(pop_size); for( unsigned int i=0, s = pop_size; i(sum) / static_cast(pop_size); } virtual std::string className(void) const { return "eoAverageSizeStat"; } }; /** @} */ #endif