Added CMA
This commit is contained in:
parent
dd81a3ebc8
commit
8b03a5232a
11 changed files with 1198 additions and 2 deletions
365
eo/src/es/CMAState.cpp
Normal file
365
eo/src/es/CMAState.cpp
Normal file
|
|
@ -0,0 +1,365 @@
|
|||
/*
|
||||
* C++ification of Nikolaus Hansen's original C-source code for the
|
||||
* CMA-ES
|
||||
*
|
||||
* C++-ificiation performed by Maarten Keijzer (C) 2005. Licensed under
|
||||
* the LGPL. Original copyright of Nikolaus Hansen can be found below
|
||||
*
|
||||
*
|
||||
* Some changes have been made to the original flow and logic of the
|
||||
* algorithm:
|
||||
*
|
||||
* - Numerical issues are now treated 'before' going into the eigenvector decomposition
|
||||
* (this was done out of convenience)
|
||||
* - dMaxSignifiKond (smallest x such that x == x + 1.0) replaced by
|
||||
* numeric_limits<double>::epsilon() (smallest x such that 1.0 != 1.0 + x)
|
||||
*
|
||||
*
|
||||
*/
|
||||
|
||||
/* --------------------------------------------------------- */
|
||||
/* --------------------------------------------------------- */
|
||||
/* --- File: cmaes.c -------- Author: Nikolaus Hansen --- */
|
||||
/* --------------------------------------------------------- */
|
||||
/*
|
||||
* CMA-ES for non-linear function minimization.
|
||||
*
|
||||
* Copyright (C) 1996, 2003 Nikolaus Hansen.
|
||||
* e-mail: hansen@bionik.tu-berlin.de
|
||||
*
|
||||
* This library is free software; you can redistribute it and/or
|
||||
* modify it under the terms of the GNU Lesser General Public
|
||||
* License as published by the Free Software Foundation; either
|
||||
* version 2.1 of the License, or (at your option) any later
|
||||
* version (see http://www.gnu.org/copyleft/lesser.html).
|
||||
*
|
||||
* This library is distributed in the hope that it will be useful,
|
||||
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
||||
* Lesser General Public License for more details.
|
||||
*
|
||||
* */
|
||||
/* --- Changes : ---
|
||||
* 03/03/21: argument const double *rgFunVal of
|
||||
* cmaes_ReestimateDistribution() was treated incorrectly.
|
||||
* 03/03/29: restart via cmaes_resume_distribution() implemented.
|
||||
* 03/03/30: Always max std dev / largest axis is printed first.
|
||||
* 03/08/30: Damping is adjusted for large mueff.
|
||||
* 03/10/30: Damping is adjusted for large mueff always.
|
||||
* 04/04/22: Cumulation time and damping for step size adjusted.
|
||||
* No iniphase but conditional update of pc.
|
||||
* Version 2.23.
|
||||
* */
|
||||
|
||||
#include <valarray>
|
||||
#include <limits>
|
||||
#include <iostream>
|
||||
#include <cassert>
|
||||
|
||||
#include <utils/eoRNG.h>
|
||||
|
||||
#include <es/CMAState.h>
|
||||
#include <es/CMAParams.h>
|
||||
#include <es/matrices.h>
|
||||
#include <es/eig.h>
|
||||
|
||||
using namespace std;
|
||||
|
||||
namespace eo {
|
||||
|
||||
struct CMAStateImpl {
|
||||
|
||||
CMAParams p;
|
||||
|
||||
lower_triangular_matrix C; // Covariance matrix
|
||||
square_matrix B; // Eigen vectors (in columns)
|
||||
valarray<double> d; // eigen values (diagonal matrix)
|
||||
valarray<double> pc; // Evolution path
|
||||
valarray<double> ps; // Evolution path for stepsize;
|
||||
|
||||
vector<double> mean; // current mean to sample around
|
||||
double sigma; // global step size
|
||||
|
||||
unsigned gen;
|
||||
vector<double> fitnessHistory;
|
||||
|
||||
|
||||
CMAStateImpl(const CMAParams& params_, const vector<double>& m, double sigma_) :
|
||||
p(params_),
|
||||
C(p.n), B(p.n), d(p.n), pc(p.n), ps(p.n), mean(m), sigma(sigma_),
|
||||
gen(0), fitnessHistory(3)
|
||||
{
|
||||
double trace = (p.initialStdevs * p.initialStdevs).sum();
|
||||
/* Initialize covariance structure */
|
||||
for (unsigned i = 0; i < p.n; ++i)
|
||||
{
|
||||
B[i][i] = 1.;
|
||||
d[i] = p.initialStdevs[i] * sqrt(p.n / trace);
|
||||
C[i][i] = d[i] * d[i];
|
||||
pc[i] = 0.;
|
||||
ps[i] = 0.;
|
||||
}
|
||||
|
||||
}
|
||||
|
||||
void sample(vector<double>& v) {
|
||||
unsigned n = p.n;
|
||||
v.resize(n);
|
||||
|
||||
vector<double> tmp(n);
|
||||
for (unsigned i = 0; i < n; ++i)
|
||||
tmp[i] = d[i] * rng.normal();
|
||||
|
||||
/* add mutation (sigma * B * (D*z)) */
|
||||
for (unsigned i = 0; i < n; ++i) {
|
||||
double sum = 0;
|
||||
for (unsigned j = 0; j < n; ++j) {
|
||||
sum += B[i][j] * tmp[j];
|
||||
}
|
||||
v[i] = mean[i] + sigma * sum;
|
||||
}
|
||||
}
|
||||
|
||||
void reestimate(const vector<const vector<double>* >& pop, double muBest, double muWorst) {
|
||||
|
||||
assert(pop.size() == p.mu);
|
||||
|
||||
unsigned n = p.n;
|
||||
|
||||
fitnessHistory[gen % fitnessHistory.size()] = muBest; // needed for divergence check
|
||||
|
||||
vector<double> oldmean = mean;
|
||||
valarray<double> BDz(n);
|
||||
|
||||
/* calculate xmean and rgBDz~N(0,C) */
|
||||
for (unsigned i = 0; i < n; ++i) {
|
||||
mean[i] = 0.;
|
||||
for (unsigned j = 0; j < pop.size(); ++j) {
|
||||
mean[i] += p.weights[j] * (*pop[j])[i];
|
||||
}
|
||||
BDz[i] = sqrt(p.mueff)*(mean[i] - oldmean[i])/sigma;
|
||||
}
|
||||
|
||||
vector<double> tmp(n);
|
||||
/* calculate z := D^(-1) * B^(-1) * rgBDz into rgdTmp */
|
||||
for (unsigned i = 0; i < n; ++i) {
|
||||
double sum = 0.0;
|
||||
for (unsigned j = 0; j < n; ++j) {
|
||||
sum += B[j][i] * BDz[j];
|
||||
}
|
||||
tmp[i] = sum / d[i];
|
||||
}
|
||||
|
||||
/* cumulation for sigma (ps) using B*z */
|
||||
for (unsigned i = 0; i < n; ++i) {
|
||||
double sum = 0.0;
|
||||
for (unsigned j = 0; j < n; ++j)
|
||||
sum += B[i][j] * tmp[j];
|
||||
|
||||
ps[i] = (1. - p.ccumsig) * ps[i] + sqrt(p.ccumsig * (2. - p.ccumsig)) * sum;
|
||||
}
|
||||
|
||||
/* calculate norm(ps)^2 */
|
||||
double psxps = (ps * ps).sum();
|
||||
|
||||
|
||||
double chiN = sqrt((double) p.n) * (1. - 1./(4.*p.n) + 1./(21.*p.n*p.n));
|
||||
/* cumulation for covariance matrix (pc) using B*D*z~N(0,C) */
|
||||
double hsig = sqrt(psxps) / sqrt(1. - pow(1.-p.ccumsig, 2.*gen)) / chiN < 1.5 + 1./(p.n-0.5);
|
||||
|
||||
pc = (1. - p.ccumcov) * pc + hsig * sqrt(p.ccumcov * (2. - p.ccumcov)) * BDz;
|
||||
|
||||
/* stop initial phase (MK, this was not reachable in the org code, deleted) */
|
||||
|
||||
/* remove momentum in ps, if ps is large and fitness is getting worse */
|
||||
|
||||
if (gen >= fitnessHistory.size()) {
|
||||
|
||||
// find direction from muBest and muWorst (muBest == muWorst handled seperately
|
||||
double direction = muBest < muWorst? -1.0 : 1.0;
|
||||
|
||||
unsigned now = gen % fitnessHistory.size();
|
||||
unsigned prev = (gen-1) % fitnessHistory.size();
|
||||
unsigned prevprev = (gen-2) % fitnessHistory.size();
|
||||
|
||||
bool fitnessWorsens = (muBest == muWorst) || // <- increase norm also when population has converged (this deviates from Hansen's scheme)
|
||||
( (direction * fitnessHistory[now] < direction * fitnessHistory[prev])
|
||||
&&
|
||||
(direction * fitnessHistory[now] < direction * fitnessHistory[prevprev]));
|
||||
|
||||
if(psxps/p.n > 1.5 + 10.*sqrt(2./p.n) && fitnessWorsens) {
|
||||
double tfac = sqrt((1 + std::max(0., log(psxps/p.n))) * p.n / psxps);
|
||||
ps *= tfac;
|
||||
psxps *= tfac*tfac;
|
||||
}
|
||||
}
|
||||
|
||||
/* update of C */
|
||||
/* Adapt_C(t); not used anymore */
|
||||
if (p.ccov != 0.) {
|
||||
//flgEigensysIsUptodate = 0;
|
||||
|
||||
/* update covariance matrix */
|
||||
for (unsigned i = 0; i < n; ++i) {
|
||||
vector<double>::iterator c_row = C[i];
|
||||
for (unsigned j = 0; j <= i; ++j) {
|
||||
c_row[j] =
|
||||
(1 - p.ccov) * c_row[j]
|
||||
+
|
||||
p.ccov * (1./p.mucov) * pc[i] * pc[j]
|
||||
+
|
||||
(1-hsig) * p.ccumcov * (2. - p.ccumcov) * c_row[j];
|
||||
|
||||
/*C[i][j] = (1 - p.ccov) * C[i][j]
|
||||
+ sp.ccov * (1./sp.mucov)
|
||||
* (rgpc[i] * rgpc[j]
|
||||
+ (1-hsig)*sp.ccumcov*(2.-sp.ccumcov) * C[i][j]); */
|
||||
for (unsigned k = 0; k < p.mu; ++k) { /* additional rank mu update */
|
||||
c_row[j] += p.ccov * (1-1./p.mucov) * p.weights[k]
|
||||
* ( (*pop[k])[i] - oldmean[i])
|
||||
* ( (*pop[k])[j] - oldmean[j])
|
||||
/ sigma / sigma;
|
||||
|
||||
// * (rgrgx[index[k]][i] - rgxold[i])
|
||||
// * (rgrgx[index[k]][j] - rgxold[j])
|
||||
// / sigma / sigma;
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
/* update of sigma */
|
||||
sigma *= exp(((sqrt(psxps)/chiN)-1.)/p.damp);
|
||||
/* calculate eigensystem, must be done by caller */
|
||||
//cmaes_UpdateEigensystem(0);
|
||||
|
||||
|
||||
/* treat minimal standard deviations and numeric problems
|
||||
* Note that in contrast with the original code, some numerical issues are treated *before* we
|
||||
* go into the eigenvalue calculation */
|
||||
|
||||
treatNumericalIssues(muBest, muWorst);
|
||||
|
||||
gen++; // increase generation
|
||||
}
|
||||
|
||||
void treatNumericalIssues(double best, double worst) {
|
||||
|
||||
/* treat stdevs */
|
||||
for (unsigned i = 0; i < p.n; ++i) {
|
||||
if (sigma * sqrt(C[i][i]) < p.minStdevs[i]) {
|
||||
// increase stdev
|
||||
sigma *= exp(0.05+1./p.damp);
|
||||
break;
|
||||
}
|
||||
}
|
||||
|
||||
/* treat convergence */
|
||||
if (best == worst) {
|
||||
sigma *= exp(0.2 + 1./p.damp);
|
||||
}
|
||||
|
||||
/* Jede Hauptachse i testen, ob x == x + 0.1 * sigma * rgD[i] * B[i] */
|
||||
/* Test if all the means are not numerically out of whack with our coordinate system*/
|
||||
for (unsigned axis = 0; axis < p.n; ++axis) {
|
||||
double fac = 0.1 * sigma * d[axis];
|
||||
unsigned coord;
|
||||
for (coord = 0; coord < p.n; ++coord) {
|
||||
if (mean[coord] != mean[coord] + fac * B[coord][axis]) {
|
||||
break;
|
||||
}
|
||||
}
|
||||
|
||||
if (coord == p.n) { // means are way too big (little) for numerical accuraccy. Start rocking the craddle a bit more
|
||||
sigma *= exp(0.2+1./p.damp);
|
||||
}
|
||||
|
||||
}
|
||||
|
||||
/* Testen ob eine Komponente des Objektparameters festhaengt */
|
||||
/* Correct issues with scale between objective values and covariances */
|
||||
bool theresAnIssue = false;
|
||||
|
||||
for (unsigned i = 0; i < p.n; ++i) {
|
||||
if (mean[i] == mean[i] + 0.2 * sigma * sqrt(C[i][i])) {
|
||||
C[i][i] *= (1. + p.ccov);
|
||||
theresAnIssue = true;
|
||||
}
|
||||
}
|
||||
|
||||
if (theresAnIssue) {
|
||||
sigma *= exp(0.05 + 1./p.damp);
|
||||
}
|
||||
}
|
||||
|
||||
|
||||
bool updateEigenSystem(unsigned max_tries, unsigned max_iters) {
|
||||
|
||||
if (max_iters==0) max_iters = 30 * p.n;
|
||||
|
||||
static double lastGoodMinimumEigenValue = 1.0;
|
||||
|
||||
/* Try to get a valid calculation */
|
||||
for (unsigned tries = 0; tries < max_tries; ++tries) {
|
||||
|
||||
unsigned iters = eig( p.n, C, d, B, max_iters);
|
||||
if (iters < max_iters)
|
||||
{ // all is well
|
||||
|
||||
/* find largest/smallest eigenvalues */
|
||||
double minEV = d.min();
|
||||
double maxEV = d.max();
|
||||
|
||||
/* (MK Original comment was) :Limit Condition of C to dMaxSignifKond+1
|
||||
* replaced dMaxSignifKond with 1./numeric_limits<double>::epsilon()
|
||||
* */
|
||||
if (maxEV * numeric_limits<double>::epsilon() > minEV) {
|
||||
double tmp = maxEV * numeric_limits<double>::epsilon() - minEV;
|
||||
minEV += tmp;
|
||||
for (unsigned i=0;i<p.n;++i) {
|
||||
C[i][i] += tmp;
|
||||
d[i] += tmp;
|
||||
}
|
||||
} /* if */
|
||||
lastGoodMinimumEigenValue = minEV;
|
||||
|
||||
d = sqrt(d);
|
||||
|
||||
//flgEigensysIsUptodate = 1;
|
||||
//genOfEigensysUpdate = gen;
|
||||
//clockeigensum += clock() - clockeigenbegin;
|
||||
return true;
|
||||
} /* if cIterEig < ... */
|
||||
|
||||
// numerical problems, ignore them and try again
|
||||
|
||||
/* Addition des letzten minEW auf die Diagonale von C */
|
||||
/* Add the last known good eigen value to the diagonal of C */
|
||||
double summand = lastGoodMinimumEigenValue * exp((double) tries);
|
||||
for (unsigned i = 0; i < p.n; ++i)
|
||||
C[i][i] += summand;
|
||||
|
||||
} /* for iEigenCalcVers */
|
||||
|
||||
return false;
|
||||
|
||||
}
|
||||
|
||||
|
||||
};
|
||||
|
||||
CMAState::CMAState(const CMAParams& params, const std::vector<double>& initial_point, const double initial_sigma)
|
||||
: pimpl(new CMAStateImpl(params, initial_point, initial_sigma)) {}
|
||||
|
||||
CMAState::~CMAState() { delete pimpl; }
|
||||
CMAState::CMAState(const CMAState& that) : pimpl(new CMAStateImpl(*that.pimpl )) {}
|
||||
CMAState& CMAState::operator=(const CMAState& that) { *pimpl = *that.pimpl; return *this; }
|
||||
|
||||
void CMAState::sample(vector<double>& v) const { pimpl->sample(v); }
|
||||
|
||||
void CMAState::reestimate(const vector<const vector<double>* >& population, double muBest, double muWorst) { pimpl->reestimate(population, muBest, muWorst); }
|
||||
bool CMAState::updateEigenSystem(unsigned max_tries, unsigned max_iters) { return pimpl->updateEigenSystem(max_tries, max_iters); }
|
||||
|
||||
|
||||
} // namespace eo
|
||||
|
||||
Reference in a new issue