OpenMP improvements

git-svn-id: svn://scm.gforge.inria.fr/svnroot/paradiseo@1479 331e1502-861f-0410-8da2-ba01fb791d7f
This commit is contained in:
wcancino 2009-03-05 14:19:02 +00:00
commit 39e404d39c
4 changed files with 217 additions and 31 deletions

View file

@ -21,7 +21,7 @@
#include "treeIterator.h" #include "treeIterator.h"
#include <gsl/gsl_randist.h> #include <gsl/gsl_randist.h>
#include <gsl/gsl_cdf.h> #include <gsl/gsl_cdf.h>
#include "utils.h"
@ -185,6 +185,21 @@ void LikelihoodCalculator::set_tree( phylotreeIND &ind )
i++; i++;
} }
} }
graph::edge_iterator ite = tree_ptr->TREE.edges_begin();
graph::edge_iterator ite2 = tree_ptr->TREE.edges_end();
for(int i=0; ite!=ite2; i++)
{
for(int j=0; j < nrates; j++)
{
double len = tree_ptr->get_branch_length(*ite) * rates_prob[j];
len = (len < BL_MIN ? BL_MIN : len);
(part_memory_probmatrix_ptr+i*nrates)[j] = &( (*probmatrixs)[len] );
edgeprobmatrix[*ite] = part_memory_probmatrix_ptr+i*nrates;
}
++ite;
}
} }
double LikelihoodCalculator::calculate_likelihood_exp(edge focus) double LikelihoodCalculator::calculate_likelihood_exp(edge focus)
@ -345,11 +360,29 @@ double LikelihoodCalculator::calculate_likelihood()
for(int i=0; i<2; i++) for(int i=0; i<2; i++)
pthread_join(threads[i],NULL);*/ pthread_join(threads[i],NULL);*/
//cout << "calculando partials..." << endl; //cout << "calculando partials..." << endl;
struct timeval tempo1, tempo2, result;
gettimeofday(&tempo1, NULL);
calculate_partials( a, &b); calculate_partials( a, &b);
calculate_partials( b, &a); calculate_partials( b, &a);
//cout << "somando..." << endl; //cout << "somando..." << endl;
// sum all partials // sum all partials
lik = sum_site_liks(); lik = sum_site_liks();
gettimeofday(&tempo2, NULL);
timeval_subtract(&result,&tempo2,&tempo1);
long remainder = result.tv_sec % 3600;
long hours = (result.tv_sec - remainder)/3600;
long seconds = remainder % 60;
long minutes = (remainder - seconds) / 60;
cout << "Execution time : ";
cout.width(3);
cout.fill(' ');
cout << hours << ":";
cout.width(2);
cout.fill('0');
cout << minutes << ":";
cout.width(2);
cout.fill('0');
cout << seconds << "." << result.tv_usec << "(" << result.tv_sec << ")" << endl;
return lik; return lik;
} }
@ -363,16 +396,18 @@ double LikelihoodCalculator::sum_site_liks( )
for(int i=0; i< nrates; i++) for(int i=0; i< nrates; i++)
{ {
len = tree_ptr->get_branch_length(bfocus)*rates_prob[i]; //len = tree_ptr->get_branch_length(bfocus)*rates_prob[i];
len = len < BL_MIN ? BL_MIN : len; //len = len < BL_MIN ? BL_MIN : len;
ProbMatrix &p = (*probmatrixs)[ len]; ProbMatrix *p = edgeprobmatrix[bfocus][i]; //(*probmatrixs)[ len];
prob[i] = p.p; prob[i] = p->p;
} }
//#pragma omp parallel for private(factor_correct) schedule(dynamic) num_threads(2) reduction(+:lik)
for(int i=0; i < seqlen; i++) for(int i=0; i < seqlen; i++)
{ {
factor_correct = Factors[a][i] + Factors[b][i] ; factor_correct = Factors[a][i] + Factors[b][i] ;
site_liks[i] = sum_partials(i); site_liks[i] = sum_partials(i);
//#pragma omp critical
lik += ( log(site_liks[i]) + factor_correct)* SeqData->pattern_count(i); lik += ( log(site_liks[i]) + factor_correct)* SeqData->pattern_count(i);
} }
return lik; return lik;
@ -451,9 +486,8 @@ void LikelihoodCalculator::calculate_node_partial( node father, node son, edge e
register double sum; register double sum;
int r,i,j; int r,i,j;
//unsigned char l; //unsigned char l;
ProbMatrix *p;
register int seqlen = tree_ptr->number_of_positions(); register int seqlen = tree_ptr->number_of_positions();
#pragma omp parallel for private(p) schedule(dynamic) num_threads(2) #pragma omp parallel for
for(int k=0; k<seqlen;k++) for(int k=0; k<seqlen;k++)
{ {
long index = k*nrates*4; long index = k*nrates*4;
@ -463,11 +497,9 @@ void LikelihoodCalculator::calculate_node_partial( node father, node son, edge e
for(int r=0; r<nrates; r++) for(int r=0; r<nrates; r++)
{ {
double len = tree_ptr->get_branch_length(edgeaux) * rates_prob[r];
len = (len < BL_MIN ? BL_MIN : len);
double sum = 0; double sum = 0;
#pragma omp critical //#pragma omp critical
p = &((*probmatrixs)[ len ]); ProbMatrix *p = edgeprobmatrix[edgeaux][r];
for(int i=0; i < 4; i++) for(int i=0; i < 4; i++)
{ {
@ -528,7 +560,6 @@ void LikelihoodCalculator::init_partials()
// init internal nodes // init internal nodes
for(long i=0; i< size_part_memory_internal; i++) for(long i=0; i< size_part_memory_internal; i++)
part_memory_internal[i] = 1.0; part_memory_internal[i] = 1.0;
} }
// calculate the values of C_j for all nodes // calculate the values of C_j for all nodes
@ -544,3 +575,145 @@ void LikelihoodCalculator::calculate_partials(node n, node *antecessor)
} }
// omp code
/**
 * Computes the log-likelihood of the current tree with a single OpenMP loop
 * over the site patterns.
 *
 * The first edge of the tree is used as the focus branch (bfocus); `a` is the
 * end of that edge that is not a taxon (or the target when neither is) and
 * `b` is the opposite end. For every site the partials on both sides of the
 * focus branch are computed and the per-site value returned by
 * sum_site_liks_omp() is added to the total through an OpenMP reduction.
 *
 * Side effects: overwrites bfocus, a, b and prob[], calls init_partials(),
 * and prints the wall-clock time of the parallel loop to cout.
 *
 * @return the sum over all sites of sum_site_liks_omp(site).
 */
double LikelihoodCalculator::calculate_likelihood_omp()
{
    double lik = 0;

    // select an internal node as root
    bfocus = *(tree_ptr->TREE.edges_begin());
    a = tree_ptr->istaxon(bfocus.target()) ? bfocus.source() : bfocus.target();
    b = bfocus.opposite(a);
    init_partials();

    const int seqlen = tree_ptr->number_of_positions();

    // Cache, for each rate category, the `p` member of the probability
    // matrix registered in edgeprobmatrix for the focus branch.
    for (int i = 0; i < nrates; i++)
    {
        ProbMatrix *p = edgeprobmatrix[bfocus][i];
        prob[i] = p->p;
    }

    struct timeval tempo1, tempo2, result;
    gettimeofday(&tempo1, NULL);

    // Each iteration only touches the entries of site i, and the partial
    // sums are combined by the reduction clause.
    #pragma omp parallel for reduction(+:lik)
    for (int i = 0; i < seqlen; i++)
    {
        calculate_partials_omp(a, &b, i);
        calculate_partials_omp(b, &a, i);
        // add the contribution of this site
        lik += sum_site_liks_omp(i);
    }

    gettimeofday(&tempo2, NULL);
    timeval_subtract(&result, &tempo2, &tempo1);

    // Break the elapsed seconds down into hours / minutes / seconds.
    const long remainder = result.tv_sec % 3600;
    const long hours = (result.tv_sec - remainder) / 3600;
    const long seconds = remainder % 60;
    const long minutes = (remainder - seconds) / 60;

    // fill() returns the previous fill character; keep it so the stream can
    // be handed back in the state it was received.
    const char saved_fill = cout.fill(' ');
    cout << "Execution time : ";
    cout.width(3);
    cout << hours << ":";
    cout.fill('0');
    cout.width(2);
    cout << minutes << ":";
    cout.width(2);
    cout << seconds << ".";
    // Microseconds are a six-digit fraction of a second: without padding,
    // 1234 us would be shown as ".1234" instead of ".001234".
    // NOTE(review): assumes timeval_subtract leaves tv_usec in [0, 1000000).
    cout.width(6);
    cout << result.tv_usec << "(" << result.tv_sec << ")" << endl;
    cout.fill(saved_fill);

    return lik;
}
/**
 * Per-site contribution to the log-likelihood.
 *
 * Stores sum_partials(pos) in site_liks[pos] and returns its logarithm plus
 * the correction factors of nodes a and b at that site, multiplied by
 * SeqData->pattern_count(pos).
 *
 * @param pos index of the site pattern.
 * @return the weighted log-likelihood of the site.
 */
double LikelihoodCalculator::sum_site_liks_omp( int pos )
{
    // correction factors stored for the two member nodes a and b
    const double scaling = Factors[a][pos] + Factors[b][pos];

    // keep the raw site likelihood available through site_liks
    site_liks[pos] = sum_partials(pos);

    return ( log(site_liks[pos]) + scaling ) * SeqData->pattern_count(pos);
}
/**
 * Walks the post-order iterator obtained from
 * tree_ptr->postorder_begin(n, *antecessor) until it reaches n, updating
 * the partials of a single site at every step.
 *
 * @param n          node at which the traversal stops (it is not processed itself).
 * @param antecessor pointer to the node passed as second argument to postorder_begin.
 * @param pos        index of the site pattern to update.
 */
void LikelihoodCalculator::calculate_partials_omp(node n, node *antecessor, int pos)
{
    for (postorder_Iterator walker = tree_ptr->postorder_begin( n, *antecessor);
         *walker != n;
         ++walker)
    {
        // fold the current node into the node the iterator reports as its ancestor
        calculate_node_partial_omp( walker.ancestor(), *walker, walker.branch(), pos);
    }
}
/**
 * Multiplies the partials of `father` at one site by the contribution of
 * `son` seen through the branch `edgeaux`.
 *
 * For every rate category r and state i the contribution is:
 *  - son is a taxon with a defined character l:  p_ij_t(i, l);
 *  - son is a taxon with an ambiguous character: sum_j meaning[j] * p_ij_t(i, j);
 *  - son is a taxon with any other character:    1;
 *  - son is not a taxon:                         sum_j Partials[son][..j] * p_ij_t(i, j).
 *
 * The correction factor of the son is added to the father's, and when the
 * largest contribution falls outside [UMBRAL, 1/LIM_SCALE_VAL] the father's
 * partials for this site are divided by it and its logarithm is added to
 * Factors[father][pos].
 *
 * @param father  node whose partials are updated in place.
 * @param son     node whose partials (or observed character) are read.
 * @param edgeaux branch joining both nodes; selects the probability matrices.
 * @param pos     index of the site pattern.
 */
void LikelihoodCalculator::calculate_node_partial_omp( node father, node son, edge edgeaux, int pos)
{
    // Widen before multiplying: pos*nrates*4 evaluated in int can overflow
    // before the result is stored in a long.
    const long index = static_cast<long>(pos) * nrates * 4;

    // accumulate the correction factor of the son into the father
    Factors[father][pos] += Factors[son][pos];
    double corr_factor = MDBL_MIN;

    // Depends only on the son, so it is queried once instead of 4*nrates times.
    // NOTE(review): assumes istaxon() has no side effects.
    const bool son_is_taxon = tree_ptr->istaxon( son);

    for (int r = 0; r < nrates; r++)
    {
        // probability matrix registered for this branch and rate category
        ProbMatrix *p = edgeprobmatrix[edgeaux][r];
        for (int i = 0; i < 4; i++)
        {
            double sum = 0;
            if (son_is_taxon)
            {
                unsigned char l = SeqData->pattern_pos( pos, tree_ptr->taxon_id( son));
                if (SeqData->is_defined( l))
                    sum = p->p_ij_t( i, l );
                else if (SeqData->is_ambiguous( l))
                {
                    // weight each of the four states by the ambiguity table
                    unsigned char *meaning = SeqData->ambiguos_meaning( l);
                    for (int j = 0; j < 4; j++)
                        sum += meaning[j] * p->p_ij_t( i, j );
                }
                else
                    sum = 1;
            }
            else
            {
                for (int j = 0; j < 4; j++)
                    sum += Partials[son][index + r*4 + j] * p->p_ij_t( i, j );
            }
            Partials[father][index + r*4 + i] *= sum;
            // remember the largest contribution seen for this site
            corr_factor = ( sum > corr_factor ? sum : corr_factor);
        }
    }

    // rescale this site when the largest contribution is outside the allowed range
    if ( corr_factor < UMBRAL || corr_factor > (1./LIM_SCALE_VAL))
    {
        for (int r = 0; r < nrates; r++)
            for (int i = 0; i < 4; i++)
                Partials[father][index + r*4 + i] /= corr_factor;
        Factors[father][pos] += log(corr_factor);
    }
}

View file

@ -46,12 +46,14 @@ private:
double *part_memory_internal, // conditional likelihood of internal nodes double *part_memory_internal, // conditional likelihood of internal nodes
*part_memory_taxons, // conditional likelihood of internal nodes, no longer used *part_memory_taxons, // conditional likelihood of internal nodes, no longer used
*part_memory_factors; // correction factors for nodes *part_memory_factors; // correction factors for nodes
ProbMatrix **part_memory_probmatrix_ptr;
double *site_liks; // site likelihoods double *site_liks; // site likelihoods
// maps nodes to the contiguous memory // maps nodes to the contiguous memory
node_map< double *> Partials; // maps nodes to the corresponding conditional likelihood node_map< double *> Partials; // maps nodes to the corresponding conditional likelihood
node_map<double *> Factors; // maps node to the corresponding correct factors node_map<double *> Factors; // maps node to the corresponding correct factors
edge_map<ProbMatrix **> edgeprobmatrix; // maps the edge to the corresponding probability matrixs
// external data // external data
phylotreeIND *tree_ptr; // point to the tree phylotreeIND *tree_ptr; // point to the tree
@ -67,9 +69,11 @@ private:
// prepare the post-order tree iterator // prepare the post-order tree iterator
void calculate_partials(node n, node *); void calculate_partials(node n, node *);
void calculate_partials_omp(node n, node *, int pos);
// calculate conditional likelihood for the node father, from the son conditionals // calculate conditional likelihood for the node father, from the son conditionals
void calculate_node_partial( node father, node son, edge edgeaux); void calculate_node_partial( node father, node son, edge edgeaux);
void calculate_node_partial_omp( node father, node son, edge edgeaux, int pos);
// likelihood sum of partial for the focus branch // likelihood sum of partial for the focus branch
double sum_partials( int pos); double sum_partials( int pos);
double sum_partials_a_to_taxon( int pos ); double sum_partials_a_to_taxon( int pos );
@ -77,20 +81,25 @@ private:
// sum the site likelihoods // sum the site likelihoods
double sum_site_liks(); double sum_site_liks();
double sum_site_liks_omp(int pos);
// allocate partial memory // allocate partial memory
void allocate_partials() void allocate_partials()
{ {
long total_pos = SeqData->pattern_count(); long total_pos = SeqData->pattern_count();
int ntaxons = SeqData->num_seqs(); int ntaxons = SeqData->num_seqs();
//int nedges = tree_ptr->TREE.number_of_edges();
part_memory_internal = new double[ (ntaxons-2) * nrates * total_pos * 4 ]; part_memory_internal = new double[ (ntaxons-2) * nrates * total_pos * 4 ];
part_memory_factors = new double [ (2*ntaxons-2) * total_pos]; part_memory_factors = new double [ (2*ntaxons-2) * total_pos];
part_memory_probmatrix_ptr = new ProbMatrix* [ (2*ntaxons-3) * nrates ] ;
site_liks = new double[total_pos]; site_liks = new double[total_pos];
cout << "allocating done..." << endl;
} }
// destroy partial memory // destroy partial memory
void deallocate_partials() void deallocate_partials()
{ {
delete [] part_memory_probmatrix_ptr;
delete [] part_memory_internal; delete [] part_memory_internal;
delete [] part_memory_factors; delete [] part_memory_factors;
delete [] site_liks; delete [] site_liks;
@ -109,6 +118,7 @@ public:
// main functions, prepare the object to calculate likelihood // main functions, prepare the object to calculate likelihood
double calculate_likelihood(); double calculate_likelihood();
double calculate_likelihood_omp();
double get_site_lik(int i) { return site_liks[i]; } double get_site_lik(int i) { return site_liks[i]; }
double calculate_likelihood_exp(edge focus); double calculate_likelihood_exp(edge focus);
double calculate_all_likelihoods(); double calculate_all_likelihoods();

View file

@ -43,7 +43,8 @@ public:
} }
else else
{ {
ProbMatrix *new_prob_matrix = new ProbMatrix(model, branchlength); ProbMatrix *new_prob_matrix;
new_prob_matrix = new ProbMatrix(model, branchlength);
new_prob_matrix->init(); new_prob_matrix->init();
container[branchlength] = new_prob_matrix; container[branchlength] = new_prob_matrix;
return *new_prob_matrix; return *new_prob_matrix;

View file

@ -47,7 +47,7 @@ int main(int argc, char *argv[])
{ {
// measures execution time // measures execution time
struct timeval tempo1, tempo2, result; struct timeval tempo1, tempo2, result;
gettimeofday(&tempo1, NULL);
cout << "\n\nReading Sequence Datafile..."; cout << "\n\nReading Sequence Datafile...";
Sequences seq("/home/wcancino/experimentos/PhyloMOEA_0.2/500/500_ZILLA.plain"); Sequences seq("/home/wcancino/experimentos/PhyloMOEA_0.2/500/500_ZILLA.plain");
@ -80,11 +80,11 @@ int main(int argc, char *argv[])
for(int i=0; i < population.size(); i++) for(int i=0; i < population.size(); i++)
{ {
lik_calc.set_tree(population[i].get_tree());
cout << lik_calc.calculate_likelihood() << endl;
}
gettimeofday(&tempo2, NULL); lik_calc.set_tree(population[i].get_tree());
// gettimeofday(&tempo1, NULL);
cout << lik_calc.calculate_likelihood() << endl;
/* gettimeofday(&tempo2, NULL);
timeval_subtract(&result,&tempo2,&tempo1); timeval_subtract(&result,&tempo2,&tempo1);
long remainder = result.tv_sec % 3600; long remainder = result.tv_sec % 3600;
long hours = (result.tv_sec - remainder)/3600; long hours = (result.tv_sec - remainder)/3600;
@ -99,7 +99,9 @@ int main(int argc, char *argv[])
cout << minutes << ":"; cout << minutes << ":";
cout.width(2); cout.width(2);
cout.fill('0'); cout.fill('0');
cout << seconds << "." << result.tv_usec << "(" << result.tv_sec << ")" << endl; cout << seconds << "." << result.tv_usec << "(" << result.tv_sec << ")" << endl;*/
}
gsl_rng_free(rn2); gsl_rng_free(rn2);
// delete probmatrixs; // delete probmatrixs;
delete rn; delete rn;