[mareframe] Diff of /trunk/gadget/hooke.cc

Diff of /trunk/gadget/hooke.cc

-revision 14, Thu Jul 30 12:36:46 2015 UTC
+revision 19, Wed May 25 16:36:33 2016 UTC
 Line 139
  #include "ecosystem.h"
  #include "global.h"
- #ifndef NO_OPENMP
+ #ifdef _OPENMP
  #include "omp.h"
  #endif
  extern Ecosystem* EcoSystem;
- #ifndef NO_OPENMP
+ #ifdef _OPENMP
  extern Ecosystem** EcoSystems;
  #endif
 Line 178
  }
  /* given a point, look for a better one nearby, one coord at a time */
- #ifndef NO_OPENMP
+ #ifdef _OPENMP
  /*
   * function bestNearby parallelized with OpenMP
   * · 2 threads per coord to parallelize the calculation of +delta/-delta
   * · parallelize the calculation of the best nearby of the coord
   */
- double OptInfoHooke::bestNearbyOMP(DoubleVector& delta, DoubleVector& point, double prevbest, IntVector& param) {
+ double OptInfoHooke::bestNearbyRepro(DoubleVector& delta, DoubleVector& point, double prevbest, IntVector& param) {
    double minf;//, ftmp;
    int i, j, k;
    DoubleVector z(point);
 Line 209
            return -1;
    }
+ //  omp_set_dynamic(0);
+ //  omp_set_nested(1); //permit the nested parallelization
    while ( i < nvars) {
            if ((i + paral_tokens -1) >= nvars)
                    paral_tokens = nvars - i;
-           omp_set_dynamic(0);
+ #pragma omp parallel for num_threads(paral_tokens*2) private(k) //parallelize the parameters (numThr)
-           omp_set_nested(1); //permit the nested parallelization
+           for (j = 0; j < (paral_tokens*2); ++j) {
- #pragma omp parallel for num_threads(paral_tokens) private(k) //parallelize the parameters (numThr/2)
-           for (j = 0; j < paral_tokens; ++j) {
                    storage[j].z = z;
                    storage[j].delta = delta;
-                   DoubleVector v1(z);
+                   DoubleVector v(z);
-                   DoubleVector v2(z);
-                   k = param[i+j];
-                   v1[k] +=  delta[k];
-                   v2[k] -=  delta[k];
- #pragma omp parallel sections num_threads(2) //parrallelize the +/- delta simulation for each parameter
+                   if (j<paral_tokens) {
-                   {
+                           k = param[i+j];
-         #pragma omp section
+                           v[k] +=  delta[k];
-                           {
-                   storage[j].ftmp = EcoSystems[j]->SimulateAndUpdate(v1);
-                           }
-         #pragma omp section
-                           {
-                   storage[j+paral_tokens].ftmp = EcoSystems[j+paral_tokens]->SimulateAndUpdate(v2);
                            }
+                   else {
+                           k = param[i+j-paral_tokens];
+                           v[k] -=  delta[k];
                    }
+                   storage[j].ftmp = EcoSystems[j]->SimulateAndUpdate(v);
+                   storage[j].z[k] = v[k];
+           }
+           for (j = 0; j < paral_tokens; ++j) {
+                   k = param[i+j];
                    if (storage[j].ftmp < minf) {
                            storage[j].iters = 1;
-                           storage[j].z[k] = v1[k];
+ //                        storage[j].z[k] = v1[k];
                    } else {
                            storage[j].iters = 2;
                            storage[j].delta[k] = 0.0 - delta[k];
                            if (storage[j+paral_tokens].ftmp < minf) {
                                    storage[j].ftmp = storage[j+paral_tokens].ftmp;
-                                   storage[j].z[k] = v2[k];
+                                   storage[j].z[k] = storage[j+paral_tokens].z[k];;
                            }
                    }
            }
-Line 260
+Line 258
                    }
            }
    }
+   delete[] storage;
    for (i = 0; i < nvars; ++i)
      point[i] = z[i];
    return minf;
-Line 289
+Line 287
    IntVector trapped(nvars, 0);
    EcoSystem->scaleVariables();
- #ifndef NO_OPENMP
+ #ifdef _OPENMP
    int numThr = omp_get_max_threads ( );
    for (i = 0; i < numThr; i++) // scale the variables for the ecosystem of every thread
            EcoSystems[i]->scaleVariables();
-Line 334
+Line 332
    while (1) {
      if (isZero(bestf)) {
- #ifdef NO_OPENMP
+ #ifndef _OPENMP
        iters = EcoSystem->getFuncEval() - offset;
  #endif
        handle.logMessage(LOGINFO, "Error in Hooke & Jeeves optimisation after", iters, "function evaluations, f(x) = 0");
-Line 359
+Line 357
      /* find best new point, one coord at a time */
      for (i = 0; i < nvars; i++)
        trialx[i] = x[i];
- #ifndef NO_OPENMP
+ #ifdef _OPENMP
-     newf = this->bestNearbyOMP(delta, trialx, bestf, param);
+     newf = this->bestNearbyRepro(delta, trialx, bestf, param);
      if (newf == -1) {
          handle.logMessage(LOGINFO, "\nStopping Hooke & Jeeves optimisation algorithm\n");
          handle.logMessage(LOGINFO, "\nThe number of threads must be a multiple of 2\n");
-Line 371
+Line 369
  #endif
      /* if too many function evaluations occur, terminate the algorithm */
- #ifdef NO_OPENMP
+ #ifndef _OPENMP
      iters = EcoSystem->getFuncEval() - offset;
  #endif
      if (iters > hookeiter) {
-Line 441
+Line 439
        /* only move forward if this is really an improvement    */
        oldf = newf;
        newf = EcoSystem->SimulateAndUpdate(trialx);
- #ifndef NO_OPENMP
+ #ifdef _OPENMP
        iters++;
  #endif
        if ((isEqual(newf, oldf)) || (newf > oldf)) {
-Line 454
+Line 452
        for (i = 0; i < nvars; i++)
          x[i] = trialx[i];
- #ifndef NO_OPENMP
+ #ifdef _OPENMP
-       newf = this->bestNearbyOMP(delta, trialx, bestf, param);
+       newf = this->bestNearbyRepro(delta, trialx, bestf, param);
        if (newf == -1) {
                  handle.logMessage(LOGINFO, "\nStopping Hooke & Jeeves optimisation algorithm\n");
                  handle.logMessage(LOGINFO, "\nThe number of threads must be a multiple of 2\n");
-Line 468
+Line 466
          break;
        /* if too many function evaluations occur, terminate the algorithm */
- #ifdef NO_OPENMP
+ #ifndef _OPENMP
        iters = EcoSystem->getFuncEval() - offset;
  #endif
        if (iters > hookeiter) {
-Line 485
+Line 483
          EcoSystem->storeVariables(score, bestx);
          return;
        }
-     }
+     } // while (newf < bestf)
- #ifdef NO_OPENMP
+ #ifndef _OPENMP
      iters = EcoSystem->getFuncEval() - offset;
  #endif
      if (newf < bestf) {
-Line 524
+Line 522
  }
  /* Functions to perform the parallelization of the algorithm of HJ with OpenMP*/
- #ifdef GADGET_OPENMP
+ #ifdef SPECULATIVE
- double OptInfoHooke::bestNearbyOMP2(DoubleVector& delta, DoubleVector& point, double prevbest, IntVector& param) {
+ double OptInfoHooke::bestNearbySpec(DoubleVector& delta, DoubleVector& point, double prevbest, IntVector& param) {
    double minf;
    int i, j, k, ii;
    DoubleVector z(point);
-Line 549
+Line 547
            return -1;
    }
+ //  omp_set_dynamic(0);
+ //  omp_set_nested(1); //permit the nested parallelization
    for (ii=0; ii< paral_tokens; ii++) {
            i = 0;
            while ( i < nvars) {
                    if ((i + paral_tokens -1) >= nvars)
                            paral_tokens = nvars - i;
-                   omp_set_dynamic(0);
+         #pragma omp parallel for num_threads(paral_tokens*2) private(k)
-                   omp_set_nested(1);
+                   for (j = 0; j < (paral_tokens*2); ++j) {
-         #pragma omp parallel for num_threads(paral_tokens) private(k)
-                   for (j = 0; j < paral_tokens; ++j) {
                            storage[j].z = z;
                            storage[j].delta = delta;
-                           DoubleVector v1(z);
+                           DoubleVector v(z);
-                           DoubleVector v2(z);
-                           k = param[i+j];
-                           v1[k] +=  delta[k];
-                           v2[k] -=  delta[k];
- #pragma omp parallel sections num_threads(2)
+                           if (j<paral_tokens) {
-                           {
+                                   k = param[i+j];
-           #pragma omp section
+                                   v[k] +=  delta[k];
-                                   {
+                           }
-                           storage[j].ftmp = EcoSystems[j]->SimulateAndUpdate(v1);
+                           else {
-                                   }
+                                   k = param[i+j-paral_tokens];
-           #pragma omp section
+                                   v[k] -=  delta[k];
-                                   {
-                           storage[j+paral_tokens].ftmp = EcoSystems[j+paral_tokens]->SimulateAndUpdate(v2);
                                    }
+                           storage[j].ftmp = EcoSystems[j]->SimulateAndUpdate(v);
+                           storage[j].z[k] = v[k];
                            }
+                   for (j = 0; j < paral_tokens; ++j) {
+                           k = param[i+j];
                            if (storage[j].ftmp < minf) {
                                    storage[j].iters = 1;
-                                   storage[j].z[k] = v1[k];
+ //                                storage[j].z[k] = v1[k];
                            } else {
                                    storage[j].iters = 2;
                                    storage[j].delta[k] = 0.0 - delta[k];
                                    if (storage[j+paral_tokens].ftmp < minf) {
                                            storage[j].ftmp = storage[j+paral_tokens].ftmp;
-                                           storage[j].z[k] = v2[k];
+                                           storage[j].z[k] = storage[j+paral_tokens].z[k];
                                    }
                                    else iters += 2;
                            }
-Line 605
+Line 603
                    i += paral_tokens;
            }
+           paral_tokens = numThr / 2;
          }
    delete[] storage;
-Line 678
+Line 677
             while (1) {
               if (isZero(bestf)) {
-          #ifdef NO_OPENMP
+          #ifndef _OPENMP
                 iters = EcoSystem->getFuncEval() - offset;
           #endif
                 handle.logMessage(LOGINFO, "Error in Hooke & Jeeves optimisation after", iters, "function evaluations, f(x) = 0");
-Line 703
+Line 702
               /* find best new point, one coord at a time */
               for (i = 0; i < nvars; i++)
                 trialx[i] = x[i];
-          #ifndef NO_OPENMP
+          #ifdef _OPENMP
-              newf = this->bestNearbyOMP2(delta, trialx, bestf, param);
+              newf = this->bestNearbySpec(delta, trialx, bestf, param);
               if (newf == -1) {
                  handle.logMessage(LOGINFO, "\nStopping Hooke & Jeeves optimisation algorithm\n");
                  handle.logMessage(LOGINFO, "\nThe number of threads must be a multiple of 2\n");
-Line 715
+Line 714
           #endif
               /* if too many function evaluations occur, terminate the algorithm */
-          #ifdef NO_OPENMP
+          #ifndef _OPENMP
               iters = EcoSystem->getFuncEval() - offset;
           #endif
               if (iters > hookeiter) {
-Line 785
+Line 784
                 /* only move forward if this is really an improvement    */
                 oldf = newf;
                 newf = EcoSystem->SimulateAndUpdate(trialx);
-          #ifndef NO_OPENMP
+          #ifdef _OPENMP
                 iters++;
           #endif
                 if ((isEqual(newf, oldf)) || (newf > oldf)) {
-Line 798
+Line 797
                 for (i = 0; i < nvars; i++)
                   x[i] = trialx[i];
-          #ifndef NO_OPENMP
+          #ifdef _OPENMP
-                newf = this->bestNearbyOMP2(delta, trialx, bestf, param);
+                newf = this->bestNearbySpec(delta, trialx, bestf, param);
                 if (newf == -1) {
                          handle.logMessage(LOGINFO, "\nStopping Hooke & Jeeves optimisation algorithm\n");
                          handle.logMessage(LOGINFO, "\nThe number of threads must be a multiple of 2\n");
-Line 812
+Line 811
                   break;
                 /* if too many function evaluations occur, terminate the algorithm */
-          #ifdef NO_OPENMP
+          #ifndef _OPENMP
                 iters = EcoSystem->getFuncEval() - offset;
           #endif
                 if (iters > hookeiter) {
-Line 831
+Line 830
                 }
               }
-          #ifdef NO_OPENMP
+          #ifndef _OPENMP
               iters = EcoSystem->getFuncEval() - offset;
           #endif
               if (newf < bestf) {

 Legend:

-Removed from v.14
 changed lines
+Added in v.19

root@forge.cesga.es	ViewVC Help
Powered by ViewVC 1.0.0