Reverting the commits 4559a42f c484c4bc b7370ae7 477f685d

5a7ec24b · Tiago de Freitas Pereira · 9ddad2a4 · 5a7ec24b · 5a7ec24b · 5a7ec24b
Commit 5a7ec24b authored 9 years ago by Tiago de Freitas Pereira
--- a/bob/measure/data/nonsep-epc.hdf5
+++ b/bob/measure/data/nonsep-epc.hdf5
--- a/bob/measure/error.h
+++ b/bob/measure/error.h
@@ -13,7 +13,6 @@
 #include <blitz/array.h>
 #include <utility>
 #include <vector>
-#include <algorithm>
 namespace bob { namespace measure {
@@ -108,6 +107,61 @@ namespace bob { namespace measure {
      return blitz::Array<bool,1>(negatives < threshold);
    }
+  /**
+   * Recursively minimizes w.r.t. to the given predicate method. Please refer
+   * to minimizingThreshold() for a full explanation. This method is only
+   * supposed to be used through that method.
+   */
+  template <typename T>
+  static double recursive_minimization(const blitz::Array<double,1>& negatives,
+      const blitz::Array<double,1>& positives, T& predicate,
+      double min, double max, size_t steps) {
+    static const double QUIT_THRESHOLD = 1e-10;
+    const double diff = max - min;
+    const double too_small = std::abs(diff/max);
+    //if the difference between max and min is too small, we quit.
+    if ( too_small < QUIT_THRESHOLD ) return min; //or max, does not matter...
+    double step_size = diff/(double)steps;
+    double min_value = predicate(1.0, 0.0); ///< to the left of the range
+    //the accumulator holds the thresholds that given the minimum value for the
+    //input predicate.
+    std::vector<double> accumulator;
+    accumulator.reserve(steps);
+    for (size_t i=0; i<steps; ++i) {
+      double threshold = ((double)i * step_size) + min;
+      std::pair<double, double> ratios =
+        farfrr(negatives, positives, threshold);
+      double current_cost = predicate(ratios.first, ratios.second);
+      if (current_cost < min_value) {
+        min_value = current_cost;
+        accumulator.clear(); ///< clean-up, we got a better minimum
+        accumulator.push_back(threshold); ///< remember this threshold
+      }
+      else if (std::abs(current_cost - min_value) < 1e-16) {
+        //accumulate to later decide...
+        accumulator.push_back(threshold);
+      }
+    }
+    //we stop when it doesn't matter anymore to threshold.
+    if (accumulator.size() != steps) {
+      //still needs some refinement: pick-up the middle of the range and go
+      return recursive_minimization(negatives, positives, predicate,
+          accumulator[accumulator.size()/2]-step_size,
+          accumulator[accumulator.size()/2]+step_size,
+          steps);
+    }
+    return accumulator[accumulator.size()/2];
+  }
  /**
   * This method can calculate a threshold based on a set of scores (positives
   * and negatives) given a certain minimization criteria, input as a
@@ -124,94 +178,28 @@ namespace bob { namespace measure {
   * Please note that this method will only work with single-minimum smooth
   * predicates.
   *
-   * The minimization is carried out in a data-driven way.
+   * The minimization is carried out in a recursive manner. First, we identify
-   * First, it sorts the positive and negative scores.
+   * the threshold that minimizes the predicate given a set of N (N=100)
-   * Starting from the lowest score (might be a positive or a negative), it
+   * thresholds between the min(negatives, positives) and the max(negatives,
-   * increases the threshold based on the distance between the current score
+   * positives). If the minimum lies in a range of values, the center value is
-   * and the following higher score (also keeping track of duplicate scores)
+   * picked up.
-   * and computes the predicate for each possible threshold.
   *
-   * Finally, that threshold is returned, for which the predicate returned the
+   * In a second round of minimization new minimum and maximum bounds are
-   * lowest value.
+   * defined based on the center value plus/minus the step (max-min/N) and a
+   * new minimization round is restarted for N samples within the new bounds.
+   *
+   * The procedure continues until all calculated predicates in a given round
+   * give the same minimum. At this point, the center threshold is picked up and
+   * returned.
   */
-  template <typename T>
+  template <typename T> double
-  double minimizingThreshold(const blitz::Array<double,1>& negatives, const blitz::Array<double,1>& positives, T& predicate){
+    minimizingThreshold(const blitz::Array<double,1>& negatives,
-    // sort negative and positive scores ascendingly
+        const blitz::Array<double,1>& positives, T& predicate) {
-    std::vector<double> negatives_(negatives.extent(0));
+      const size_t N = 100; ///< number of steps in each iteration
-    std::copy(negatives.begin(), negatives.end(), negatives_.begin());
+      double min = std::min(blitz::min(negatives), blitz::min(positives));
-    std::sort(negatives_.begin(), negatives_.end(), std::less<double>());
+      double max = std::max(blitz::max(negatives), blitz::max(positives));
+      return recursive_minimization(negatives, positives, predicate, min,
-    std::vector<double> positives_(positives.extent(0));
+          max, N);
-    std::copy(positives.begin(), positives.end(), positives_.begin());
-    std::sort(positives_.begin(), positives_.end(), std::less<double>());
-    // iterate over the whole set of points
-    std::vector<double>::const_iterator pos_it = positives_.begin(), neg_it = negatives_.begin();
-    // iterate over all possible far and frr points and compute the predicate for each possible threshold...
-    double min_predicate = 1e8;
-    double min_threshold = 1e8;
-    double current_predicate = 1e8;
-    // we start with the extreme values for far and frr
-    double far = 1., frr = 0.;
-    // the decrease/increase for far/frr when moving one negative/positive
-    double far_decrease = 1./negatives_.size(), frr_increase = 1./positives_.size();
-    // we start with the threshold based on the minimum score
-    double current_threshold = std::min(*pos_it, *neg_it);
-    // now, iterate over both lists, in a sorted order
-    while (pos_it != positives_.end() && neg_it != negatives_.end()){
-      // compute predicate
-      current_predicate = predicate(far, frr);
-      if (current_predicate <= min_predicate){
-        min_predicate = current_predicate;
-        min_threshold = current_threshold;
-      }
-      if (*pos_it >= *neg_it){
-        // compute current threshold
-        current_threshold = *neg_it;
-        // go to the next negative value
-        ++neg_it;
-        far -= far_decrease;
-      } else {
-        // compute current threshold
-        current_threshold = *pos_it;
-        // go to the next positive
-        ++pos_it;
-        frr += frr_increase;
-      }
-      // increase positive and negative as long as they contain the same value
-      while (neg_it != negatives_.end() && *neg_it == current_threshold) {
-        // go to next negative
-        ++neg_it;
-        far -= far_decrease;
-      }
-      while (pos_it != positives_.end() && *pos_it == current_threshold) {
-        // go to next positive
-        ++pos_it;
-        frr += frr_increase;
-      }
-      // compute a new threshold based on the center between last and current score, if we are not already at the end of the score lists
-      if (neg_it != negatives_.end() || pos_it != positives_.end()){
-        if (neg_it != negatives_.end() && pos_it != positives_.end())
-          current_threshold += std::min(*pos_it, *neg_it);
-        else if (neg_it != negatives_.end())
-          current_threshold += *neg_it;
-        else
-          current_threshold += *pos_it;
-        current_threshold /= 2;
-      }
-    } // while
-    // now, we have reached the end of one list (usually the negatives)
-    // so, finally compute predicate for the last time
-    current_predicate = predicate(far, frr);
-    if (current_predicate < min_predicate){
-      min_predicate = current_predicate;
-      min_threshold = current_threshold;
-    }
-    // return the best threshold found
-    return min_threshold;
    }
  /**

--- a/bob/measure/test_error.py
+++ b/bob/measure/test_error.py
@@ -211,7 +211,7 @@ def test_plots():
  xy = epc(dev_negatives, dev_positives,
      test_negatives, test_positives, 100)
  # uncomment the next line to save a reference value
-  # bob.io.base.save(xy, F('nonsep-epc.hdf5'))
+  # save('nonsep-epc.hdf5', xy)
  xyref = bob.io.base.load(F('nonsep-epc.hdf5'))
  assert numpy.allclose(xy, xyref, atol=1e-15)

--- a/version.txt
+++ b/version.txt
-2.1.0b0
+2.0.5b0
\ No newline at end of file