diff --git a/bob/ip/binseg/script/significance.py b/bob/ip/binseg/script/significance.py
index 1e4d5e8e0c9d907d5e5af990a6610db713a878fa..1dd98283eb982169d5a398a9b7a33632e82bdddf 100755
--- a/bob/ip/binseg/script/significance.py
+++ b/bob/ip/binseg/script/significance.py
@@ -137,7 +137,7 @@ def _eval_patches(
             f"'{system_name}' using {steps} steps"
         )
         threshold = run_evaluation(
-            dataset[threshold], threshold, predictions[0], steps=steps
+            dataset[threshold], threshold, preddir, steps=steps
         )
         logger.info(f"Set --threshold={threshold:.5f} for '{system_name}'")