diff --git a/bob/ip/binseg/test/test_models.py b/bob/ip/binseg/test/test_models.py
deleted file mode 100644
index 35e39db8c2e3641b22a8a4e563651b70c968b4dd..0000000000000000000000000000000000000000
--- a/bob/ip/binseg/test/test_models.py
+++ /dev/null
@@ -1,55 +0,0 @@
-#!/usr/bin/env python
-# -*- coding: utf-8 -*-
-
-import torch
-import unittest
-import numpy as np
-from bob.ip.binseg.modeling.driu import build_driu
-from bob.ip.binseg.modeling.driuod import build_driuod
-from bob.ip.binseg.modeling.hed import build_hed
-from bob.ip.binseg.modeling.unet import build_unet
-from bob.ip.binseg.modeling.resunet import build_res50unet
-
-class Tester(unittest.TestCase):
-    """
-    Unit test for model architectures
-    """
-    def setUp(self):
-        self.x = torch.randn(1, 3, 544, 544)
-        self.hw = np.array(self.x.shape)[[2,3]]
-    
-    def test_driu(self):
-        model = build_driu()
-        out = model(self.x)
-        out_hw = np.array(out.shape)[[2,3]]
-        self.assertEqual(self.hw.all(), out_hw.all())
-
-
-    def test_driuod(self):
-        model = build_driuod()
-        out = model(self.x)
-        out_hw = np.array(out.shape)[[2,3]]
-        self.assertEqual(self.hw.all(), out_hw.all())
-
-    def test_hed(self):
-        model = build_hed()
-        out = model(self.x)
-        # NOTE: HED outputs a list of length 4. We test only for the last concat-fuse layer
-        out_hw = np.array(out[4].shape)[[2,3]]
-        self.assertEqual(self.hw.all(), out_hw.all())
-
-    def test_unet(self):
-        model = build_unet()
-        out = model(self.x)
-        out_hw = np.array(out.shape)[[2,3]]
-        self.assertEqual(self.hw.all(), out_hw.all())
-
-    def test_resunet(self):
-        model = build_res50unet()
-        out = model(self.x)
-        out_hw = np.array(out.shape)[[2,3]]
-        self.assertEqual(self.hw.all(), out_hw.all())
-
-
-if __name__ == '__main__':
-    unittest.main()
\ No newline at end of file