diff --git a/src/ptbench/configs/datasets/tbx11k_simplified/__init__.py b/src/ptbench/configs/datasets/tbx11k_simplified/__init__.py
new file mode 100644
index 0000000000000000000000000000000000000000..643625e0679047392d7c214c524452b405ca0d15
--- /dev/null
+++ b/src/ptbench/configs/datasets/tbx11k_simplified/__init__.py
@@ -0,0 +1,33 @@
+# Copyright © 2022 Idiap Research Institute <contact@idiap.ch>
+#
+# SPDX-License-Identifier: GPL-3.0-or-later
+
+
+def _maker(protocol, RGB=False):
+    """Return the TBX11k simplified dataset built for ``protocol``.
+
+    :param protocol: name of the split, passed to ``raw.subsets``
+    :param RGB: if true, each sample is post-processed with a conversion to
+        RGB followed by ``ToTensor``; otherwise no post-transform is applied
+    :return: the value of ``make_dataset`` for these subsets and transforms
+    """
+    from torchvision import transforms
+
+    from ....data.tbx11k_simplified import dataset as raw
+    from ....data.transforms import ElasticDeformation, RGBtoGreyscale8bit
+    from .. import make_dataset as mk
+
+    post_transforms = []
+    if RGB:
+        # convert each sample to RGB first, then turn it into a tensor
+        post_transforms = [
+            transforms.Lambda(lambda x: x.convert("RGB")),
+            transforms.ToTensor(),
+        ]
+
+    return mk(
+        [raw.subsets(protocol)],
+        [RGBtoGreyscale8bit()],
+        [ElasticDeformation(p=0.8)],
+        post_transforms,
+    )
diff --git a/src/ptbench/configs/datasets/tbx11k_simplified/default.py b/src/ptbench/configs/datasets/tbx11k_simplified/default.py
new file mode 100644
index 0000000000000000000000000000000000000000..6aa1b81b16f4049b3998f434ee084eef2d11704b
--- /dev/null
+++ b/src/ptbench/configs/datasets/tbx11k_simplified/default.py
@@ -0,0 +1,17 @@
+# Copyright © 2022 Idiap Research Institute <contact@idiap.ch>
+#
+# SPDX-License-Identifier: GPL-3.0-or-later
+
+"""TBX11k simplified dataset for TB detection (default protocol)
+
+* Split reference: first 62.5% of TB and healthy CXR for "train", 15.9% for
+  "validation", 21.6% for "test"
+* This split only consists of healthy and active TB samples
+* "Latent TB" or "sick & non-TB" samples are not included in this configuration
+* This configuration resolution: 512 x 512 (default)
+* See :py:mod:`ptbench.data.tbx11k_simplified` for dataset details
+"""
+
+from . import _maker
+
+dataset = _maker("default")