From c113676cc9022d538f1aeb8046dadd70cf8abdb9 Mon Sep 17 00:00:00 2001
From: Andre Anjos <andre.dos.anjos@gmail.com>
Date: Thu, 27 Jul 2023 20:20:05 +0200
Subject: [PATCH] [data.shenzhen] Remove split information from core datamodule

---
 src/ptbench/data/shenzhen/datamodule.py | 6 ------
 src/ptbench/data/shenzhen/default.py    | 6 ++++++
 2 files changed, 6 insertions(+), 6 deletions(-)

diff --git a/src/ptbench/data/shenzhen/datamodule.py b/src/ptbench/data/shenzhen/datamodule.py
index 59a9d0bd..45ce8762 100644
--- a/src/ptbench/data/shenzhen/datamodule.py
+++ b/src/ptbench/data/shenzhen/datamodule.py
@@ -104,12 +104,6 @@ class DataModule(CachingDataModule):
 
     * Database reference: [MONTGOMERY-SHENZHEN-2014]_
     * Original resolution (height x width or width x height): 3000 x 3000 or less
-    * This split:
-
-      * Split reference: None
-      * Training samples: 64% of TB and healthy CXR (including labels)
-      * Validation samples: 16% of TB and healthy CXR (including labels)
-      * Test samples: 20% of TB and healthy CXR (including labels)
 
     Data specifications:
 
diff --git a/src/ptbench/data/shenzhen/default.py b/src/ptbench/data/shenzhen/default.py
index 7fe993a9..0e29c385 100644
--- a/src/ptbench/data/shenzhen/default.py
+++ b/src/ptbench/data/shenzhen/default.py
@@ -5,3 +5,9 @@
 from .datamodule import DataModule
 
 datamodule = DataModule("default.json.bz2")
+"""Default Shenzhen TB database split.
+
+* Training samples: 64% of TB and healthy CXR (including labels)
+* Validation samples: 16% of TB and healthy CXR (including labels)
+* Test samples: 20% of TB and healthy CXR (including labels)
+"""
-- 
GitLab