0.10.20 documentation

bartzbeielstein · bartzbeielstein · commit 740aca030db4 · 2024-01-18T10:03:47.000+01:00
Improved docs
diff --git a/pyproject.toml b/pyproject.toml
@@ -7,7 +7,7 @@ build-backend = "setuptools.build_meta"
 
 [project]
 name = "spotPython"
-version = "0.10.19"
+version = "0.10.20"
 authors = [
   { name="T. Bartz-Beielstein", email="tbb@bartzundbartz.de" }
 ]
diff --git a/src/spotPython/data/lightdatamodule.py b/src/spotPython/data/lightdatamodule.py
@@ -9,11 +9,18 @@ class LightDataModule(L.LightningDataModule):
     A LightningDataModule for handling data.
 
     Args:
-        batch_size (int): The batch size.
-        dataset (Dataset): The dataset.
-        test_size (float): The test size. Defaults to 0.6.
-        test_seed (int): The test seed. Defaults to 42.
-        num_workers (int): The number of workers. Defaults to 0.
+        batch_size (int):
+            The batch size. Required.
+        dataset (torch.utils.data.Dataset):
+            The dataset from the torch.utils.data Dataset class.
+            It must implement three functions: __init__, __len__, and __getitem__.
+            Required.
+        test_size (float):
+            The test size. Defaults to 0.6.
+        test_seed (int):
+            The test seed. Defaults to 42.
+        num_workers (int):
+            The number of workers. Defaults to 0.
 
     Attributes:
         batch_size (int): The batch size.
@@ -25,6 +32,18 @@ class LightDataModule(L.LightningDataModule):
         test_seed (int): The test seed.
         test_size (float): The test size.
 
+    Methods:
+        prepare_data(self):
+            Usually used for downloading the data. Here: Does nothing, i.e., pass.
+        setup(self, stage: Optional[str] = None):
+            Performs the training, validation, and test split.
+        train_dataloader(self):
+            Returns a DataLoader instance for the training set.
+        val_dataloader(self):
+            Returns a DataLoader instance for the validation set.
+        test_dataloader(self):
+            Returns a DataLoader instance for the test set.
+
     Examples:
         >>> from spotPython.data.lightdatamodule import LightDataModule
             from spotPython.data.csvdataset import CSVDataset
@@ -55,10 +74,15 @@ def prepare_data(self) -> None:
 
     def setup(self, stage: Optional[str] = None) -> None:
         """
-        Sets up the data for use.
+        Splits the data for use in training, validation, and testing.
+        Uses torch.utils.data.random_split() to split the data.
+        Splitting is based on the test_size and test_seed.
+        The test_size can be a float or an int.
 
         Args:
-            stage (Optional[str]): The current stage. Defaults to None.
+            stage (Optional[str]):
+                The current stage. Can be "fit" (for training and validation), "test" (testing),
+                or None (for all three stages). Defaults to None.
 
         Examples:
             >>> from spotPython.data.lightdatamodule import LightDataModule
@@ -101,7 +125,8 @@ def setup(self, stage: Optional[str] = None) -> None:
 
     def train_dataloader(self) -> DataLoader:
         """
-        Returns the training dataloader.
+        Returns the training dataloader, i.e., a PyTorch DataLoader instance
+        using the training dataset.
 
         Returns:
             DataLoader: The training dataloader.
@@ -125,7 +150,8 @@ def train_dataloader(self) -> DataLoader:
 
     def val_dataloader(self) -> DataLoader:
         """
-        Returns the validation dataloader.
+        Returns the validation dataloader, i.e., a PyTorch DataLoader instance
+        using the validation dataset.
 
         Returns:
             DataLoader: The validation dataloader.
@@ -146,7 +172,8 @@ def val_dataloader(self) -> DataLoader:
 
     def test_dataloader(self) -> DataLoader:
         """
-        Returns the test dataloader.
+        Returns the test dataloader, i.e., a PyTorch DataLoader instance
+        using the test dataset.
 
         Returns:
             DataLoader: The test dataloader.

Original file line number	Diff line number	Diff line change
`@@ -7,7 +7,7 @@ build-backend = "setuptools.build_meta"`
`7`	`7`
`8`	`8`	`[project]`
`9`	`9`	`name = "spotPython"`
`10`		`-version = "0.10.19"`
	`10`	`+version = "0.10.20"`
`11`	`11`	`authors = [`
`12`	`12`	`{ name="T. Bartz-Beielstein", email="tbb@bartzundbartz.de" }`
`13`	`13`	`]`