sequential-parameter-optimization
diff --git a/notebooks/00_spotPython_tests.ipynb b/notebooks/00_spotPython_tests.ipynb
Lines changed: 182 additions & 5 deletions
diff --git a/pyproject.toml b/pyproject.toml
Lines changed: 1 addition & 1 deletion
diff --git a/src/spotPython/data/lightdatamodule.py b/src/spotPython/data/lightdatamodule.py
Lines changed: 7 additions & 4 deletions
@@ -3060,7 +3060,7 @@
     },
     {
       "cell_type": "code",
-      "execution_count": 14,
+      "execution_count": null,
       "metadata": {},
       "outputs": [],
       "source": [
@@ -3147,26 +3147,203 @@
     },
     {
       "cell_type": "code",
-      "execution_count": 15,
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "test_file_save_load()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Netlightregression2"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": 6,
       "metadata": {},
       "outputs": [
         {
           "name": "stderr",
           "output_type": "stream",
           "text": [
-            "Seed set to 123\n"
+            "/Users/bartz/miniforge3/envs/spotCondaEnv/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:198: Attribute 'act_fn' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['act_fn'])`.\n",
+            "GPU available: True (mps), used: True\n",
+            "TPU available: False, using: 0 TPU cores\n",
+            "IPU available: False, using: 0 IPUs\n",
+            "HPU available: False, using: 0 HPUs\n"
           ]
         },
         {
           "name": "stdout",
           "output_type": "stream",
           "text": [
-            "Experiment saved as spot_braninexperiment.pickle\n"
+            "batch_x.shape: torch.Size([8, 10])\n",
+            "batch_y.shape: torch.Size([8])\n"
           ]
+        },
+        {
+          "name": "stderr",
+          "output_type": "stream",
+          "text": [
+            "/Users/bartz/miniforge3/envs/spotCondaEnv/lib/python3.11/site-packages/lightning/pytorch/trainer/configuration_validator.py:74: You defined a `validation_step` but have no `val_dataloader`. Skipping val loop.\n",
+            "\n",
+            "  | Name   | Type       | Params | In sizes | Out sizes\n",
+            "-------------------------------------------------------------\n",
+            "0 | layers | Sequential | 25.6 K | [8, 10]  | [8, 1]   \n",
+            "-------------------------------------------------------------\n",
+            "25.6 K    Trainable params\n",
+            "0         Non-trainable params\n",
+            "25.6 K    Total params\n",
+            "0.102     Total estimated model params size (MB)\n",
+            "/Users/bartz/miniforge3/envs/spotCondaEnv/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:441: The 'train_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=11` in the `DataLoader` to improve performance.\n",
+            "/Users/bartz/miniforge3/envs/spotCondaEnv/lib/python3.11/site-packages/lightning/pytorch/loops/fit_loop.py:293: The number of training batches (20) is smaller than the logging interval Trainer(log_every_n_steps=50). Set a lower value for log_every_n_steps if you want to see logs for the training epoch.\n",
+            "`Trainer.fit` stopped: `max_epochs=10` reached.\n",
+            "/Users/bartz/miniforge3/envs/spotCondaEnv/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:441: The 'val_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=11` in the `DataLoader` to improve performance.\n"
+          ]
+        },
+        {
+          "data": {
+            "text/html": [
+              "<pre style=\"white-space:pre;overflow-x:auto;line-height:normal;font-family:Menlo,'DejaVu Sans Mono',consolas,'Courier New',monospace\">┏━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━━━━┓\n",
+              "┃<span style=\"font-weight: bold\">      Validate metric      </span>┃<span style=\"font-weight: bold\">       DataLoader 0        </span>┃\n",
+              "┡━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━━━━┩\n",
+              "│<span style=\"color: #008080; text-decoration-color: #008080\">         hp_metric         </span>│<span style=\"color: #800080; text-decoration-color: #800080\">      28803.052734375      </span>│\n",
+              "│<span style=\"color: #008080; text-decoration-color: #008080\">         val_loss          </span>│<span style=\"color: #800080; text-decoration-color: #800080\">      28803.052734375      </span>│\n",
+              "└───────────────────────────┴───────────────────────────┘\n",
+              "</pre>\n"
+            ],
+            "text/plain": [
+              "┏━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━━━━┓\n",
+              "┃\u001b[1m \u001b[0m\u001b[1m     Validate metric     \u001b[0m\u001b[1m \u001b[0m┃\u001b[1m \u001b[0m\u001b[1m      DataLoader 0       \u001b[0m\u001b[1m \u001b[0m┃\n",
+              "┡━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━━━━┩\n",
+              "│\u001b[36m \u001b[0m\u001b[36m        hp_metric        \u001b[0m\u001b[36m \u001b[0m│\u001b[35m \u001b[0m\u001b[35m     28803.052734375     \u001b[0m\u001b[35m \u001b[0m│\n",
+              "│\u001b[36m \u001b[0m\u001b[36m        val_loss         \u001b[0m\u001b[36m \u001b[0m│\u001b[35m \u001b[0m\u001b[35m     28803.052734375     \u001b[0m\u001b[35m \u001b[0m│\n",
+              "└───────────────────────────┴───────────────────────────┘\n"
+            ]
+          },
+          "metadata": {},
+          "output_type": "display_data"
+        },
+        {
+          "name": "stderr",
+          "output_type": "stream",
+          "text": [
+            "/Users/bartz/miniforge3/envs/spotCondaEnv/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:441: The 'test_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=11` in the `DataLoader` to improve performance.\n"
+          ]
+        },
+        {
+          "data": {
+            "text/html": [
+              "<pre style=\"white-space:pre;overflow-x:auto;line-height:normal;font-family:Menlo,'DejaVu Sans Mono',consolas,'Courier New',monospace\">┏━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━━━━┓\n",
+              "┃<span style=\"font-weight: bold\">        Test metric        </span>┃<span style=\"font-weight: bold\">       DataLoader 0        </span>┃\n",
+              "┡━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━━━━┩\n",
+              "│<span style=\"color: #008080; text-decoration-color: #008080\">         hp_metric         </span>│<span style=\"color: #800080; text-decoration-color: #800080\">      28280.533203125      </span>│\n",
+              "│<span style=\"color: #008080; text-decoration-color: #008080\">         val_loss          </span>│<span style=\"color: #800080; text-decoration-color: #800080\">      28280.533203125      </span>│\n",
+              "└───────────────────────────┴───────────────────────────┘\n",
+              "</pre>\n"
+            ],
+            "text/plain": [
+              "┏━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━━━━┓\n",
+              "┃\u001b[1m \u001b[0m\u001b[1m       Test metric       \u001b[0m\u001b[1m \u001b[0m┃\u001b[1m \u001b[0m\u001b[1m      DataLoader 0       \u001b[0m\u001b[1m \u001b[0m┃\n",
+              "┡━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━━━━┩\n",
+              "│\u001b[36m \u001b[0m\u001b[36m        hp_metric        \u001b[0m\u001b[36m \u001b[0m│\u001b[35m \u001b[0m\u001b[35m     28280.533203125     \u001b[0m\u001b[35m \u001b[0m│\n",
+              "│\u001b[36m \u001b[0m\u001b[36m        val_loss         \u001b[0m\u001b[36m \u001b[0m│\u001b[35m \u001b[0m\u001b[35m     28280.533203125     \u001b[0m\u001b[35m \u001b[0m│\n",
+              "└───────────────────────────┴───────────────────────────┘\n"
+            ]
+          },
+          "metadata": {},
+          "output_type": "display_data"
+        },
+        {
+          "data": {
+            "text/plain": [
+              "[{'val_loss': 28280.533203125, 'hp_metric': 28280.533203125}]"
+            ]
+          },
+          "execution_count": 6,
+          "metadata": {},
+          "output_type": "execute_result"
         }
       ],
       "source": [
-        "test_file_save_load()"
+        "from torch.utils.data import DataLoader\n",
+        "from spotPython.data.diabetes import Diabetes\n",
+        "from spotPython.light.regression.netlightregression2 import NetLightRegression2\n",
+        "from torch import nn\n",
+        "import lightning as L\n",
+        "import torch\n",
+        "BATCH_SIZE = 8\n",
+        "dataset = Diabetes()\n",
+        "train1_set, test_set = torch.utils.data.random_split(dataset, [0.6, 0.4])\n",
+        "train_set, val_set = torch.utils.data.random_split(train1_set, [0.6, 0.4])\n",
+        "train_loader = DataLoader(train_set, batch_size=BATCH_SIZE, shuffle=True, drop_last=True, pin_memory=True)\n",
+        "test_loader = DataLoader(test_set, batch_size=BATCH_SIZE)\n",
+        "val_loader = DataLoader(val_set, batch_size=BATCH_SIZE)\n",
+        "batch_x, batch_y = next(iter(train_loader))\n",
+        "print(f\"batch_x.shape: {batch_x.shape}\")\n",
+        "print(f\"batch_y.shape: {batch_y.shape}\")\n",
+        "net_light_base = NetLightRegression2(l1=128,\n",
+        "                                    epochs=10,\n",
+        "                                    batch_size=BATCH_SIZE,\n",
+        "                                    initialization='Default',\n",
+        "                                    act_fn=nn.ReLU(),\n",
+        "                                    optimizer='Adam',\n",
+        "                                    dropout_prob=0.1,\n",
+        "                                    lr_mult=0.1,\n",
+        "                                    patience=5,\n",
+        "                                    _L_in=10,\n",
+        "                                    _L_out=1)\n",
+        "trainer = L.Trainer(max_epochs=10,  enable_progress_bar=False)\n",
+        "trainer.fit(net_light_base, train_loader)\n",
+        "trainer.validate(net_light_base, val_loader)\n",
+        "trainer.test(net_light_base, test_loader)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# LightDataModule"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": 8,
+      "metadata": {},
+      "outputs": [
+        {
+          "name": "stdout",
+          "output_type": "stream",
+          "text": [
+            "LightDataModule: setup(). stage: None\n",
+            "LightDataModule setup(): full_train_size: 0.5\n",
+            "LightDataModule setup(): val_size: 0.25\n",
+            "LightDataModule setup(): train_size: 0.25\n",
+            "LightDataModule setup(): test_size: 0.5\n",
+            "LightDataModule: setup(). stage: fit\n",
+            "LightDataModule: setup(). stage: test\n",
+            "LightDataModule: setup(). stage: predict\n",
+            "Training set size: 3\n",
+            "Validation set size: 3\n",
+            "Test set size: 6\n"
+          ]
+        }
+      ],
+      "source": [
+        "from spotPython.data.lightdatamodule import LightDataModule\n",
+        "from spotPython.data.csvdataset import CSVDataset\n",
+        "import torch\n",
+        "# data.csv is a simple CSV file with 11 samples\n",
+        "dataset = CSVDataset(csv_file='data.csv', target_column='prognosis', feature_type=torch.long)\n",
+        "data_module = LightDataModule(dataset=dataset, batch_size=5, test_size=0.5)\n",
+        "data_module.setup()\n",
+        "print(f\"Training set size: {len(data_module.data_train)}\")\n",
+        "print(f\"Validation set size: {len(data_module.data_val)}\")\n",
+        "print(f\"Test set size: {len(data_module.data_test)}\")"
       ]
     },
     {
 
@@ -7,7 +7,7 @@ build-backend = "setuptools.build_meta"
 
 [project]
 name = "spotPython"
-version = "0.10.66"
+version = "0.10.67"
 authors = [
   { name="T. Bartz-Beielstein", email="tbb@bartzundbartz.de" }
 ]
 
@@ -130,12 +130,15 @@ def setup(self, stage: Optional[str] = None) -> None:
         # Assign train/val datasets for use in dataloaders
         if stage == "fit" or stage is None:
             print("LightDataModule: setup(). stage: fit")
-            self.data_train, self.data_val, _ = random_split(self.data_full, [train_size, val_size, test_size])
+            generator_fit = torch.Generator().manual_seed(self.test_seed)
+            self.data_train, self.data_val, _ = random_split(
+                self.data_full, [train_size, val_size, test_size], generator=generator_fit
+            )
 
         # Assign test dataset for use in dataloader(s)
         if stage == "test" or stage is None:
             print("LightDataModule: setup(). stage: test")
-            # get test data aset as test_abs percent of the full dataset
+            # get test data set as test_abs percent of the full dataset
             generator_test = torch.Generator().manual_seed(self.test_seed)
             self.data_test, _ = random_split(self.data_full, [test_size, full_train_size], generator=generator_test)
 
@@ -151,7 +154,7 @@ def setup(self, stage: Optional[str] = None) -> None:
         # Assign pred dataset for use in dataloader(s)
         if stage == "predict" or stage is None:
             print("LightDataModule: setup(). stage: predict")
-            # get test data aset as test_abs percent of the full dataset
+            # get test data set as test_abs percent of the full dataset
             generator_predict = torch.Generator().manual_seed(self.test_seed)
             self.data_predict, _ = random_split(
                 self.data_full, [test_size, full_train_size], generator=generator_predict
@@ -199,7 +202,7 @@ def val_dataloader(self) -> DataLoader:
                 print(f"Validation set size: {len(data_module.data_val)}")
                 Validation set size: 3
         """
-        print(f"LightDataModule: val_dataloader(). Training set size: {len(self.data_val)}")
+        print(f"LightDataModule: val_dataloader(). Validation set size: {len(self.data_val)}")
         print(f"LightDataModule: val_dataloader(). batch_size: {self.batch_size}")
         print(f"LightDataModule: val_dataloader(). num_workers: {self.num_workers}")
         return DataLoader(self.data_val, batch_size=self.batch_size, num_workers=self.num_workers)
Original file line number	Diff line number	Diff line change
`@@ -7,7 +7,7 @@ build-backend = "setuptools.build_meta"`
`7`	`7`
`8`	`8`	`[project]`
`9`	`9`	`name = "spotPython"`
`10`		`-version = "0.10.66"`
	`10`	`+version = "0.10.67"`
`11`	`11`	`authors = [`
`12`	`12`	`{ name="T. Bartz-Beielstein", email="tbb@bartzundbartz.de" }`
`13`	`13`	`]`