sequential-parameter-optimization
diff --git a/‎notebooks/00_spotPython_tests.ipynb‎
Lines changed: 63 additions & 3 deletions b/‎notebooks/00_spotPython_tests.ipynb‎
Lines changed: 63 additions & 3 deletions
diff --git a/‎pyproject.toml‎
Lines changed: 1 addition & 1 deletion b/‎pyproject.toml‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎src/spotpython/light/regression/__init__.py‎
Lines changed: 4 additions & 0 deletions b/‎src/spotpython/light/regression/__init__.py‎
Lines changed: 4 additions & 0 deletions
diff --git a/‎src/spotpython/light/regression/nn_many_to_many_gru_regressor.py‎
Lines changed: 254 additions & 0 deletions b/‎src/spotpython/light/regression/nn_many_to_many_gru_regressor.py‎
Lines changed: 254 additions & 0 deletions
@@ -13210,17 +13210,77 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 4,
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Seed set to 123\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "spotpython tuning: 24.570062683593157 [#######---] 73.33% \n",
+      "spotpython tuning: 9.653948855801172 [########--] 80.00% \n",
+      "spotpython tuning: 6.0 [#########-] 86.67% \n",
+      "spotpython tuning: 6.0 [#########-] 93.33% \n",
+      "spotpython tuning: 6.0 [##########] 100.00% Done...\n",
+      "\n",
+      "Experiment saved to 000_res.pkl\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "array([[  49.03864351,  -49.03864351,   49.03864351,  -49.03864351,\n",
+       "          49.03864351],\n",
+       "       [  26.44326166,  -26.44326166,   26.44326166,  -26.44326166,\n",
+       "          26.44326166],\n",
+       "       [  30.30474677,  -30.30474677,   30.30474677,  -30.30474677,\n",
+       "          30.30474677],\n",
+       "       [  97.95896241,  -97.95896241,   97.95896241,  -97.95896241,\n",
+       "          97.95896241],\n",
+       "       [  54.8004826 ,  -54.8004826 ,   54.8004826 ,  -54.8004826 ,\n",
+       "          54.8004826 ],\n",
+       "       [  41.20251877,  -41.20251877,   41.20251877,  -41.20251877,\n",
+       "          41.20251877],\n",
+       "       [  82.56284391,  -82.56284391,   82.56284391,  -82.56284391,\n",
+       "          82.56284391],\n",
+       "       [  67.51701335,  -67.51701335,   67.51701335,  -67.51701335,\n",
+       "          67.51701335],\n",
+       "       [  79.24343522,  -79.24343522,   79.24343522,  -79.24343522,\n",
+       "          79.24343522],\n",
+       "       [ 101.08340746, -101.08340746,  101.08340746, -101.08340746,\n",
+       "         101.08340746],\n",
+       "       [  24.57006268,  -24.57006268,   24.57006268,  -24.57006268,\n",
+       "          24.57006268],\n",
+       "       [   9.65394886,   -9.65394886,    9.65394886,   -9.65394886,\n",
+       "           9.65394886],\n",
+       "       [   6.        ,   -6.        ,    6.        ,   -6.        ,\n",
+       "           6.        ],\n",
+       "       [ 107.08509445, -107.08509445,  107.08509445, -107.08509445,\n",
+       "         107.08509445],\n",
+       "       [  68.96564781,  -68.96564781,   68.96564781,  -68.96564781,\n",
+       "          68.96564781]])"
+      ]
+     },
+     "execution_count": 4,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
    "source": [
     "import numpy as np\n",
     "from spotpython.fun.multiobjectivefunctions import MultiAnalytical\n",
     "from spotpython.spot import Spot\n",
     "\n",
     "from spotpython.utils.init import fun_control_init\n",
     "# Objective function with m=5 objectives\n",
-    "fun = MultiAnalytical(m=4).fun_mo_linear\n",
+    "fun = MultiAnalytical(m=5).fun_mo_linear\n",
     "fun_control = fun_control_init(\n",
     "    lower=np.array([1, 0, 5]),\n",
     "    upper=np.array([10, 10, 100])\n",
 
@@ -7,7 +7,7 @@ build-backend = "setuptools.build_meta"
 
 [project]
 name = "spotpython"
-version = "0.28.0"
+version = "0.28.1"
 authors = [
   { name="T. Bartz-Beielstein", email="tbb@bartzundbartz.de" }
 ]
 
@@ -9,6 +9,8 @@
 from .netlightregression import NetLightRegression
 from .nn_condnet_regressor import NNCondNetRegressor
 from .nn_many_to_many_rnn_regressor import ManyToManyRNNRegressor, ManyToManyRNN
+from .nn_many_to_many_gru_regressor import ManyToManyGRURegressor
+from .nn_many_to_many_lstm_regressor import ManyToManyLSTMRegressor
 
 __all__ = [
     "NNLinearRegressor",
@@ -18,4 +20,6 @@
     "NNCondNetRegressor",
     "ManyToManyRNNRegressor",
     "ManyToManyRNN",
+    "ManyToManyGRURegressor",
+    "ManyToManyLSTMRegressor",
 ]
@@ -0,0 +1,254 @@
+import lightning as L
+import torch
+import torch.nn as nn
+from torch.nn.utils.rnn import pack_padded_sequence, pad_packed_sequence
+import torchmetrics.functional.regression
+import torch.optim as optim
+from spotpython.hyperparameters.optimizer import optimizer_handler
+
+
+class ManyToManyGRU(nn.Module):
+    """Many-to-many GRU network for sequence-to-sequence regression.
+
+    The padded input batch is packed according to ``lengths``, passed through a
+    GRU, padded back to the sequence length of the input, and then mapped per
+    time step through dropout, a fully connected layer, the activation
+    function and a linear output layer.
+
+    Args:
+        input_size (int): The number of input features.
+        output_size (int): The number of output features. Defaults to 1.
+        gru_units (int): The number of hidden units per GRU direction. Defaults to 128.
+        fc_units (int): The number of units in the fully connected layer. Defaults to 128.
+        activation_fct (nn.Module): The activation function applied after the fully connected layer.
+            Defaults to nn.ReLU().
+        dropout (float): The dropout probability. It is applied between stacked GRU layers
+            (only when ``num_layers > 1``) and to the GRU output. Defaults to 0.2.
+        bidirectional (bool): Whether the GRU is bidirectional. Defaults to True.
+        num_layers (int): The number of GRU layers. Defaults to 2.
+
+    Examples:
+        >>> from spotpython.light.regression.nn_many_to_many_gru_regressor import ManyToManyGRU
+        >>> import torch
+        >>> model = ManyToManyGRU(input_size=10, output_size=1)
+        >>> x = torch.randn(16, 10, 10)  # Batch of 16 sequences, each of length 10 with 10 features
+        >>> lengths = torch.tensor([10] * 16)  # All sequences have length 10
+        >>> output = model(x, lengths)
+        >>> print(output.shape)  # Output shape: (16, 10, 1)
+    """
+
+    def __init__(
+        self,
+        input_size,
+        output_size=1,
+        gru_units=128,
+        fc_units=128,
+        activation_fct=nn.ReLU(),
+        dropout=0.2,
+        bidirectional=True,
+        num_layers=2,
+    ):
+        super().__init__()
+        self.gru_layer = nn.GRU(
+            input_size=input_size,
+            hidden_size=gru_units,
+            num_layers=num_layers,
+            batch_first=True,
+            bidirectional=bidirectional,
+            # nn.GRU only applies dropout between stacked layers, so it is
+            # switched off for a single-layer GRU.
+            dropout=dropout if num_layers > 1 else 0.0,
+        )
+        # A bidirectional GRU concatenates the forward and backward hidden
+        # states, which doubles the feature size seen by the dense layer.
+        gru_out_features = gru_units * 2 if bidirectional else gru_units
+        self.fc = nn.Linear(gru_out_features, fc_units)
+        self.dropout = nn.Dropout(dropout)
+        self.output_layer = nn.Linear(fc_units, output_size)
+        self.activation_fct = activation_fct
+
+    def forward(self, x, lengths):
+        """Forward pass of the ManyToManyGRU model.
+
+        Args:
+            x (torch.Tensor): Input tensor of shape (batch_size, seq_len, input_size).
+            lengths (torch.Tensor): Tensor containing the lengths of each sequence in the batch.
+                It may live on any device; it is copied to the CPU for packing.
+
+        Returns:
+            torch.Tensor: Output tensor of shape (batch_size, seq_len, output_size),
+                where seq_len is the (padded) sequence length of ``x``.
+
+        Raises:
+            ValueError: If the input tensor is empty or if the lengths tensor is empty.
+            RuntimeError: If the lengths tensor does not match the batch size of the input tensor.
+        """
+        if x.size(0) == 0 or lengths.size(0) == 0:
+            raise ValueError("Input tensor or lengths tensor is empty.")
+        if x.size(0) != lengths.size(0):
+            raise RuntimeError(f"Batch size of input tensor ({x.size(0)}) and lengths tensor ({lengths.size(0)}) must match.")
+
+        padded_len = x.size(1)
+        # pack_padded_sequence requires the lengths tensor to be on the CPU,
+        # even when the data itself has been moved to an accelerator.
+        packed_input = pack_padded_sequence(x, lengths.cpu(), batch_first=True, enforce_sorted=False)
+        packed_output, _ = self.gru_layer(packed_input)
+        # Without total_length the result is only max(lengths) steps long;
+        # padding back to the input length keeps the output aligned with
+        # targets that were padded like the input.
+        x, _ = pad_packed_sequence(packed_output, batch_first=True, total_length=padded_len)
+        x = self.dropout(x)
+        x = self.fc(x)
+        x = self.activation_fct(x)
+        x = self.output_layer(x)
+        return x
+
+
+class ManyToManyGRURegressor(L.LightningModule):
+    """A LightningModule for training and evaluating a Many-to-Many GRU regressor.
+
+    The module wraps a ``ManyToManyGRU`` network, computes the loss with a
+    function from ``torchmetrics.functional.regression`` and configures the
+    optimizer together with a ``MultiStepLR`` learning rate schedule.
+
+    Args:
+        _L_in (int): The number of input features.
+        _L_out (int): The number of output features.
+        l1 (int): Unused parameter. Defaults to 8.
+        gru_units (int): The number of units in the GRU layer. Defaults to 128.
+        fc_units (int): The number of units in the fully connected layer. Defaults to 128.
+        act_fn (nn.Module): The activation function to use after the fully connected layer. Defaults to nn.ReLU().
+        dropout_prob (float): The dropout probability. Defaults to 0.2.
+        bidirectional (bool): Whether the GRU is bidirectional. Defaults to True.
+        num_layers (int): The number of GRU layers. Defaults to 2.
+        optimizer (str): The optimizer to use. Defaults to "Adam".
+        lr_mult (float): Learning rate multiplier. Defaults to 1.0.
+        patience (int): Stored as a hyperparameter; not read by this class. Defaults to 5.
+        epochs (int): Number of training epochs; used to place the learning rate milestones. Defaults to 100.
+        batch_size (int): Batch size; used to build the example input array. Defaults to 32.
+        _torchmetric (str): Name of the function in ``torchmetrics.functional.regression`` used as loss.
+            ``None`` falls back to "mean_squared_error". Defaults to "mean_squared_error".
+        *args: Accepted for interface compatibility; not used by this class.
+        **kwargs: Accepted for interface compatibility; not used by this class.
+
+    Examples:
+        >>> import torch
+        >>> from spotpython.light.regression.nn_many_to_many_gru_regressor import ManyToManyGRURegressor
+        >>> model = ManyToManyGRURegressor(_L_in=10, _L_out=1)
+        >>> x = torch.randn(16, 10, 10)  # Batch of 16 sequences, each of length 10 with 10 features
+        >>> lengths = torch.tensor([10] * 16)  # All sequences have length 10
+        >>> output = model(x, lengths)
+        >>> print(output.shape)  # Output shape: (16, 10, 1)
+    """
+
+    def __init__(
+        self,
+        _L_in: int,
+        _L_out: int,
+        l1: int = 8,
+        gru_units: int = 128,
+        fc_units: int = 128,
+        act_fn: nn.Module = nn.ReLU(),
+        dropout_prob: float = 0.2,
+        bidirectional: bool = True,
+        num_layers: int = 2,
+        optimizer: str = "Adam",
+        lr_mult: float = 1.0,
+        patience: int = 5,
+        epochs: int = 100,
+        batch_size: int = 32,
+        _torchmetric: str = "mean_squared_error",
+        *args,
+        **kwargs,
+    ):
+        super().__init__()
+        self._L_in = _L_in
+        self._L_out = _L_out
+        if _torchmetric is None:
+            _torchmetric = "mean_squared_error"
+        self._torchmetric = _torchmetric
+        # Resolve the loss function by name from torchmetrics' functional API.
+        self.metric = getattr(torchmetrics.functional.regression, _torchmetric)
+        # The underscore-prefixed arguments are kept as plain attributes
+        # instead of being stored in self.hparams.
+        self.save_hyperparameters(ignore=["_L_in", "_L_out", "_torchmetric"])
+        # Example (x, lengths) pair: batch_size sequences of length 10.
+        self.example_input_array = (torch.zeros((batch_size, 10, _L_in)), torch.tensor([10] * batch_size))
+
+        self.layers = ManyToManyGRU(
+            input_size=_L_in,
+            output_size=_L_out,
+            gru_units=self.hparams.gru_units,
+            fc_units=self.hparams.fc_units,
+            activation_fct=self.hparams.act_fn,
+            dropout=self.hparams.dropout_prob,
+            bidirectional=self.hparams.bidirectional,
+            num_layers=self.hparams.num_layers,
+        )
+
+    def forward(self, x, lengths) -> torch.Tensor:
+        """Forward pass of the ManyToManyGRURegressor.
+
+        Args:
+            x (torch.Tensor): Input tensor of shape (batch_size, seq_len, input_size).
+            lengths (torch.Tensor): Tensor containing the lengths of each sequence in the batch.
+
+        Returns:
+            torch.Tensor: Output tensor of shape (batch_size, seq_len, output_size).
+        """
+        return self.layers(x, lengths)
+
+    def _calculate_loss(self, batch):
+        """Calculates the loss for a given batch.
+
+        Args:
+            batch (tuple): A tuple containing (x, lengths, y), where:
+                - x: Input tensor of shape (batch_size, seq_len, input_size).
+                - lengths: Tensor containing the lengths of each sequence in the batch.
+                - y: Target tensor of shape (batch_size, seq_len, output_size).
+
+        Returns:
+            torch.Tensor: The calculated loss.
+        """
+        x, lengths, y = batch
+        y_hat = self(x, lengths)
+        # Bring the targets into the prediction's shape before the metric is
+        # evaluated; this requires both to hold the same number of elements.
+        y = y.view_as(y_hat)
+        return self.metric(y_hat, y)
+
+    def training_step(self, batch: tuple, batch_idx) -> torch.Tensor:
+        """Performs a single training step.
+
+        Args:
+            batch (tuple): A tuple containing (x, lengths, y).
+            batch_idx (int): The index of the batch.
+
+        Returns:
+            torch.Tensor: The training loss.
+        """
+        train_loss = self._calculate_loss(batch)
+        return train_loss
+
+    def validation_step(self, batch: tuple, batch_idx, prog_bar: bool = False) -> torch.Tensor:
+        """Performs a single validation step.
+
+        Args:
+            batch (tuple): A tuple containing (x, lengths, y).
+            batch_idx (int): The index of the batch.
+            prog_bar (bool): Whether to log the loss to the progress bar. Defaults to False.
+
+        Returns:
+            torch.Tensor: The validation loss.
+        """
+        val_loss = self._calculate_loss(batch)
+        # Honour the documented prog_bar argument, as test_step does.
+        self.log("val_loss", val_loss, prog_bar=prog_bar)
+        self.log("hp_metric", val_loss, prog_bar=prog_bar)
+        return val_loss
+
+    def test_step(self, batch: tuple, batch_idx: int, prog_bar: bool = False) -> torch.Tensor:
+        """Performs a single test step.
+
+        Args:
+            batch (tuple): A tuple containing (x, lengths, y).
+            batch_idx (int): The index of the batch.
+            prog_bar (bool): Whether to log the loss to the progress bar. Defaults to False.
+
+        Returns:
+            torch.Tensor: The test loss.
+        """
+        val_loss = self._calculate_loss(batch)
+        # The test loss is logged under the same keys as the validation loss.
+        # NOTE(review): presumably downstream code reads "val_loss" from the
+        # test results - confirm before renaming the keys.
+        self.log("val_loss", val_loss, prog_bar=prog_bar)
+        self.log("hp_metric", val_loss, prog_bar=prog_bar)
+        return val_loss
+
+    def configure_optimizers(self) -> dict:
+        """Configures the optimizer and learning rate scheduler.
+
+        The learning rate is multiplied by 0.1 at three milestones placed at
+        1/4, 2/4 and 3/4 of ``epochs`` (truncated to integers).
+
+        Returns:
+            dict: A dictionary containing the optimizer and learning rate scheduler configuration.
+        """
+        optimizer = optimizer_handler(optimizer_name=self.hparams.optimizer, params=self.parameters(), lr_mult=self.hparams.lr_mult)
+
+        num_milestones = 3
+        # NOTE: for epochs < 4 the truncation yields a milestone of 0 (and
+        # possibly duplicates); the list is passed to MultiStepLR unchanged.
+        milestones = [int(self.hparams.epochs / (num_milestones + 1) * (i + 1)) for i in range(num_milestones)]
+        scheduler = optim.lr_scheduler.MultiStepLR(optimizer, milestones=milestones, gamma=0.1)
+
+        lr_scheduler_config = {
+            "scheduler": scheduler,
+            "interval": "epoch",
+            "frequency": 1,
+        }
+
+        return {"optimizer": optimizer, "lr_scheduler": lr_scheduler_config}
Original file line number	Diff line number	Diff line change
`@@ -7,7 +7,7 @@ build-backend = "setuptools.build_meta"`
`7`	`7`
`8`	`8`	`[project]`
`9`	`9`	`name = "spotpython"`
`10`		`-version = "0.28.0"`
	`10`	`+version = "0.28.1"`
`11`	`11`	`authors = [`
`12`	`12`	`{ name="T. Bartz-Beielstein", email="tbb@bartzundbartz.de" }`
`13`	`13`	`]`