v0.28.9

bartzbeielstein · bartzbeielstein · commit 2cab0c3086b3 · 2025-03-30T12:29:10.000+02:00
pareto front
diff --git a/pyproject.toml b/pyproject.toml
@@ -7,7 +7,7 @@ build-backend = "setuptools.build_meta"
 
 [project]
 name = "spotpython"
-version = "0.28.8"
+version = "0.28.9"
 authors = [
   { name="T. Bartz-Beielstein", email="tbb@bartzundbartz.de" }
 ]
diff --git a/src/spotpython/fun/mohyperlight.py b/src/spotpython/fun/mohyperlight.py
@@ -142,7 +142,9 @@ def fun(self, X: np.ndarray, fun_control: dict = None) -> np.ndarray:
             epochs_val = config.get("epochs", np.nan)  # Default to np.nan if "epochs" is not in config
             epochs_res = np.append(epochs_res, epochs_val)
 
-        # Stack z_res and epochs_res into a (2, n) array
-        result = np.vstack((z_res, epochs_res))
+        # Stack z_res and epochs_res into a (n, 2) array
+        result = np.column_stack((z_res, epochs_res))
+        print(f"result.shape: {result.shape}")
+        print(f"result: {result}")
 
         return result
diff --git a/src/spotpython/mo/plot.py b/src/spotpython/mo/plot.py
@@ -0,0 +1,126 @@
+import matplotlib.pyplot as plt
+import numpy as np
+import pandas as pd
+from spotpython.mo.pareto import is_pareto_efficient
+
+
+def plot_mo(
+    target_names: list,
+    combinations: list,
+    pareto: str,
+    y_rf: np.ndarray = None,
+    pareto_front: bool = False,
+    y_best: np.ndarray = None,
+    title: str = "",
+    y_orig: np.ndarray = None,
+    pareto_front_orig: bool = False,
+    pareto_label: bool = False,
+    y_rf_color="blue",
+    y_best_color="red",
+) -> None:
+    """
+    Generates one scatter plot per combination of two targets from a multi-output prediction while highlighting Pareto optimal points.
+
+    Args:
+        target_names (list): Axis labels indexed by target column; target_names[i] and target_names[j] label the x- and y-axis.
+        combinations (list): A list of (i, j) tuples of target column indices; one figure is created and shown per tuple.
+        pareto (str): "min" sets the minimize flag passed to is_pareto_efficient to True; any other value (e.g., "max") sets it to False.
+        y_rf (np.ndarray or pd.DataFrame, optional): The predicted target values with shape (n_samples, n_targets). Defaults to None (not plotted).
+        pareto_front (bool): If True, connect the Pareto points of y_rf with a line drawn in y_rf_color. Defaults to False.
+        y_best (np.ndarray, optional): The best point(s) to highlight as diamonds; indexed as y_best[:, i], so it must be 2D. Defaults to None.
+        title (str): The title of the plot. Defaults to "" (empty string).
+        y_orig (np.ndarray or pd.DataFrame, optional): The original target values with shape (n_samples, n_targets). Defaults to None (not plotted).
+        pareto_front_orig (bool): If True, connect the Pareto points of y_orig with a black line. Defaults to False.
+        pareto_label (bool): If True, label Pareto points with their row index and draw them with four times the marker size. Defaults to False.
+        y_rf_color (str): The color of the predicted points and of the predicted Pareto front line. Defaults to "blue".
+        y_best_color (str): The color of the best point. Defaults to "red".
+
+    Returns:
+        None: Shows one matplotlib figure per combination via plt.show().
+
+    Examples:
+        >>> from spotpython.mo.plot import plot_mo
+        >>> import numpy as np
+        >>> target_names = ["Target 1", "Target 2"]
+        >>> combinations = [(0, 1)]
+        >>> pareto = "min"
+        >>> y_rf = np.random.rand(100, 2)
+        >>> y_orig = np.random.rand(100, 2)
+        >>> plot_mo(target_names, combinations, pareto, y_rf=y_rf, y_orig=y_orig)
+    """
+    # Convert y_rf to numpy array if it's a pandas DataFrame
+    if isinstance(y_rf, pd.DataFrame):
+        y_rf = y_rf.values
+
+    # Convert y_orig to numpy array if it's a pandas DataFrame
+    if isinstance(y_orig, pd.DataFrame):
+        y_orig = y_orig.values
+
+    for i, j in combinations:
+        plt.figure()
+        s = 50  # Base size for points
+        pareto_size = s  # Size for Pareto points
+        if pareto_label:
+            pareto_size = s * 4  # Enlarge Pareto markers when they are labeled (labels are centered on the markers)
+        a = 0.4  # Alpha (transparency) shared by every layer except the best point, which uses alpha=1
+
+        # Plot original data if provided
+        if y_orig is not None:
+            # Determine Pareto optimal points for original data, restricted to the two plotted targets
+            minimize = pareto == "min"  # Only the exact string "min" yields True
+            pareto_mask_orig = is_pareto_efficient(y_orig[:, [i, j]], minimize)
+
+            # Plot all original points
+            plt.scatter(y_orig[:, i], y_orig[:, j], edgecolor="w", c="gray", s=s, marker="o", alpha=a, label="Original Points")
+
+            # Highlight Pareto points for original data
+            plt.scatter(y_orig[pareto_mask_orig, i], y_orig[pareto_mask_orig, j], edgecolor="k", c="gray", s=pareto_size, marker="o", alpha=a, label="Original Pareto")
+
+            # Label Pareto points for original data with their row index in y_orig if requested
+            if pareto_label:
+                for idx in np.where(pareto_mask_orig)[0]:
+                    plt.text(y_orig[idx, i], y_orig[idx, j], str(idx), color="black", fontsize=8, ha="center", va="center")
+
+            # Draw Pareto front for original data if requested (points are sorted by the x-axis target first)
+            if pareto_front_orig:
+                sorted_indices_orig = np.argsort(y_orig[pareto_mask_orig, i])
+                plt.plot(y_orig[pareto_mask_orig, i][sorted_indices_orig], y_orig[pareto_mask_orig, j][sorted_indices_orig], "k-", alpha=a, label="Original Pareto Front")
+
+        if y_rf is not None:
+            # Determine Pareto optimal points for predicted data, restricted to the two plotted targets
+            minimize = pareto == "min"  # Only the exact string "min" yields True
+            pareto_mask = is_pareto_efficient(y_rf[:, [i, j]], minimize)
+
+            # Plot all predicted points
+            plt.scatter(y_rf[:, i], y_rf[:, j], edgecolor="w", c=y_rf_color, s=s, marker="^", alpha=a, label="Predicted Points")
+
+            # Highlight Pareto points for predicted data
+            plt.scatter(y_rf[pareto_mask, i], y_rf[pareto_mask, j], edgecolor="k", c=y_rf_color, s=pareto_size, marker="s", alpha=a, label="Predicted Pareto")
+
+            # Label Pareto points for predicted data with their row index in y_rf if requested
+            if pareto_label:
+                for idx in np.where(pareto_mask)[0]:
+                    plt.text(y_rf[idx, i], y_rf[idx, j], str(idx), color="black", fontsize=8, ha="center", va="center")
+
+            # Draw Pareto front for predicted data if requested (points are sorted by the x-axis target first)
+            if pareto_front:
+                sorted_indices = np.argsort(y_rf[pareto_mask, i])
+                plt.plot(
+                    y_rf[pareto_mask, i][sorted_indices],
+                    y_rf[pareto_mask, j][sorted_indices],
+                    linestyle="-",  # Specify the line style
+                    color=y_rf_color,  # Use the color specified by y_rf_color
+                    alpha=a,
+                    label="Predicted Pareto Front",
+                )
+
+        # Plot the best point, if provided (column indexing requires a 2D array)
+        if y_best is not None:
+            plt.scatter(y_best[:, i], y_best[:, j], edgecolor="k", c=y_best_color, s=s, marker="D", alpha=1, label="Best")
+
+        plt.xlabel(target_names[i])
+        plt.ylabel(target_names[j])
+        plt.grid()
+        plt.title(title)
+        plt.legend()
+        plt.show()
diff --git a/src/spotpython/utils/repair.py b/src/spotpython/utils/repair.py
@@ -60,6 +60,8 @@ def remove_nan(X: np.ndarray, y: np.ndarray, stop_on_zero_return: bool = False)
         >>> print(X_cleaned, y_cleaned)
         [[1 2]] [[1. 2.]]
     """
+    print(f"remove_nan: X.shape={X.shape}, y.shape={y.shape}")
+    print(f"remove_nan: X={X},\n y={y}")
     # Get the original dimension of the y array
     original_dim = y.shape[0]
 
@@ -70,6 +72,7 @@ def remove_nan(X: np.ndarray, y: np.ndarray, stop_on_zero_return: bool = False)
         ind = np.all(np.isfinite(y), axis=0)
     else:
         raise ValueError("y must be a 1D or 2D array.")
+    print(f"remove_nan: ind={ind}")
 
     # Update X and y by removing rows with NaN in y
     X_cleaned = X[ind, :]

Original file line number	Diff line number	Diff line change
`@@ -7,7 +7,7 @@ build-backend = "setuptools.build_meta"`
`7`	`7`
`8`	`8`	`[project]`
`9`	`9`	`name = "spotpython"`
`10`		`-version = "0.28.8"`
	`10`	`+version = "0.28.9"`
`11`	`11`	`authors = [`
`12`	`12`	`{ name="T. Bartz-Beielstein", email="tbb@bartzundbartz.de" }`
`13`	`13`	`]`