Commits (29)
9676189
allow encoder to return running configs
dengdifan Oct 23, 2024
6b86808
add options for batch sampling
dengdifan Oct 23, 2024
06719d2
maint constant liar with nan values
dengdifan Oct 29, 2024
8b748db
Merge branch 'development' into batch_sampling_improvement
dengdifan Dec 2, 2024
2487bc3
add docs
dengdifan Dec 2, 2024
d3f4f11
tests for config selectors
dengdifan Dec 2, 2024
3c2196a
solve conflict
dengdifan Dec 19, 2024
5f3ae8e
maint doc
dengdifan Jan 8, 2025
a1f7c32
style(config_selector)
benjamc Jan 13, 2025
f68fee5
style(abstract_encoder)
benjamc Jan 13, 2025
691b1a9
Update CHANGELOG.md
benjamc Jan 13, 2025
eafef88
Merge branch 'development' into batch_sampling_improvement
benjamc Jan 13, 2025
3cf1748
refactor(config_selector): pass all args in the facades
benjamc Jan 13, 2025
62a9588
refactor(abstract_facade): fix default, add warning in docstring
benjamc Jan 13, 2025
522c671
fix(fantasize): check whether model has been trained
benjamc Jan 13, 2025
99443b4
feat(fantasize_example): add
benjamc Jan 13, 2025
6658b88
fix(config_selector): properly check whether model is trained
benjamc Jan 13, 2025
5416a8d
Merge branch 'development' into batch_sampling_improvement
benjamc Feb 27, 2025
3ff68c3
Merge remote-tracking branch 'origin/batch_sampling_improvement' into…
daphne12345 Apr 9, 2025
198d978
batch expected improvement
daphne12345 Jun 4, 2025
dce1f54
created an example
daphne12345 Jun 4, 2025
e2c81f1
adjusted the config selector to work with q_ei
daphne12345 Jun 4, 2025
b01a1f8
Merge branch 'development' into feature/batch_bo_issue_1229
daphne12345 Jun 12, 2025
07487d0
added kwargs to the maximize function
daphne12345 Jun 12, 2025
f284798
removed qei from batch_sampling again
daphne12345 Jun 12, 2025
6d4a808
Sampling from surrogate model
daphne12345 Jun 12, 2025
4b8e801
Merge branch 'feature/batch_bo_issue_1229' of https://github.com/auto…
daphne12345 Jun 12, 2025
e1c13eb
bug fix
daphne12345 Jun 12, 2025
14eb30b
Added tests for qei
daphne12345 Jun 13, 2025
3 changes: 3 additions & 0 deletions CHANGELOG.md
@@ -25,6 +25,9 @@

# 2.3.0

## Features
- Improved batch sampling: Fantasize points in batch/parallel mode (#1154).

## Documentation
- Update windows install guide (#952)
- Correct intensifier for Algorithm Configuration Facade (#1162, #1165)
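For quick reference, the new feature is enabled through the config selector, mirroring the example files added below. A minimal sketch with a toy quadratic target; everything else follows the PR's own examples:

from ConfigSpace import Configuration, ConfigurationSpace, Float

from smac import BlackBoxFacade, Scenario


def train(config: Configuration, seed: int = 0) -> float:
    return (config["x"] - 1.0) ** 2  # toy quadratic with its minimum at x = 1


cs = ConfigurationSpace(seed=0)
cs.add([Float("x", (-5.0, 5.0), default=0)])

scenario = Scenario(configspace=cs, n_trials=50, n_workers=4, seed=0)
smac = BlackBoxFacade(
    scenario=scenario,
    target_function=train,
    config_selector=BlackBoxFacade.get_config_selector(
        scenario=scenario,
        batch_sampling_estimation_strategy="kriging_believer",
    ),
    overwrite=True,
)
incumbent = smac.optimize()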
112 changes: 112 additions & 0 deletions examples/1_basics/7_0_parallelization_fantasize.py
@@ -0,0 +1,112 @@
"""Example of using SMAC with parallelization and fantasization vs. no estimation for pending evaluations.

This example will take some time because the target function is artificially slowed down to demonstrate the effect of
fantasization. The example will plot the incumbent found by SMAC with and without fantasization.
"""
from __future__ import annotations

import numpy as np
from ConfigSpace import Configuration, ConfigurationSpace, Float

from matplotlib import pyplot as plt

from smac import BlackBoxFacade, Scenario
from smac.facade import AbstractFacade

import time

def plot_trajectory(facades: list[AbstractFacade], names: list[str]) -> None:
# Plot incumbent
cmap = plt.get_cmap("tab10")

fig = plt.figure()
axes = fig.subplots(1, 2)

for ax_i, x_axis in zip(axes, ["walltime", "trial"]):
for i, facade in enumerate(facades):
X, Y = [], []
for item in facade.intensifier.trajectory:
# Single-objective optimization
assert len(item.config_ids) == 1
assert len(item.costs) == 1

y = item.costs[0]
x = getattr(item, x_axis)

X.append(x)
Y.append(y)

ax_i.plot(X, Y, label=names[i], color=cmap(i))
ax_i.scatter(X, Y, marker="x", color=cmap(i))
ax_i.set_xlabel(x_axis)
ax_i.set_ylabel(facades[0].scenario.objectives)
ax_i.set_yscale("log")
ax_i.legend()

plt.show()

class Branin:
@property
def configspace(self) -> ConfigurationSpace:
# Build Configuration Space which defines all parameters and their ranges
cs = ConfigurationSpace(seed=0)

# First we create our hyperparameters
x1 = Float("x1", (-5, 10), default=0)
x2 = Float("x2", (0, 15), default=0)

# Add hyperparameters and conditions to our configspace
cs.add([x1, x2])

return cs

def train(self, config: Configuration, seed: int) -> float:
x1 = config["x1"]
x2 = config["x2"]
a = 1.0
b = 5.1 / (4.0 * np.pi**2)
c = 5.0 / np.pi
r = 6.0
s = 10.0
t = 1.0 / (8.0 * np.pi)

cost = a * (x2 - b * x1**2 + c * x1 - r) ** 2 + s * (1 - t) * np.cos(x1) + s
regret = cost - 0.397887

# Artificially slow down the target function so that several evaluations are
# pending at once; this is the situation the fantasization strategies estimate.
time.sleep(10)

return regret

if __name__ == "__main__":
seed = 345455
scenario = Scenario(n_trials=100, configspace=Branin().configspace, n_workers=4, seed=seed)
facade = BlackBoxFacade

smac_noestimation = facade(
scenario=scenario,
target_function=Branin().train,
overwrite=True,
)
smac_fantasize = facade(
scenario=scenario,
target_function=Branin().train,
config_selector=facade.get_config_selector(
scenario=scenario,
batch_sampling_estimation_strategy="kriging_believer"
),
overwrite=True,
logging_level=0
)

incumbent_noestimation = smac_noestimation.optimize()
incumbent_fantasize = smac_fantasize.optimize()

plot_trajectory(facades=[
smac_noestimation,
smac_fantasize,
], names=["No Estimation", "Fantasize"])

del smac_noestimation
del smac_fantasize
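For readers unfamiliar with the strategy name: "kriging believer" fantasizes each pending configuration with the surrogate's posterior mean, so the model can be refit before the next batch member is proposed. A minimal numpy sketch of the idea (illustrative only; `model.predict` is a stand-in interface here, not SMAC's internal API):

import numpy as np

def kriging_believer_augment(model, X_obs, y_obs, X_pending):
    """Augment the training data with fantasized costs for pending points."""
    # "Believe" the posterior mean for every pending point ...
    mean, _ = model.predict(X_pending)
    # ... and append it to the observed data, so a refit model keeps the
    # acquisition function from re-proposing the same region.
    X_aug = np.vstack([X_obs, X_pending])
    y_aug = np.concatenate([y_obs, np.asarray(mean).ravel()])
    return X_aug, y_aug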
126 changes: 126 additions & 0 deletions examples/1_basics/7_1_parallelization_q_ei.py
@@ -0,0 +1,126 @@
"""Example of using SMAC with parallelization and fantasization vs. no estimation for pending evaluations.

This example will take some time because the target function is artificially slowed down to demonstrate the effect of
fantasization. The example will plot the incumbent found by SMAC with and without fantasization.
"""
from __future__ import annotations

import numpy as np
from ConfigSpace import Configuration, ConfigurationSpace, Float

from matplotlib import pyplot as plt

from smac import BlackBoxFacade, Scenario
from smac.facade import AbstractFacade
from smac.acquisition.function.expected_improvement import QExpectedImprovement, EI
from smac.acquisition.maximizer.random_search import RandomSearch

import time

def plot_trajectory(facades: list[AbstractFacade], names: list[str]) -> None:
# Plot incumbent
cmap = plt.get_cmap("tab10")

fig = plt.figure()
axes = fig.subplots(1, 2)

for ax_i, x_axis in zip(axes, ["walltime", "trial"]):
for i, facade in enumerate(facades):
X, Y = [], []
for item in facade.intensifier.trajectory:
# Single-objective optimization
assert len(item.config_ids) == 1
assert len(item.costs) == 1

y = item.costs[0]
x = getattr(item, x_axis)

X.append(x)
Y.append(y)

ax_i.plot(X, Y, label=names[i], color=cmap(i))
ax_i.scatter(X, Y, marker="x", color=cmap(i))
ax_i.set_xlabel(x_axis)
ax_i.set_ylabel(facades[0].scenario.objectives)
ax_i.set_yscale("log")
ax_i.legend()

plt.show()

class Branin:
@property
def configspace(self) -> ConfigurationSpace:
# Build Configuration Space which defines all parameters and their ranges
cs = ConfigurationSpace(seed=0)

# First we create our hyperparameters
x1 = Float("x1", (-5, 10), default=0)
x2 = Float("x2", (0, 15), default=0)

# Add hyperparameters and conditions to our configspace
cs.add([x1, x2])

return cs

def train(self, config: Configuration, seed: int) -> float:
x1 = config["x1"]
x2 = config["x2"]
a = 1.0
b = 5.1 / (4.0 * np.pi**2)
c = 5.0 / np.pi
r = 6.0
s = 10.0
t = 1.0 / (8.0 * np.pi)

cost = a * (x2 - b * x1**2 + c * x1 - r) ** 2 + s * (1 - t) * np.cos(x1) + s
regret = cost - 0.397887

# Artificially slow down the target function so that several evaluations are
# pending at once; this is the situation batch sampling has to handle.
time.sleep(10)

return regret

if __name__ == "__main__":
seed = 345455
scenario = Scenario(n_trials=100, configspace=Branin().configspace, n_workers=4, seed=seed)
facade = BlackBoxFacade

acq_function = EI()
acq_maximizer = RandomSearch(scenario.configspace, acq_function)

smac_noestimation = facade(
scenario=scenario,
target_function=Branin().train,
overwrite=True,
acquisition_function=acq_function,
acquisition_maximizer=acq_maximizer
)

acq_function_qei = QExpectedImprovement()
acq_maximizer_qei = RandomSearch(scenario.configspace, acquisition_function=acq_function_qei)


smac_q_ei = facade(
scenario=scenario,
target_function=Branin().train,
config_selector=facade.get_config_selector(
scenario=scenario,
batch_sampling_estimation_strategy="q_ei"
),
acquisition_function=acq_function_qei,
acquisition_maximizer=acq_maximizer_qei,
overwrite=True,
logging_level=0
)

incumbent_noestimation = smac_noestimation.optimize()
incumbent_q_ei = smac_q_ei.optimize()

plot_trajectory(facades=[
smac_noestimation,
smac_q_ei,
], names=["No Estimation", "QEI"])

del smac_noestimation
del smac_q_ei
96 changes: 96 additions & 0 deletions smac/acquisition/function/expected_improvement.py
@@ -286,3 +286,99 @@ def calculate_f() -> np.ndarray:
raise ValueError("Expected Improvement per Second is smaller than 0 " "for at least one sample.")

return f.reshape((-1, 1))


class QExpectedImprovement(EI):
r"""
Monte Carlo approximation of q-Expected Improvement.
Approximates joint distribution with independent normals.

:math:`EI(X) := \mathbb{E}\left[ \max\{0, f(\mathbf{X^+}) - f_{t+1}(\mathbf{X}) - \xi \} \right]`,
with :math:`f(X^+)` as the best location.

Reference for q-EI


Parameters
----------
xi : float, defaults to 0.0
Controls the balance between exploration and exploitation of the
acquisition function.
log : bool, defaults to False
Whether the function values are in log-space.


Attributes
----------
_xi : float
Exploration-exloitation trade-off parameter.
_log: bool
Function values in log-space or not.
_eta : float
Current incumbent function value (best value observed so far).

"""

def __init__(self, xi: float = 0.0, n_samples: int = 128) -> None:
super(QExpectedImprovement, self).__init__(xi=xi)
self.n_samples = n_samples

@property
def name(self) -> str: # noqa: D102
return "Batch Expected Improvement"

def _compute(self, X: np.ndarray) -> np.ndarray:
"""
Compute q-EI acquisition value using Monte Carlo approximation.

Parameters
----------
X : np.ndarray [N, D]
The batch of input points to evaluate.

Returns
-------
np.ndarray [1, 1]
The q-EI value for the batch as a whole.
"""
assert self._model is not None
assert self._xi is not None

if self._eta is None:
raise ValueError(
"No current best specified. Call update(eta=<float>) to inform the acquisition function "
"about the current best value."
)

if len(X.shape) == 1:
X = X[np.newaxis, :]

m, var = self._model.predict_marginalized(X)
std = np.sqrt(var)

if np.any(std == 0.0):
logger.warning("Predicted std is 0.0 for at least one sample.")
std_copy = np.copy(std)
std[std_copy == 0.0] = 1.0 # prevent division by zero

# Monte Carlo sampling from independent normal marginals (one column per batch point)
normal_samples = np.random.normal(loc=m.T, scale=std.T, size=(self.n_samples, X.shape[0]))

if not self._log:
f_samples = normal_samples # in original (normal) space
f_min_sample = np.min(f_samples, axis=1)
improvement = np.maximum(self._eta - self._xi - f_min_sample, 0.0)
Contributor:
Not quite sure here, but if the surrogate model is a GP, we can directly sample from the joint posterior distribution, as shown in BoTorch: https://botorch.readthedocs.io/en/stable/acquisition.html#botorch.acquisition.monte_carlo.qExpectedImprovement

Contributor (author):
I replaced it with the surrogate model, if it is a GP.
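For context, a minimal numpy sketch of the distinction discussed in this thread, with hypothetical numbers (SMAC's `predict_marginalized` returns only marginal variances, so the full covariance here is an assumption):

import numpy as np

rng = np.random.default_rng(0)
mean = np.array([0.2, 0.3])    # posterior means for a batch of two points
cov = np.array([[0.04, 0.03],  # full posterior covariance: the points are
                [0.03, 0.04]]) # positively correlated
eta, xi, n_samples = 0.1, 0.0, 4096

# Joint sampling (the BoTorch-style approach) respects the correlation ...
joint = rng.multivariate_normal(mean, cov, size=n_samples)
# ... while the independent approximation samples each marginal on its own.
indep = rng.normal(mean, np.sqrt(np.diag(cov)), size=(n_samples, 2))

qei_joint = np.mean(np.maximum(eta - xi - joint.min(axis=1), 0.0))
qei_indep = np.mean(np.maximum(eta - xi - indep.min(axis=1), 0.0))
print(qei_joint, qei_indep)  # for correlated points, the independent
                             # approximation tends to overestimate q-EI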

else:
# In log-space, the *actual values* are exp(samples)
f_samples = np.exp(normal_samples)
f_min_sample = np.min(f_samples, axis=1)

# eta is already in log-space, so we compare to exp(eta - xi)
improvement = np.maximum(np.exp(self._eta - self._xi) - f_min_sample, 0.0)

qei = np.mean(improvement)

if qei < 0:
raise ValueError("q-Expected Improvement is smaller than 0. Should not happen.")

return np.array([[qei]])
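As a usage-style sanity check, the estimator above reduces to a few lines of numpy for the non-log branch (hypothetical numbers): the whole batch receives one scalar score, matching the `[1, 1]`-shaped array `_compute` returns.

import numpy as np

m = np.array([[0.5], [0.7], [0.4]])    # predicted means for a batch of three
std = np.array([[0.1], [0.2], [0.1]])  # predicted marginal stddevs
eta, xi = 0.45, 0.0                    # incumbent cost, exploration offset

samples = np.random.normal(loc=m.T, scale=std.T, size=(128, 3))
f_min = samples.min(axis=1)            # best sampled value within the batch
qei = np.mean(np.maximum(eta - xi - f_min, 0.0))
print(round(qei, 3))                   # one scalar for the whole batch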
@@ -74,6 +74,7 @@ def maximize(
previous_configs: list[Configuration],
n_points: int | None = None,
random_design: AbstractRandomDesign | None = None,
**kwargs: Any,
) -> Iterator[Configuration]:
"""Maximize acquisition function using `_maximize`, implemented by a subclass.
