
Notebook for trust regions #777

Merged
merged 16 commits into from
Sep 11, 2023
1 change: 1 addition & 0 deletions docs/notebooks/constraints.txt
@@ -68,6 +68,7 @@ gym==0.26.2
gym-notices==0.0.8
h5py==3.8.0
idna==3.4
imageio==2.31.1
ipykernel==6.23.2
ipython==8.14.0
isoduration==20.11.0
1 change: 1 addition & 0 deletions docs/notebooks/requirements.txt
@@ -21,3 +21,4 @@ jupytext
gym[box2d]
box2d
box2d-kengz
imageio
283 changes: 283 additions & 0 deletions docs/notebooks/trust_region.pct.py
@@ -0,0 +1,283 @@
# ---
# jupyter:
# jupytext:
# cell_metadata_filter: -all
# custom_cell_magics: kql
# text_representation:
# extension: .py
# format_name: percent
# format_version: '1.3'
# jupytext_version: 1.11.2
# kernelspec:
# display_name: .venv_310
# language: python
# name: python3
# ---

# %% [markdown]
# # Trust region Bayesian optimization
#
# We will demonstrate three trust region Bayesian optimization algorithms in this tutorial.

# %%
import numpy as np
import tensorflow as tf

np.random.seed(1793)
tf.random.set_seed(1793)

# %% [markdown]
# ## Define the problem and model
#
# We can use trust regions for Bayesian optimization in much the same way as we used EGO and EI in
# the [introduction notebook](expected_improvement.ipynb). Since the setup is very similar to
# that tutorial, we'll skip over most of the detail.

# %%
import trieste
from trieste.objectives import Branin

branin = Branin.objective
search_space = Branin.search_space

num_initial_data_points = 10
initial_query_points = search_space.sample(num_initial_data_points)
observer = trieste.objectives.utils.mk_observer(branin)
initial_data = observer(initial_query_points)

# %% [markdown]
# As usual, we'll use Gaussian process regression to model the function. Note that we set the
# likelihood variance to a small number because we are dealing with a noise-free problem.

# %%
from trieste.models.gpflow import GaussianProcessRegression, build_gpr


def build_model():
    gpflow_model = build_gpr(
        initial_data, search_space, likelihood_variance=1e-7
    )
    return GaussianProcessRegression(gpflow_model)


# %% [markdown]
# ## Trust region `TREGO` acquisition rule
#
# First we show how to run Bayesian optimization with the `TREGO` algorithm. This is a trust region
# algorithm that alternates between regular EGO steps and local steps within one trust region.
#
# ### Create `TREGO` rule and run optimization loop
#
# We can run the Bayesian optimization loop by defining a `BayesianOptimizer` and calling its
# `optimize` method with the trust region rule. Once the optimization loop is complete, the
# optimizer will return one new query point for every step in the loop; that's 5 points in total.

# %%
acq_rule = trieste.acquisition.rule.TrustRegion()
bo = trieste.bayesian_optimizer.BayesianOptimizer(observer, search_space)

num_steps = 5
result = bo.optimize(
    num_steps, initial_data, build_model(), acq_rule, track_state=True
)
dataset = result.try_get_final_dataset()
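As a quick sanity check before plotting, we can extract the incumbent (best) point from the final dataset with an `argmin` over the observations, which is the same logic the plotting helper below uses. The sketch here runs on a toy NumPy stand-in with made-up values rather than the trieste `Dataset` above, purely to illustrate the indexing.

```python
import numpy as np

# Toy stand-ins for dataset.query_points and dataset.observations
# (hypothetical values, purely to illustrate extracting the incumbent).
query_points = np.array([[0.1, 0.2], [0.5, 0.9], [0.3, 0.4]])
observations = np.array([[3.2], [0.7], [1.5]])

best_idx = int(np.argmin(observations))  # index of the smallest observation
best_point = query_points[best_idx]      # the corresponding query point
best_value = float(observations[best_idx, 0])

print(best_idx, best_point, best_value)
```

On the real run, the same pattern applied to `dataset.observations` and `dataset.query_points` gives the optimum found so far.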

# %% [markdown]
# ### Visualizing `TREGO` results
#
# Let's take a look at where we queried the observer: the initial query points (crosses), the new
# query points (dots), and the optimum point found (purple dot), and where they lie with respect
# to the contours of the Branin function.

# %%
from trieste.experimental.plotting import plot_bo_points, plot_function_2d


def plot_final_result(_dataset: trieste.data.Dataset) -> None:
    arg_min_idx = tf.squeeze(tf.argmin(_dataset.observations, axis=0))
    query_points = _dataset.query_points.numpy()
    _, ax = plot_function_2d(
        branin,
        search_space.lower,
        search_space.upper,
        grid_density=40,
        contour=True,
    )

    plot_bo_points(query_points, ax[0, 0], num_initial_data_points, arg_min_idx)


plot_final_result(dataset)

# %% [markdown]
# We can also visualize the progress of the optimization by plotting the trust regions at each step.
# The trust regions are shown as translucent boxes, with the current optimum point in each region
# shown in matching color.
#
# Note that there is only one trust region in this plot; the rule in the next section will show
# multiple trust regions.

# %%
import base64
import io
from typing import List

import imageio
import IPython
import matplotlib.pyplot as plt

from trieste.experimental.plotting import plot_trust_region_history_2d


def fig_to_frame(fig: plt.Figure) -> np.ndarray:
    fig.canvas.draw()
    size_pix = fig.get_size_inches() * fig.dpi
    image = np.frombuffer(fig.canvas.tostring_rgb(), dtype="uint8")
    return image.reshape(list(size_pix[::-1].astype(int)) + [3])


def frames_to_gif(
    frames: List[np.ndarray], duration=5000
) -> IPython.display.HTML:
    gif_file = io.BytesIO()
    imageio.mimsave(gif_file, frames, format="gif", loop=0, duration=duration)
    gif = IPython.display.HTML(
        '<img src="data:image/gif;base64,{0}"/>'.format(
            base64.b64encode(gif_file.getvalue()).decode()
        )
    )
    return gif


def plot_history(result: trieste.bayesian_optimizer.OptimizationResult) -> None:
    frames = []
    for step, hist in enumerate(
        result.history + [result.final_result.unwrap()]
    ):
        fig, _ = plot_trust_region_history_2d(
            branin,
            search_space.lower,
            search_space.upper,
            hist,
            num_init=num_initial_data_points,
        )

        if fig is not None:
            fig.suptitle(f"step number {step}")
            frames.append(fig_to_frame(fig))
            plt.close(fig)

    IPython.display.display(frames_to_gif(frames))


plot_history(result)

# %% [markdown]
# ## Batch trust region rule
#
# Next we demonstrate how to run Bayesian optimization with the batch trust region rule.
#
# ### Create the batch trust region acquisition rule
#
# We achieve Bayesian optimization with trust region by specifying `BatchTrustRegionBox` as the
# acquisition rule.
#
# This rule needs an initial number `num_query_points` of sub-spaces (or trust regions) to be
# provided and performs optimization in parallel across all these sub-spaces. Each region
# contributes one query point, resulting in each acquisition step collecting `num_query_points`
# points overall. As the optimization process continues, the bounds of these sub-spaces are
# dynamically updated.
#
# In addition, this rule requires the specification of a batch acquisition base-rule for performing
# optimization; for our example we use `EfficientGlobalOptimization` coupled with
# `ParallelContinuousThompsonSampling`.
#
# Note: the number of sub-spaces/regions must match the number of batch query points.

# %%
num_query_points = 5

init_subspaces = [
    trieste.acquisition.rule.SingleObjectiveTrustRegionBox(search_space)
    for _ in range(num_query_points)
]
base_rule = trieste.acquisition.rule.EfficientGlobalOptimization(  # type: ignore[var-annotated]
    builder=trieste.acquisition.ParallelContinuousThompsonSampling(),
    num_query_points=num_query_points,
)
acq_rule = trieste.acquisition.rule.BatchTrustRegionBox(  # type: ignore[assignment]
    init_subspaces, base_rule
)

# %% [markdown]
# ### Run the optimization loop
#
# We run the Bayesian optimization loop as before by defining a `BayesianOptimizer` and calling its
# `optimize` method with the trust region rule. Once the optimization loop is complete, the
# optimizer will return `num_query_points` new query points for every step in the loop. With
# 5 steps, that's 25 points in total.

# %%
bo = trieste.bayesian_optimizer.BayesianOptimizer(observer, search_space)

num_steps = 5
result = bo.optimize(
    num_steps, initial_data, build_model(), acq_rule, track_state=True
)
dataset = result.try_get_final_dataset()
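One way to confirm that every step collected a full batch is to check the dataset size: the initial points plus `num_query_points` per step. A minimal arithmetic sketch using the values from this notebook:

```python
num_initial_data_points = 10
num_steps = 5
num_query_points = 5

# Each step adds one point per trust region, i.e. a batch of num_query_points.
expected_size = num_initial_data_points + num_steps * num_query_points
print(expected_size)  # 35
```

On the real run, `dataset.query_points.shape[0]` should match this value.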

# %% [markdown]
# ### Visualizing batch trust region results
#
# We visualize the results as before.

# %%
plot_final_result(dataset)

# %%
plot_history(result)

# %% [markdown]
# ## Trust region `TurBO` acquisition rule
#
# Finally, we show how to run Bayesian optimization with the `TurBO` algorithm. This is a
# trust region algorithm that uses local models and datasets to approximate the objective function
# within one trust region.
#
# ### Create `TurBO` rule and run optimization loop
#
# This rule requires the specification of an acquisition base-rule for performing
# optimization within the trust region; for our example we use `DiscreteThompsonSampling`.

# %%
acq_rule = trieste.acquisition.rule.TURBO(  # type: ignore[assignment]
    search_space, rule=trieste.acquisition.rule.DiscreteThompsonSampling(500, 3)
)
bo = trieste.bayesian_optimizer.BayesianOptimizer(observer, search_space)

num_steps = 5
result = bo.optimize(
    num_steps,
    initial_data,
    build_model(),
    acq_rule,
    track_state=True,
    fit_model=False,
)
dataset = result.try_get_final_dataset()

# %% [markdown]
# ### Visualizing `TurBO` results
#
# We display the results as earlier.

# %%
plot_final_result(dataset)

# %%
plot_history(result)

# %% [markdown]
# ## LICENSE
#
# [Apache License 2.0](https://github.com/secondmind-labs/trieste/blob/develop/LICENSE)
1 change: 1 addition & 0 deletions docs/tutorials.rst
@@ -40,6 +40,7 @@ The following tutorials illustrate solving different types of optimization probl
notebooks/qhsri-tutorial
notebooks/multifidelity_modelling
notebooks/rembo
notebooks/trust_region

Frequently asked questions
--------------------------
1 change: 1 addition & 0 deletions trieste/experimental/plotting/__init__.py
@@ -30,6 +30,7 @@
plot_mobo_history,
plot_mobo_points_in_obj_space,
plot_regret,
plot_trust_region_history_2d,
)
from .plotting_plotly import (
add_bo_points_plotly,