Notebook for trust regions #777

Merged 16 commits on Sep 11, 2023
1 change: 1 addition & 0 deletions docs/notebooks/constraints.txt
@@ -68,6 +68,7 @@ gym==0.26.2
gym-notices==0.0.8
h5py==3.8.0
idna==3.4
imageio==2.31.1
ipykernel==6.23.2
ipython==8.14.0
isoduration==20.11.0
1 change: 1 addition & 0 deletions docs/notebooks/requirements.txt
@@ -21,3 +21,4 @@ jupytext
gym[box2d]
box2d
box2d-kengz
imageio
281 changes: 281 additions & 0 deletions docs/notebooks/trust_region.pct.py
@@ -0,0 +1,281 @@
# ---
# jupyter:
#   jupytext:
#     cell_metadata_filter: -all
#     custom_cell_magics: kql
#     text_representation:
#       extension: .py
#       format_name: percent
#       format_version: '1.3'
#     jupytext_version: 1.11.2
#   kernelspec:
#     display_name: .venv_310
#     language: python
#     name: python3
# ---

# %% [markdown]
# # Trust region Bayesian optimization
#
# In this tutorial we demonstrate three trust region Bayesian optimization algorithms: `TREGO`,
# batch trust region optimization with `BatchTrustRegionBox`, and `TurBO`.

# %%
import numpy as np
import tensorflow as tf

np.random.seed(1793)
tf.random.set_seed(1793)

# %% [markdown]
# ## Define the problem and model
#
# We can use trust regions for Bayesian optimization in much the same way as we used EGO and EI in
# the [introduction notebook](expected_improvement.ipynb). Since the setup is very similar to
# that tutorial, we'll skip over most of the detail.

# %%
import trieste
from trieste.objectives import Branin

branin = Branin.objective
search_space = Branin.search_space

num_initial_data_points = 10
initial_query_points = search_space.sample(num_initial_data_points)
observer = trieste.objectives.utils.mk_observer(branin)
initial_data = observer(initial_query_points)
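
# %% [markdown]
# As a quick sanity check (a small addition for this write-up, not part of the original
# notebook), we can inspect the shapes of the initial dataset. Branin is a two-dimensional
# problem, so we expect 10 two-dimensional query points and 10 scalar observations.

# %%
print(initial_data.query_points.shape)  # (10, 2)
print(initial_data.observations.shape)  # (10, 1)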

# %% [markdown]
# As usual, we'll use Gaussian process regression to model the function. Note that we set the
# likelihood variance to a small number because we are dealing with a noise-free problem.

# %%
from trieste.models.gpflow import GaussianProcessRegression, build_gpr


def build_model():
    gpflow_model = build_gpr(
        initial_data, search_space, likelihood_variance=1e-7
    )
    return GaussianProcessRegression(gpflow_model)


# %% [markdown]
# ## Trust region `TREGO` acquisition rule
#
# First we show how to run Bayesian optimization with the `TREGO` algorithm. This is a trust region
# algorithm that alternates between regular EGO steps and local steps within one trust region
# (see <cite data-cite="diouane2022trego"/>).
#
# ### Create `TREGO` rule and run optimization loop
#
# We can run the Bayesian optimization loop by defining a `BayesianOptimizer` and calling its
# `optimize` method with the trust region rule. Once the optimization loop is complete, the
# optimizer will return one new query point for every step in the loop; that's 5 points in total.
#
# `TREGO` is a "meta" rule that applies a base-rule either inside a trust region or over the
# whole space. The default base-rule is `EfficientGlobalOptimization`, but a different base-rule
# can be provided as an argument to `TREGO`. Here we set it explicitly to make the usage clear.

# %%
trego_acq_rule = trieste.acquisition.rule.TrustRegion(
    rule=trieste.acquisition.rule.EfficientGlobalOptimization()
)
bo = trieste.bayesian_optimizer.BayesianOptimizer(observer, search_space)

num_steps = 5
result = bo.optimize(
    num_steps, initial_data, build_model(), trego_acq_rule, track_state=True
)
dataset = result.try_get_final_dataset()
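
# %% [markdown]
# A minimal sanity check (added for illustration, not part of the original notebook): one new
# query point per step means the final dataset should hold the 10 initial points plus 5 new ones.

# %%
assert dataset.query_points.shape[0] == num_initial_data_points + num_steps
print(f"Total number of query points: {dataset.query_points.shape[0]}")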

# %% [markdown]
# ### Visualizing `TREGO` results
#
# Let's take a look at where we queried the observer: the original query points (crosses), the
# new query points (dots), and the optimum point found (purple dot), and where they lie with
# respect to the contours of the Branin function.

# %%
from trieste.experimental.plotting import plot_bo_points, plot_function_2d


def plot_final_result(_dataset: trieste.data.Dataset) -> None:
    arg_min_idx = tf.squeeze(tf.argmin(_dataset.observations, axis=0))
    query_points = _dataset.query_points.numpy()
    _, ax = plot_function_2d(
        branin,
        search_space.lower,
        search_space.upper,
        grid_density=40,
        contour=True,
    )

    plot_bo_points(query_points, ax[0, 0], num_initial_data_points, arg_min_idx)


plot_final_result(dataset)
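
# %% [markdown]
# Beyond the plot, we can also read off the best point found. This snippet is a small addition
# for illustration; the global minimum of the Branin function is known to be approximately
# 0.398, which gives a sense of how close the optimization got.

# %%
arg_min_idx = tf.squeeze(tf.argmin(dataset.observations, axis=0))
print(f"Best query point: {dataset.query_points[arg_min_idx]}")
print(f"Best observation: {dataset.observations[arg_min_idx]}")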

# %% [markdown]
# We can also visualize the progress of the optimization by plotting the acquisition space at
# each step. This space is either the full search space or the trust region, depending on the
# step, and is shown as a translucent box, with the current optimum point of each region shown
# in a matching color.
#
# Note that there is only one trust region in this plot; the rule in the next section will show
# multiple trust regions.

# %%
import base64

import IPython
import matplotlib.pyplot as plt

from trieste.experimental.plotting import (
    convert_figure_to_frame,
    convert_frames_to_gif,
    plot_trust_region_history_2d,
)


def plot_history(result: trieste.bayesian_optimizer.OptimizationResult) -> None:
    frames = []
    for step, hist in enumerate(
        result.history + [result.final_result.unwrap()]
    ):
        fig, _ = plot_trust_region_history_2d(
            branin,
            search_space.lower,
            search_space.upper,
            hist,
            num_init=num_initial_data_points,
        )

        if fig is not None:
            fig.suptitle(f"step number {step}")
            frames.append(convert_figure_to_frame(fig))
            plt.close(fig)

    gif_file = convert_frames_to_gif(frames)
    gif = IPython.display.HTML(
        '<img src="data:image/gif;base64,{0}"/>'.format(
            base64.b64encode(gif_file.getvalue()).decode()
        )
    )
    IPython.display.display(gif)


plot_history(result)

# %% [markdown]
# ## Batch trust region rule
#
# Next we demonstrate how to run Bayesian optimization with the batch trust region rule.
#
# ### Create the batch trust region acquisition rule
#
# We achieve Bayesian optimization with trust regions by specifying `BatchTrustRegionBox` as the
# acquisition rule.
#
# This rule needs an initial number `num_query_points` of sub-spaces (or trust regions) to be
# provided and performs optimization in parallel across all these sub-spaces. Each region
# contributes one query point, resulting in each acquisition step collecting `num_query_points`
# points overall. As the optimization process continues, the bounds of these sub-spaces are
# dynamically updated.
#
# In addition, this is a "meta" rule that requires the specification of a batch acquisition
# base-rule for performing optimization; for our example we use `EfficientGlobalOptimization`
# coupled with the `ParallelContinuousThompsonSampling` acquisition function.
#
# Note: the number of sub-spaces/regions must match the number of batch query points.

# %%
num_query_points = 5

init_subspaces = [
    trieste.acquisition.rule.SingleObjectiveTrustRegionBox(search_space)
    for _ in range(num_query_points)
]
base_rule = trieste.acquisition.rule.EfficientGlobalOptimization(  # type: ignore[var-annotated]
    builder=trieste.acquisition.ParallelContinuousThompsonSampling(),
    num_query_points=num_query_points,
)
batch_acq_rule = trieste.acquisition.rule.BatchTrustRegionBox(
    init_subspaces, base_rule
)
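
# %% [markdown]
# A minimal check (added for illustration) of the note above: the number of initial sub-spaces
# must match the number of batch query points requested from the base rule.

# %%
assert len(init_subspaces) == num_query_points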

# %% [markdown]
# ### Run the optimization loop
#
# We run the Bayesian optimization loop as before by defining a `BayesianOptimizer` and calling its
# `optimize` method with the trust region rule. Once the optimization loop is complete, the
# optimizer will return `num_query_points` new query points for every step in the loop. With
# 5 steps, that's 25 points in total.

# %%
bo = trieste.bayesian_optimizer.BayesianOptimizer(observer, search_space)

num_steps = 5
result = bo.optimize(
    num_steps, initial_data, build_model(), batch_acq_rule, track_state=True
)
dataset = result.try_get_final_dataset()
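
# %% [markdown]
# As before, a small sanity check (not part of the original notebook) confirms the arithmetic:
# 10 initial points plus 5 steps of 5 points each gives 35 points in total.

# %%
assert dataset.query_points.shape[0] == (
    num_initial_data_points + num_steps * num_query_points
)
print(f"Total number of query points: {dataset.query_points.shape[0]}")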

# %% [markdown]
# ### Visualizing batch trust region results
#
# We visualize the results as before.

# %%
plot_final_result(dataset)

# %%
plot_history(result)

# %% [markdown]
# ## Trust region `TurBO` acquisition rule
#
# Finally, we show how to run Bayesian optimization with the `TurBO` algorithm. This is a
# trust region algorithm that uses local models and datasets to approximate the objective function
# within one trust region.
Review comment (Collaborator): not sure what the right wording is, but perhaps "within their
respective trust regions"? otherwise it could sound like a single TR algorithm? ignore if you
think this is sufficiently clear as is

Reply (Author): I did have slightly different wording before that implied multiple regions, but
explicitly changed it to one region. The current TurBO implementation only supports one region.
When that is replaced with new classes in a future PR, I can update the wording.

#
# ### Create `TurBO` rule and run optimization loop
#
# As before, this meta-rule requires the specification of an acquisition base-rule for performing
# optimization within the trust region; for our example we use `DiscreteThompsonSampling`.
#
# Note that we switch off global model fitting by setting `fit_model=False`. This is because
# `TurBO` uses a local model and fitting the global model would be redundant and wasteful.

# %%
turbo_acq_rule = trieste.acquisition.rule.TURBO(
    search_space, rule=trieste.acquisition.rule.DiscreteThompsonSampling(500, 3)
)
bo = trieste.bayesian_optimizer.BayesianOptimizer(observer, search_space)

num_steps = 5
result = bo.optimize(
    num_steps,
    initial_data,
    build_model(),
    turbo_acq_rule,
    track_state=True,
    fit_model=False,
)
dataset = result.try_get_final_dataset()
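
# %% [markdown]
# One more small check (added for illustration, and assuming `DiscreteThompsonSampling(500, 3)`
# selects 3 query points per step from 500 candidate samples): after 5 steps we expect
# 10 + 5 * 3 = 25 points in total.

# %%
assert dataset.query_points.shape[0] == num_initial_data_points + num_steps * 3
print(f"Total number of query points: {dataset.query_points.shape[0]}")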

# %% [markdown]
# ### Visualizing `TurBO` results
#
# We display the results as before.

# %%
plot_final_result(dataset)

# %%
plot_history(result)

# %% [markdown]
# ## LICENSE
#
# [Apache License 2.0](https://github.com/secondmind-labs/trieste/blob/develop/LICENSE)
8 changes: 8 additions & 0 deletions docs/refs.bib
@@ -521,3 +521,11 @@ @inproceedings{wang2013bayesian
year={2013}
}

@misc{diouane2022trego,
title={TREGO: a Trust-Region Framework for Efficient Global Optimization},
author={Youssef Diouane and Victor Picheny and Rodolphe Le Riche and Alexandre Scotto Di Perrotolo},
year={2022},
eprint={2101.06808},
archivePrefix={arXiv},
primaryClass={math.OC}
}
1 change: 1 addition & 0 deletions docs/tutorials.rst
@@ -40,6 +40,7 @@ The following tutorials illustrate solving different types of optimization problems
notebooks/qhsri-tutorial
notebooks/multifidelity_modelling
notebooks/rembo
notebooks/trust_region

Frequently asked questions
--------------------------
2 changes: 1 addition & 1 deletion setup.py
@@ -49,7 +49,7 @@
"greenlet>=1.1.0",
],
extras_require={
"plotting": ["seaborn", "plotly"],
"plotting": ["seaborn", "plotly", "imageio"],
"qhsri": ["pymoo", "cvxpy"],
},
)
3 changes: 3 additions & 0 deletions trieste/experimental/plotting/__init__.py
@@ -23,13 +23,16 @@
    plot_objective_and_constraints,
)
from .plotting import (
    convert_figure_to_frame,
    convert_frames_to_gif,
    plot_acq_function_2d,
    plot_bo_points,
    plot_function_2d,
    plot_gp_2d,
    plot_mobo_history,
    plot_mobo_points_in_obj_space,
    plot_regret,
    plot_trust_region_history_2d,
)
from .plotting_plotly import (
    add_bo_points_plotly,