Optimization with Continuous Descriptor Inputs and Engineered Features

Continuous descriptor inputs can be used in combination with engineered features to incorporate more domain knowledge into an optimization. An example could be a solvent or formulation optimization where, for each continuous input feature, additional information about its properties is available.

For examples in the literature, have a look at this paper.

Imports

import pandas as pd
import os
import matplotlib.pyplot as plt
import numpy as np

from bofire.data_models.features.api import ContinuousInput, ContinuousDescriptorInput, SumFeature, WeightedSumFeature, ContinuousOutput
from bofire.data_models.domain.api import Inputs, EngineeredFeatures, Outputs, Domain, Constraints
from bofire.benchmarks.api import Himmelblau, FormulationWrapper
from bofire.runners.api import run
from bofire.strategies.api import RandomStrategy, SoboStrategy
from bofire.data_models.surrogates.api import SingleTaskGPSurrogate
import bofire.surrogates.api as surrogates
from bofire.data_models.surrogates.api import BotorchSurrogates
from typing import Optional

# When SMOKE_TEST is set in the environment, the benchmark loops below run
# with drastically reduced repeat and iteration counts.
SMOKE_TEST = os.environ.get("SMOKE_TEST")

Problem Setup

For demo purposes, the formulation wrapper is used around the two-dimensional Himmelblau benchmark to turn it into a formulation problem with 7 features in total. For each original feature, three new features are introduced, plus one filler feature. The sum of each feature group is used as (normalized) input for the evaluation of the original Himmelblau function. The seventh feature acts as a filler so that the features always sum to 1, fulfilling the formulation/equality constraint. For more information on this setup, have a look at the docstring of FormulationWrapper.

# Wrap the 2D Himmelblau benchmark as a 7-feature formulation problem:
# 3 descriptor features per original dimension plus one filler feature.
bench = FormulationWrapper(benchmark=Himmelblau(), n_features_per_original_feature=3, n_filler_features=1)

The continuous descriptor features have the following descriptor values for the descriptors x_1 and x_2:

# Show the descriptor table (descriptors x_1, x_2) of all continuous descriptor inputs.
pd.concat([feat.to_df() for feat in bench.domain.inputs.get(ContinuousDescriptorInput)])
x_1 x_2
x_1_0 1.0 0.0
x_1_1 1.0 0.0
x_1_2 1.0 0.0
x_2_0 0.0 1.0
x_2_1 0.0 1.0
x_2_2 0.0 1.0

Benchmarks

Random Strategy

As a baseline, we run the random strategy on the problem.

def sample(domain):
    """Draw ten random candidate experiments from the given domain."""
    return RandomStrategy.make(domain=domain).ask(10)


def best(domain: Domain, experiments: pd.DataFrame) -> float:
    """Return the smallest observed objective value (minimization metric)."""
    return experiments["y"].min()

# Baseline: repeat the random search several times to estimate run-to-run variance.
n_repeats = 1 if SMOKE_TEST else 15
random_results = []
for _ in range(n_repeats):
    outcome = run(
        benchmark=bench,
        strategy_factory=lambda domain: RandomStrategy.make(domain=domain),
        n_iterations=2 if SMOKE_TEST else 40,
        metric=best,
        initial_sampler=sample,
        n_runs=1,
        n_procs=1,
    )
    # run returns one result per run; keep the experiments table of the single run.
    random_results.append(outcome[0][0])
  0%|          | 0/2 [00:00<?, ?it/s]Run 0:   0%|          | 0/2 [00:00<?, ?it/s]Run 0:   0%|          | 0/2 [00:00<?, ?it/s, Current Best:=10.550]Run 0:  50%|█████     | 1/2 [00:00<00:00,  8.25it/s, Current Best:=10.550]Run 0:  50%|█████     | 1/2 [00:00<00:00,  8.25it/s, Current Best:=10.550]Run 0:  50%|█████     | 1/2 [00:00<00:00,  8.25it/s, Current Best:=10.550]Run 0: 100%|██████████| 2/2 [00:00<00:00,  8.38it/s, Current Best:=10.550]Run 0: 100%|██████████| 2/2 [00:00<00:00,  8.35it/s, Current Best:=10.550]

Sobo Strategy

Next we run the SoboStrategy on the problem.

def sample(domain):
    """Return a copy of the pre-drawn initial experiments, restricted to the domain's input columns."""
    input_keys = domain.inputs.get_keys()
    return initial_experiments[input_keys].copy()

def best(domain: Domain, experiments: pd.DataFrame) -> float:
    """Current best (lowest) objective value seen so far."""
    return experiments["y"].min()

# SOBO with the plain surrogate, warm-started with the same random initial data.
sobo_results = []
for i in range(1 if SMOKE_TEST else 15):
    # Reuse the first 10 random experiments of repeat i as initial design.
    initial_experiments = random_results[i][:10].copy()
    outcome = run(
        benchmark=bench,
        strategy_factory=lambda domain: SoboStrategy.make(domain=domain),
        n_iterations=2 if SMOKE_TEST else 40,
        metric=best,
        initial_sampler=sample,
        n_runs=1,
        n_procs=1,
    )
    sobo_results.append(outcome[0][0])
  0%|          | 0/2 [00:00<?, ?it/s]Run 0:   0%|          | 0/2 [00:05<?, ?it/s]Run 0:   0%|          | 0/2 [00:05<?, ?it/s, Current Best:=10.550]Run 0:  50%|█████     | 1/2 [00:05<00:05,  5.87s/it, Current Best:=10.550]Run 0:  50%|█████     | 1/2 [00:11<00:05,  5.87s/it, Current Best:=10.550]Run 0:  50%|█████     | 1/2 [00:11<00:05,  5.87s/it, Current Best:=10.550]Run 0: 100%|██████████| 2/2 [00:11<00:00,  5.74s/it, Current Best:=10.550]Run 0: 100%|██████████| 2/2 [00:11<00:00,  5.76s/it, Current Best:=10.550]

Now we run the SoboStrategy again, but with an engineered feature as additional input. The WeightedSumFeature computes the sum over the specified descriptors weighted by the values of the involved original features.

def create_strategy(domain):
    """Build a SoboStrategy whose GP surrogate also sees an engineered feature.

    The WeightedSumFeature sums, per descriptor (x_1, x_2), the descriptor
    values of all continuous descriptor inputs weighted by the current feature
    values — giving the surrogate direct access to the two coordinates of the
    underlying Himmelblau function.
    """
    surrogate_data = SingleTaskGPSurrogate(
        inputs=domain.inputs,
        outputs=domain.outputs,
        engineered_features=EngineeredFeatures(
            features=[
                WeightedSumFeature(
                    key="WeightedSum",
                    features=bench.domain.inputs.get_keys(ContinuousDescriptorInput),
                    descriptors=["x_1", "x_2"],
                )
            ]
        ),
    )
    return SoboStrategy.make(
        domain=domain,
        surrogate_specs=BotorchSurrogates(surrogates=[surrogate_data]),
    )

# SOBO with the engineered WeightedSum feature, warm-started with the same
# random initial data as the other strategies.
sobo_engineered_results_all = []
for i in range(15 if not SMOKE_TEST else 1):
    initial_experiments = random_results[i][:10].copy()
    results = run(
        benchmark=bench,
        strategy_factory=create_strategy,
        # Fix: honor SMOKE_TEST here as well — this was a hard-coded 40,
        # inconsistent with the other benchmark loops above.
        n_iterations=40 if not SMOKE_TEST else 2,
        metric=best,
        initial_sampler=sample,
        n_runs=1,
        n_procs=1,
    )
    sobo_engineered_results_all.append(results[0][0])
/opt/hostedtoolcache/Python/3.12.12/x64/lib/python3.12/site-packages/bofire/surrogates/engineered_features.py:60: UserWarning:

Creating a tensor from a list of numpy.ndarrays is extremely slow. Please consider converting the list to a single numpy.ndarray with numpy.array() before converting to a tensor. (Triggered internally at /pytorch/torch/csrc/utils/tensor_new.cpp:253.)

  0%|          | 0/40 [00:00<?, ?it/s]Run 0:   0%|          | 0/40 [00:05<?, ?it/s]Run 0:   0%|          | 0/40 [00:05<?, ?it/s, Current Best:=8.740]Run 0:   2%|▎         | 1/40 [00:05<03:52,  5.95s/it, Current Best:=8.740]Run 0:   2%|▎         | 1/40 [00:11<03:52,  5.95s/it, Current Best:=8.740]Run 0:   2%|▎         | 1/40 [00:11<03:52,  5.95s/it, Current Best:=8.740]Run 0:   5%|▌         | 2/40 [00:11<03:47,  5.99s/it, Current Best:=8.740]Run 0:   5%|▌         | 2/40 [00:18<03:47,  5.99s/it, Current Best:=8.740]Run 0:   5%|▌         | 2/40 [00:18<03:47,  5.99s/it, Current Best:=8.740]Run 0:   8%|▊         | 3/40 [00:18<03:42,  6.02s/it, Current Best:=8.740]Run 0:   8%|▊         | 3/40 [00:24<03:42,  6.02s/it, Current Best:=8.740]Run 0:   8%|▊         | 3/40 [00:24<03:42,  6.02s/it, Current Best:=0.899]Run 0:  10%|█         | 4/40 [00:24<03:37,  6.03s/it, Current Best:=0.899]Run 0:  10%|█         | 4/40 [00:30<03:37,  6.03s/it, Current Best:=0.899]Run 0:  10%|█         | 4/40 [00:30<03:37,  6.03s/it, Current Best:=0.899]Run 0:  12%|█▎        | 5/40 [00:30<03:33,  6.11s/it, Current Best:=0.899]Run 0:  12%|█▎        | 5/40 [00:36<03:33,  6.11s/it, Current Best:=0.899]Run 0:  12%|█▎        | 5/40 [00:36<03:33,  6.11s/it, Current Best:=0.899]Run 0:  15%|█▌        | 6/40 [00:36<03:33,  6.29s/it, Current Best:=0.899]Run 0:  15%|█▌        | 6/40 [00:44<03:33,  6.29s/it, Current Best:=0.899]Run 0:  15%|█▌        | 6/40 [00:44<03:33,  6.29s/it, Current Best:=0.899]Run 0:  18%|█▊        | 7/40 [00:44<03:41,  6.73s/it, Current Best:=0.899]Run 0:  18%|█▊        | 7/40 [00:50<03:41,  6.73s/it, Current Best:=0.899]Run 0:  18%|█▊        | 7/40 [00:50<03:41,  6.73s/it, Current Best:=0.899]Run 0:  20%|██        | 8/40 [00:50<03:30,  6.57s/it, Current Best:=0.899]Run 0:  20%|██        | 8/40 [00:57<03:30,  6.57s/it, Current Best:=0.899]Run 0:  20%|██        | 8/40 [00:57<03:30,  6.57s/it, Current Best:=0.899]Run 0:  22%|██▎       | 9/40 [00:57<03:22,  6.54s/it, Current 
Best:=0.899]Run 0:  22%|██▎       | 9/40 [01:02<03:22,  6.54s/it, Current Best:=0.899]Run 0:  22%|██▎       | 9/40 [01:02<03:22,  6.54s/it, Current Best:=0.899]Run 0:  25%|██▌       | 10/40 [01:02<03:04,  6.14s/it, Current Best:=0.899]Run 0:  25%|██▌       | 10/40 [01:08<03:04,  6.14s/it, Current Best:=0.899]Run 0:  25%|██▌       | 10/40 [01:08<03:04,  6.14s/it, Current Best:=0.899]Run 0:  28%|██▊       | 11/40 [01:08<02:57,  6.11s/it, Current Best:=0.899]Run 0:  28%|██▊       | 11/40 [01:14<02:57,  6.11s/it, Current Best:=0.899]Run 0:  28%|██▊       | 11/40 [01:14<02:57,  6.11s/it, Current Best:=0.899]Run 0:  30%|███       | 12/40 [01:14<02:50,  6.10s/it, Current Best:=0.899]Run 0:  30%|███       | 12/40 [01:20<02:50,  6.10s/it, Current Best:=0.899]Run 0:  30%|███       | 12/40 [01:20<02:50,  6.10s/it, Current Best:=0.899]Run 0:  32%|███▎      | 13/40 [01:20<02:45,  6.12s/it, Current Best:=0.899]Run 0:  32%|███▎      | 13/40 [01:26<02:45,  6.12s/it, Current Best:=0.899]Run 0:  32%|███▎      | 13/40 [01:26<02:45,  6.12s/it, Current Best:=0.899]Run 0:  35%|███▌      | 14/40 [01:26<02:35,  5.98s/it, Current Best:=0.899]Run 0:  35%|███▌      | 14/40 [01:32<02:35,  5.98s/it, Current Best:=0.899]Run 0:  35%|███▌      | 14/40 [01:32<02:35,  5.98s/it, Current Best:=0.899]Run 0:  38%|███▊      | 15/40 [01:32<02:28,  5.93s/it, Current Best:=0.899]Run 0:  38%|███▊      | 15/40 [01:39<02:28,  5.93s/it, Current Best:=0.899]Run 0:  38%|███▊      | 15/40 [01:39<02:28,  5.93s/it, Current Best:=0.899]Run 0:  40%|████      | 16/40 [01:39<02:34,  6.42s/it, Current Best:=0.899]Run 0:  40%|████      | 16/40 [01:46<02:34,  6.42s/it, Current Best:=0.899]Run 0:  40%|████      | 16/40 [01:46<02:34,  6.42s/it, Current Best:=0.899]Run 0:  42%|████▎     | 17/40 [01:46<02:26,  6.36s/it, Current Best:=0.899]Run 0:  42%|████▎     | 17/40 [01:51<02:26,  6.36s/it, Current Best:=0.899]Run 0:  42%|████▎     | 17/40 [01:51<02:26,  6.36s/it, Current Best:=0.899]Run 0:  45%|████▌     | 18/40 
[01:51<02:12,  6.04s/it, Current Best:=0.899]Run 0:  45%|████▌     | 18/40 [01:56<02:12,  6.04s/it, Current Best:=0.899]Run 0:  45%|████▌     | 18/40 [01:56<02:12,  6.04s/it, Current Best:=0.899]Run 0:  48%|████▊     | 19/40 [01:56<02:02,  5.83s/it, Current Best:=0.899]Run 0:  48%|████▊     | 19/40 [02:02<02:02,  5.83s/it, Current Best:=0.899]Run 0:  48%|████▊     | 19/40 [02:02<02:02,  5.83s/it, Current Best:=0.899]Run 0:  50%|█████     | 20/40 [02:02<01:55,  5.76s/it, Current Best:=0.899]Run 0:  50%|█████     | 20/40 [02:07<01:55,  5.76s/it, Current Best:=0.899]Run 0:  50%|█████     | 20/40 [02:07<01:55,  5.76s/it, Current Best:=0.899]Run 0:  52%|█████▎    | 21/40 [02:07<01:47,  5.67s/it, Current Best:=0.899]Run 0:  52%|█████▎    | 21/40 [02:13<01:47,  5.67s/it, Current Best:=0.899]Run 0:  52%|█████▎    | 21/40 [02:13<01:47,  5.67s/it, Current Best:=0.899]Run 0:  55%|█████▌    | 22/40 [02:13<01:42,  5.68s/it, Current Best:=0.899]Run 0:  55%|█████▌    | 22/40 [02:19<01:42,  5.68s/it, Current Best:=0.899]Run 0:  55%|█████▌    | 22/40 [02:19<01:42,  5.68s/it, Current Best:=0.899]Run 0:  57%|█████▊    | 23/40 [02:19<01:35,  5.64s/it, Current Best:=0.899]Run 0:  57%|█████▊    | 23/40 [02:24<01:35,  5.64s/it, Current Best:=0.899]Run 0:  57%|█████▊    | 23/40 [02:24<01:35,  5.64s/it, Current Best:=0.899]Run 0:  60%|██████    | 24/40 [02:24<01:31,  5.73s/it, Current Best:=0.899]Run 0:  60%|██████    | 24/40 [02:30<01:31,  5.73s/it, Current Best:=0.899]Run 0:  60%|██████    | 24/40 [02:30<01:31,  5.73s/it, Current Best:=0.899]Run 0:  62%|██████▎   | 25/40 [02:30<01:25,  5.70s/it, Current Best:=0.899]Run 0:  62%|██████▎   | 25/40 [02:36<01:25,  5.70s/it, Current Best:=0.899]Run 0:  62%|██████▎   | 25/40 [02:36<01:25,  5.70s/it, Current Best:=0.899]Run 0:  65%|██████▌   | 26/40 [02:36<01:19,  5.65s/it, Current Best:=0.899]Run 0:  65%|██████▌   | 26/40 [02:40<01:19,  5.65s/it, Current Best:=0.899]Run 0:  65%|██████▌   | 26/40 [02:40<01:19,  5.65s/it, Current Best:=0.899]Run 
0:  68%|██████▊   | 27/40 [02:40<01:07,  5.18s/it, Current Best:=0.899]Run 0:  68%|██████▊   | 27/40 [02:46<01:07,  5.18s/it, Current Best:=0.899]Run 0:  68%|██████▊   | 27/40 [02:46<01:07,  5.18s/it, Current Best:=0.899]Run 0:  70%|███████   | 28/40 [02:46<01:05,  5.47s/it, Current Best:=0.899]Run 0:  70%|███████   | 28/40 [02:51<01:05,  5.47s/it, Current Best:=0.899]Run 0:  70%|███████   | 28/40 [02:51<01:05,  5.47s/it, Current Best:=0.899]Run 0:  72%|███████▎  | 29/40 [02:51<01:00,  5.53s/it, Current Best:=0.899]Run 0:  72%|███████▎  | 29/40 [02:58<01:00,  5.53s/it, Current Best:=0.899]Run 0:  72%|███████▎  | 29/40 [02:58<01:00,  5.53s/it, Current Best:=0.899]Run 0:  75%|███████▌  | 30/40 [02:58<00:56,  5.67s/it, Current Best:=0.899]Run 0:  75%|███████▌  | 30/40 [03:03<00:56,  5.67s/it, Current Best:=0.899]Run 0:  75%|███████▌  | 30/40 [03:03<00:56,  5.67s/it, Current Best:=0.899]Run 0:  78%|███████▊  | 31/40 [03:03<00:50,  5.59s/it, Current Best:=0.899]Run 0:  78%|███████▊  | 31/40 [03:08<00:50,  5.59s/it, Current Best:=0.899]Run 0:  78%|███████▊  | 31/40 [03:08<00:50,  5.59s/it, Current Best:=0.899]Run 0:  80%|████████  | 32/40 [03:08<00:43,  5.48s/it, Current Best:=0.899]Run 0:  80%|████████  | 32/40 [03:14<00:43,  5.48s/it, Current Best:=0.899]Run 0:  80%|████████  | 32/40 [03:14<00:43,  5.48s/it, Current Best:=0.899]Run 0:  82%|████████▎ | 33/40 [03:14<00:38,  5.47s/it, Current Best:=0.899]Run 0:  82%|████████▎ | 33/40 [03:19<00:38,  5.47s/it, Current Best:=0.899]Run 0:  82%|████████▎ | 33/40 [03:19<00:38,  5.47s/it, Current Best:=0.899]Run 0:  85%|████████▌ | 34/40 [03:19<00:33,  5.54s/it, Current Best:=0.899]Run 0:  85%|████████▌ | 34/40 [03:25<00:33,  5.54s/it, Current Best:=0.899]Run 0:  85%|████████▌ | 34/40 [03:25<00:33,  5.54s/it, Current Best:=0.899]Run 0:  88%|████████▊ | 35/40 [03:25<00:27,  5.48s/it, Current Best:=0.899]Run 0:  88%|████████▊ | 35/40 [03:30<00:27,  5.48s/it, Current Best:=0.899]Run 0:  88%|████████▊ | 35/40 [03:30<00:27,  
5.48s/it, Current Best:=0.535]Run 0:  90%|█████████ | 36/40 [03:30<00:22,  5.55s/it, Current Best:=0.535]Run 0:  90%|█████████ | 36/40 [03:36<00:22,  5.55s/it, Current Best:=0.535]Run 0:  90%|█████████ | 36/40 [03:36<00:22,  5.55s/it, Current Best:=0.535]Run 0:  92%|█████████▎| 37/40 [03:36<00:17,  5.73s/it, Current Best:=0.535]Run 0:  92%|█████████▎| 37/40 [03:43<00:17,  5.73s/it, Current Best:=0.535]Run 0:  92%|█████████▎| 37/40 [03:43<00:17,  5.73s/it, Current Best:=0.535]Run 0:  95%|█████████▌| 38/40 [03:43<00:11,  5.85s/it, Current Best:=0.535]Run 0:  95%|█████████▌| 38/40 [03:48<00:11,  5.85s/it, Current Best:=0.535]Run 0:  95%|█████████▌| 38/40 [03:48<00:11,  5.85s/it, Current Best:=0.150]Run 0:  98%|█████████▊| 39/40 [03:48<00:05,  5.72s/it, Current Best:=0.150]Run 0:  98%|█████████▊| 39/40 [03:54<00:05,  5.72s/it, Current Best:=0.150]Run 0:  98%|█████████▊| 39/40 [03:54<00:05,  5.72s/it, Current Best:=0.150]Run 0: 100%|██████████| 40/40 [03:54<00:00,  5.72s/it, Current Best:=0.150]Run 0: 100%|██████████| 40/40 [03:54<00:00,  5.86s/it, Current Best:=0.150]

Plot the performance

Next we plot the performance. Using the engineered features shows a clear benefit. Using a SAAS model on top would lead to even better results, as only two features are needed and SAAS models are very good at identifying the features of interest.

def get_padded_trajectories(dfs: list[pd.DataFrame]) -> list[np.ndarray]:
    """Turn raw experiment tables into log10 best-so-far trajectories of equal length.

    The first 10 rows of each frame are the initial random batch and are
    collapsed into a single starting value (their maximum, before the running
    minimum is applied); each subsequent row is one sequential proposal.
    Shorter trajectories are edge-padded (last value repeated) so that all
    returned arrays share the same length.

    Fix: the return annotation was ``np.ndarray`` although a list of arrays
    is returned.
    """
    trajectories = []
    for df in dfs:
        # One value for the initial batch, then one per optimization step.
        y_values = [df.y[:10].max()] + df.y[10:].tolist()
        # Running best (minimum) on a log10 scale.
        trajectories.append(np.minimum.accumulate(np.log10(y_values)))
    max_len = max(len(t) for t in trajectories)
    return [np.pad(t, (0, max_len - len(t)), mode="edge") for t in trajectories]

fig, ax = plt.subplots()

# One curve per strategy: mean log10 best-so-far with a standard-error band.
for results, label, color in [
    (random_results, "Random", "blue"),
    (sobo_results, "SOBO", "green"),
    (sobo_engineered_results_all, "SOBO Engineered", "red"),
]:
    trajectories = get_padded_trajectories(results)
    mean_traj = np.mean(trajectories, axis=0)
    sem_traj = np.std(trajectories, axis=0) / np.sqrt(len(trajectories))
    ax.plot(mean_traj, label=label, color=color)
    ax.fill_between(
        range(len(mean_traj)),
        mean_traj - sem_traj,
        mean_traj + sem_traj,
        color=color,
        alpha=0.2,
    )

ax.set_title('Optimization Performance')
ax.legend()
plt.show()