From feb0f0418d1ad0125d1252df4d40697862715132 Mon Sep 17 00:00:00 2001 From: David Eriksson Date: Wed, 15 Mar 2023 11:13:23 -0600 Subject: [PATCH 1/2] Drop the number of candidates --- scripts/run_tutorials.py | 2 - tutorials/scalable_constrained_bo.ipynb | 377 ++++++++++-------------- 2 files changed, 163 insertions(+), 216 deletions(-) diff --git a/scripts/run_tutorials.py b/scripts/run_tutorials.py index c9849133b6..70ca41109b 100644 --- a/scripts/run_tutorials.py +++ b/scripts/run_tutorials.py @@ -27,8 +27,6 @@ RUN_IF_SMOKE_TEST_IGNORE_IF_STANDARD = { # only used in smoke tests "thompson_sampling.ipynb", # very slow without KeOps + GPU "composite_mtbo.ipynb", # TODO: very slow, figure out if we can make it faster - # Timing out in standard mode - "scalable_constrained_bo.ipynb", } diff --git a/tutorials/scalable_constrained_bo.ipynb b/tutorials/scalable_constrained_bo.ipynb index 637dc355b7..209d496929 100644 --- a/tutorials/scalable_constrained_bo.ipynb +++ b/tutorials/scalable_constrained_bo.ipynb @@ -7,7 +7,7 @@ "# Scalable Constrained Bayesian Optimization (SCBO)\n", "In this tutorial, we show how to implement Scalable Constrained Bayesian Optimization (SCBO) [1] in a closed loop in BoTorch.\n", "\n", - "We optimize the 20𝐷 Ackley function on the domain [−5,10]^20. This implementation uses two simple constraint functions c1 and c2. Our goal is to find values x which maximize Ackley(x) subject to the constraints c1(x) <= 0 and c2(x) <= 0.\n", + "We optimize the 20𝐷 Ackley function on the domain $[−5,10]^{20}$. This implementation uses two simple constraint functions $c1$ and $c2$. Our goal is to find values $x$ which maximizes $Ackley(x)$ subject to the constraints $c1(x) \\leq 0$ and $c2(x) \\leq 0$.\n", "\n", "[1]: David Eriksson and Matthias Poloczek. Scalable constrained Bayesian optimization. In International Conference on Artificial Intelligence and Statistics, pages 730–738. 
PMLR, 2021.\n", "(https://doi.org/10.48550/arxiv.2002.08526)\n", @@ -17,40 +17,37 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "import math\n", + "import os\n", + "import warnings\n", "from dataclasses import dataclass\n", "\n", - "import torch\n", - "from torch import Tensor\n", - "from botorch.fit import fit_gpytorch_mll\n", - "from botorch.models import SingleTaskGP\n", - "from botorch.test_functions import Ackley\n", - "from botorch.utils.transforms import unnormalize\n", - "from torch.quasirandom import SobolEngine\n", - "\n", "import gpytorch\n", + "import torch\n", "from gpytorch.constraints import Interval\n", "from gpytorch.kernels import MaternKernel, ScaleKernel\n", "from gpytorch.likelihoods import GaussianLikelihood\n", "from gpytorch.mlls import ExactMarginalLogLikelihood\n", - "from botorch.models.model_list_gp_regression import ModelListGP\n", + "from torch import Tensor\n", + "from torch.quasirandom import SobolEngine\n", "\n", - "# Constrained Max Posterior Sampling\n", - "# is a new sampling class, similar to MaxPosteriorSampling,\n", - "# which implements the constrained version of Thompson Sampling described in [1]\n", + "from botorch.fit import fit_gpytorch_mll\n", + "# Constrained Max Posterior Sampling is a new sampling class, similar to MaxPosteriorSampling,\n", + "# which implements the constrained version of Thompson Sampling described in [1].\n", "from botorch.generation.sampling import ConstrainedMaxPosteriorSampling\n", - "\n", - "import warnings\n", + "from botorch.models import SingleTaskGP\n", + "from botorch.models.model_list_gp_regression import ModelListGP\n", + "from botorch.test_functions import Ackley\n", + "from botorch.utils.transforms import unnormalize\n", "\n", "warnings.filterwarnings(\"ignore\")\n", "\n", "device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n", "dtype = torch.double\n", - "import os\n", "\n", "SMOKE_TEST = 
os.environ.get(\"SMOKE_TEST\")" ] @@ -64,7 +61,7 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": 2, "metadata": {}, "outputs": [], "source": [ @@ -102,7 +99,7 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": 3, "metadata": {}, "outputs": [], "source": [ @@ -136,20 +133,20 @@ }, { "cell_type": "code", - "execution_count": 7, + "execution_count": 4, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ - "TurboState(dim=20, batch_size=4, length=0.8, length_min=0.0078125, length_max=1.6, failure_counter=0, failure_tolerance=5, success_counter=0, success_tolerance=10, best_value=-inf, best_constraint_values=tensor([inf, inf]), restart_triggered=False)\n" + "ScboState(dim=20, batch_size=4, length=0.8, length_min=0.0078125, length_max=1.6, failure_counter=0, failure_tolerance=5, success_counter=0, success_tolerance=10, best_value=-inf, best_constraint_values=tensor([inf, inf]), restart_triggered=False)\n" ] } ], "source": [ "@dataclass\n", - "class TurboState:\n", + "class ScboState:\n", " dim: int\n", " batch_size: int\n", " length: float = 0.8\n", @@ -160,12 +157,7 @@ " success_counter: int = 0\n", " success_tolerance: int = 10 # Note: The original paper uses 3\n", " best_value: float = -float(\"inf\")\n", - " best_constraint_values: Tensor = (\n", - " torch.ones(\n", - " 2,\n", - " )\n", - " * torch.inf\n", - " )\n", + " best_constraint_values: Tensor = torch.ones(2,) * torch.inf\n", " restart_triggered: bool = False\n", "\n", " def __post_init__(self):\n", @@ -192,22 +184,20 @@ "\n", "\n", "def update_state(state, Y_next, C_next):\n", - " \"\"\"Method used to update the TuRBO state after each\n", - " step of optimization.\n", - "\n", - " Success and failure counters are updated accoding to\n", - " the objective values (Y_next) and constraint values (C_next)\n", - " of the batch of candidate points evaluated on the optimization step.\n", - "\n", - " As in the original TuRBO paper, a 
success is counted whenver\n", - " any one of the new candidate points imporves upon the incumbent\n", - " best point. The key difference for SCBO is that we only compare points\n", - " by their objective values when both points are valid (meet all constraints).\n", - " If exactly one of the two points beinc compared voliates a constraint, the\n", - " other valid point is automatically considered to be better. If both points\n", - " violate some constraints, we compare them inated by their constraint values.\n", + " \"\"\"Method used to update the TuRBO state after each step of optimization.\n", + "\n", + " Success and failure counters are updated according to the objective values \n", + " (Y_next) and constraint values (C_next) of the batch of candidate points \n", + " evaluated on the optimization step.\n", + "\n", + " As in the original TuRBO paper, a success is counted whenever any one of the \n", + " new candidate points improves upon the incumbent best point. The key difference \n", + " for SCBO is that we only compare points by their objective values when both points\n", + " are valid (meet all constraints). If exactly one of the two points being compared \n", + " violates a constraint, the other valid point is automatically considered to be better. 
\n", + " If both points violate some constraints, we compare them by their constraint values.\n", " The better point in this case is the one with minimum total constraint violation\n", - " (the minimum sum over constraint values)\"\"\"\n", + " (the minimum sum of constraint values)\"\"\"\n", "\n", " # Determine which candidates meet the constraints (are valid)\n", " bool_tensor = C_next <= 0\n", @@ -234,34 +224,33 @@ " # throw out all invalid candidates\n", " # (a valid candidate is always better than an invalid one)\n", "\n", - " # Case 1: if best valid candidate found has a higher obj value that incumbent best\n", - " # count a success, the obj valuse has been improved\n", - " imporved_obj = max(Valid_Y_next) > state.best_value + 1e-3 * math.fabs(\n", + " # Case 1: if the best valid candidate found has a higher objective value than \n", + " # incumbent best count a success, the obj value has been improved\n", + " improved_obj = max(Valid_Y_next) > state.best_value + 1e-3 * math.fabs(\n", " state.best_value\n", " )\n", " # Case 2: if incumbent best violates constraints\n", - " # count a success, we now have suggested a point which is valid and therfore better\n", + " # count a success, we now have suggested a point which is valid and thus better\n", " obtained_validity = torch.all(state.best_constraint_values > 0)\n", - " if imporved_obj or obtained_validity: # If Case 1 or Case 2\n", + " if improved_obj or obtained_validity: # If Case 1 or Case 2\n", " # count a success and update the best value and constraint values\n", " state.success_counter += 1\n", " state.failure_counter = 0\n", " state.best_value = max(Valid_Y_next).item()\n", " state.best_constraint_values = Valid_C_next[Valid_Y_next.argmax()]\n", " else:\n", - " # otherwise, count a fialure\n", + " # otherwise, count a failure\n", " state.success_counter = 0\n", " state.failure_counter += 1\n", "\n", " # Finally, update the length of the trust region according to the\n", " # updated success and 
failure counts\n", + " # updated success and failure counters\n", " state = update_tr_length(state)\n", - "\n", " return state\n", "\n", "\n", "# Define example state\n", - "state = TurboState(dim=dim, batch_size=batch_size)\n", + "state = ScboState(dim=dim, batch_size=batch_size)\n", "print(state)" ] }, @@ -276,7 +265,7 @@ }, { "cell_type": "code", - "execution_count": 8, + "execution_count": 5, "metadata": {}, "outputs": [], "source": [ @@ -292,14 +281,16 @@ "source": [ "### Generating a batch of candidates for SCBO \n", "\n", - "Just as in the TuRBO Tutorial (https://botorch.org/tutorials/turbo_1), we'll define a method generate_batch to generate a new batch of candidate points within the TuRBO trust region using thompson sampling. \n", + "Just as in the TuRBO Tutorial (https://botorch.org/tutorials/turbo_1), we'll define a method generate_batch to generate a new batch of candidate points within the TuRBO trust region using Thompson sampling. \n", + "\n", + "The key difference here from TuRBO is that, instead of using MaxPosteriorSampling to simply grab the candidates within the trust region with the maximum posterior values, we use ConstrainedMaxPosteriorSampling to instead grab the candidates within the trust region with the maximum posterior values subject to the constraint that the posteriors for the constraint models for c1(x) and c2(x) must be less than or equal to 0 for both candidates. \n", "\n", - "The key difference here from TuRBO is that, instead of using MaxPosteriorSampling to simply grab the candidates within the trust region with the maximum posterior values, we use ConstrainedMaxPosteriorSampling to instead grab the candidates within the trust region with the maximum posterior values subject to the constrain that the posteriors for the constraint models for c1(x) and c2(x) must be less than or equal to 0 for each candidate. 
In otherwords, we use additional GPs ('constraiant models') to model each black-box constraint (c1 and c2), and throw out all candidates for which the posterior prediction of these constraint models is greater than 0 (throw out all predicted constraint violators). According to [1], in the special case when all of the candidaates arae predicted to be constraint violators, we select the candidate with the minimum predicted violation. (See botorch.generation.sampling.ConstrainedMaxPosteriorSampling for implementation details)." + "We use additional GPs ('constraint models') to model each black-box constraint (c1 and c2), and throw out all candidates for which the sampled value for these constraint models is greater than 0. According to [1], in the special case when all of the candidates are predicted to be constraint violators, we select the candidate with the minimum predicted violation. (See botorch.generation.sampling.ConstrainedMaxPosteriorSampling for implementation details)." ] }, { "cell_type": "code", - "execution_count": 9, + "execution_count": 6, "metadata": {}, "outputs": [], "source": [ @@ -309,20 +300,15 @@ " X, # Evaluated points on the domain [0, 1]^d\n", " Y, # Function values\n", " batch_size,\n", - " n_candidates=None, # Number of candidates for Thompson sampling\n", - " constraint_model=None,\n", + " n_candidates, # Number of candidates for Thompson sampling\n", + " constraint_model,\n", "):\n", " assert X.min() >= 0.0 and X.max() <= 1.0 and torch.all(torch.isfinite(Y))\n", - " if n_candidates is None:\n", - " n_candidates = min(5000, max(2000, 200 * X.shape[-1]))\n", "\n", - " # Scale the TR to be proportional to the lengthscales\n", + " # Create the TR bounds\n", " x_center = X[Y.argmax(), :].clone()\n", - " weights = model.covar_module.base_kernel.lengthscale.squeeze().detach()\n", - " weights = weights / weights.mean()\n", - " weights = weights / torch.prod(weights.pow(1.0 / len(weights)))\n", - " tr_lb = torch.clamp(x_center - weights * state.length / 2.0, 0.0, 1.0)\n", - " tr_ub = torch.clamp(x_center + weights * 
state.length / 2.0, 0.0, 1.0)\n", - " tr_ub = torch.clamp(x_center + weights * state.length / 2.0, 0.0, 1.0)\n", + " tr_lb = torch.clamp(x_center - state.length / 2.0, 0.0, 1.0)\n", + " tr_ub = torch.clamp(x_center + state.length / 2.0, 0.0, 1.0)\n", "\n", " # Thompson Sampling w/ Constraints (SCBO)\n", " dim = X.shape[-1]\n", @@ -359,21 +345,21 @@ }, { "cell_type": "code", - "execution_count": 10, + "execution_count": 7, "metadata": {}, "outputs": [ { "data": { "text/plain": [ - "(tensor(-9.6854, device='cuda:0', dtype=torch.float64),\n", - " tensor(4.8509, device='cuda:0', dtype=torch.float64),\n", - " tensor(-9.8032, device='cuda:0', dtype=torch.float64),\n", - " tensor(4.7317, device='cuda:0', dtype=torch.float64),\n", - " tensor(-15.9292, device='cuda:0', dtype=torch.float64),\n", - " tensor(-12.4023, device='cuda:0', dtype=torch.float64))" + "(tensor(-9.6854, dtype=torch.float64),\n", + " tensor(4.8509, dtype=torch.float64),\n", + " tensor(-9.8032, dtype=torch.float64),\n", + " tensor(4.7317, dtype=torch.float64),\n", + " tensor(-15.9292, dtype=torch.float64),\n", + " tensor(-12.4023, dtype=torch.float64))" ] }, - "execution_count": 10, + "execution_count": 7, "metadata": {}, "output_type": "execute_result" } @@ -397,107 +383,96 @@ }, { "cell_type": "code", - "execution_count": 11, + "execution_count": null, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ - "44) Best value: -1.34e+01, TR length: 8.00e-01\n", - "48) Best value: -1.27e+01, TR length: 8.00e-01\n", - "52) Best value: -9.77e+00, TR length: 8.00e-01\n", - "56) Best value: -9.77e+00, TR length: 8.00e-01\n", - "60) Best value: -9.77e+00, TR length: 8.00e-01\n", - "64) Best value: -9.77e+00, TR length: 8.00e-01\n", - "68) Best value: -9.77e+00, TR length: 8.00e-01\n", - "72) Best value: -9.08e+00, TR length: 8.00e-01\n", - "76) Best value: -9.06e+00, TR length: 8.00e-01\n", - "80) Best value: -8.26e+00, TR length: 8.00e-01\n", - "84) Best value: -8.26e+00, TR 
length: 8.00e-01\n", - "88) Best value: -7.34e+00, TR length: 8.00e-01\n", - "92) Best value: -7.34e+00, TR length: 8.00e-01\n", - "96) Best value: -7.34e+00, TR length: 8.00e-01\n", - "100) Best value: -7.34e+00, TR length: 8.00e-01\n", - "104) Best value: -7.34e+00, TR length: 8.00e-01\n", - "108) Best value: -7.34e+00, TR length: 4.00e-01\n", - "112) Best value: -6.99e+00, TR length: 4.00e-01\n", - "116) Best value: -6.85e+00, TR length: 4.00e-01\n", - "120) Best value: -6.00e+00, TR length: 4.00e-01\n", - "124) Best value: -6.00e+00, TR length: 4.00e-01\n", - "128) Best value: -6.00e+00, TR length: 4.00e-01\n", - "132) Best value: -6.00e+00, TR length: 4.00e-01\n", - "136) Best value: -6.00e+00, TR length: 4.00e-01\n", - "140) Best value: -5.67e+00, TR length: 4.00e-01\n", - "144) Best value: -5.67e+00, TR length: 4.00e-01\n", - "148) Best value: -5.67e+00, TR length: 4.00e-01\n", - "152) Best value: -5.67e+00, TR length: 4.00e-01\n", - "156) Best value: -5.67e+00, TR length: 4.00e-01\n", - "160) Best value: -5.67e+00, TR length: 2.00e-01\n", - "164) Best value: -4.99e+00, TR length: 2.00e-01\n", - "168) Best value: -3.85e+00, TR length: 2.00e-01\n", - "172) Best value: -3.85e+00, TR length: 2.00e-01\n", - "176) Best value: -3.85e+00, TR length: 2.00e-01\n", - "180) Best value: -3.85e+00, TR length: 2.00e-01\n", - "184) Best value: -3.85e+00, TR length: 2.00e-01\n", - "188) Best value: -3.85e+00, TR length: 1.00e-01\n", - "192) Best value: -3.85e+00, TR length: 1.00e-01\n", - "196) Best value: -3.70e+00, TR length: 1.00e-01\n", - "200) Best value: -3.70e+00, TR length: 1.00e-01\n", - "204) Best value: -3.62e+00, TR length: 1.00e-01\n", - "208) Best value: -3.31e+00, TR length: 1.00e-01\n", - "212) Best value: -3.17e+00, TR length: 1.00e-01\n", - "216) Best value: -3.17e+00, TR length: 1.00e-01\n", - "220) Best value: -3.14e+00, TR length: 1.00e-01\n", - "224) Best value: -3.14e+00, TR length: 1.00e-01\n", - "228) Best value: -3.10e+00, TR length: 1.00e-01\n", - 
"232) Best value: -2.34e+00, TR length: 1.00e-01\n", - "236) Best value: -2.34e+00, TR length: 1.00e-01\n", - "240) Best value: -2.34e+00, TR length: 1.00e-01\n", - "244) Best value: -2.34e+00, TR length: 1.00e-01\n", - "248) Best value: -2.34e+00, TR length: 1.00e-01\n", - "252) Best value: -2.34e+00, TR length: 5.00e-02\n", - "256) Best value: -1.93e+00, TR length: 5.00e-02\n", - "260) Best value: -1.93e+00, TR length: 5.00e-02\n", - "264) Best value: -1.93e+00, TR length: 5.00e-02\n", - "268) Best value: -1.72e+00, TR length: 5.00e-02\n", - "272) Best value: -1.72e+00, TR length: 5.00e-02\n", - "276) Best value: -1.72e+00, TR length: 5.00e-02\n", - "280) Best value: -1.72e+00, TR length: 5.00e-02\n", - "284) Best value: -1.72e+00, TR length: 5.00e-02\n", - "288) Best value: -1.72e+00, TR length: 2.50e-02\n", - "292) Best value: -1.54e+00, TR length: 2.50e-02\n", - "296) Best value: -1.54e+00, TR length: 2.50e-02\n", - "300) Best value: -1.54e+00, TR length: 2.50e-02\n", - "304) Best value: -1.54e+00, TR length: 2.50e-02\n", - "308) Best value: -1.54e+00, TR length: 2.50e-02\n", - "312) Best value: -1.38e+00, TR length: 2.50e-02\n", - "316) Best value: -1.22e+00, TR length: 2.50e-02\n", - "320) Best value: -1.22e+00, TR length: 2.50e-02\n", - "324) Best value: -1.22e+00, TR length: 2.50e-02\n", - "328) Best value: -1.22e+00, TR length: 2.50e-02\n", - "332) Best value: -1.22e+00, TR length: 2.50e-02\n", - "336) Best value: -1.09e+00, TR length: 2.50e-02\n", - "340) Best value: -1.09e+00, TR length: 2.50e-02\n", - "344) Best value: -1.09e+00, TR length: 2.50e-02\n", - "348) Best value: -1.09e+00, TR length: 2.50e-02\n", - "352) Best value: -1.09e+00, TR length: 2.50e-02\n", - "356) Best value: -1.09e+00, TR length: 1.25e-02\n", - "360) Best value: -1.09e+00, TR length: 1.25e-02\n", - "364) Best value: -1.09e+00, TR length: 1.25e-02\n", - "368) Best value: -8.61e-01, TR length: 1.25e-02\n", - "372) Best value: -8.54e-01, TR length: 1.25e-02\n", - "376) Best value: 
-8.54e-01, TR length: 1.25e-02\n", - "380) Best value: -7.06e-01, TR length: 1.25e-02\n", - "384) Best value: -4.93e-01, TR length: 1.25e-02\n", - "388) Best value: -4.93e-01, TR length: 1.25e-02\n", - "392) Best value: -4.34e-01, TR length: 1.25e-02\n", - "396) Best value: -4.21e-01, TR length: 1.25e-02\n", - "400) Best value: -4.21e-01, TR length: 1.25e-02\n", - "404) Best value: -4.21e-01, TR length: 1.25e-02\n", - "408) Best value: -4.21e-01, TR length: 1.25e-02\n", - "412) Best value: -4.21e-01, TR length: 1.25e-02\n", - "416) Best value: -4.21e-01, TR length: 6.25e-03\n" + "44) Best value: -1.27e+01, TR length: 8.00e-01\n", + "48) Best value: -1.19e+01, TR length: 8.00e-01\n", + "52) Best value: -1.02e+01, TR length: 8.00e-01\n", + "56) Best value: -1.02e+01, TR length: 8.00e-01\n", + "60) Best value: -1.02e+01, TR length: 8.00e-01\n", + "64) Best value: -1.02e+01, TR length: 8.00e-01\n", + "68) Best value: -9.97e+00, TR length: 8.00e-01\n", + "72) Best value: -8.17e+00, TR length: 8.00e-01\n", + "76) Best value: -8.17e+00, TR length: 8.00e-01\n", + "80) Best value: -8.16e+00, TR length: 8.00e-01\n", + "84) Best value: -8.16e+00, TR length: 8.00e-01\n", + "88) Best value: -8.16e+00, TR length: 8.00e-01\n", + "92) Best value: -8.16e+00, TR length: 8.00e-01\n", + "96) Best value: -8.16e+00, TR length: 8.00e-01\n", + "100) Best value: -8.16e+00, TR length: 4.00e-01\n", + "104) Best value: -7.50e+00, TR length: 4.00e-01\n", + "108) Best value: -6.87e+00, TR length: 4.00e-01\n", + "112) Best value: -6.87e+00, TR length: 4.00e-01\n", + "116) Best value: -5.65e+00, TR length: 4.00e-01\n", + "120) Best value: -5.65e+00, TR length: 4.00e-01\n", + "124) Best value: -5.65e+00, TR length: 4.00e-01\n", + "128) Best value: -5.65e+00, TR length: 4.00e-01\n", + "132) Best value: -5.65e+00, TR length: 4.00e-01\n", + "136) Best value: -5.65e+00, TR length: 2.00e-01\n", + "140) Best value: -4.71e+00, TR length: 2.00e-01\n", + "144) Best value: -4.71e+00, TR length: 2.00e-01\n", 
+ "148) Best value: -4.71e+00, TR length: 2.00e-01\n", + "152) Best value: -4.36e+00, TR length: 2.00e-01\n", + "156) Best value: -4.20e+00, TR length: 2.00e-01\n", + "160) Best value: -4.20e+00, TR length: 2.00e-01\n", + "164) Best value: -4.20e+00, TR length: 2.00e-01\n", + "168) Best value: -4.20e+00, TR length: 2.00e-01\n", + "172) Best value: -4.20e+00, TR length: 2.00e-01\n", + "176) Best value: -4.00e+00, TR length: 2.00e-01\n", + "180) Best value: -3.98e+00, TR length: 2.00e-01\n", + "184) Best value: -3.98e+00, TR length: 2.00e-01\n", + "188) Best value: -3.89e+00, TR length: 2.00e-01\n", + "192) Best value: -3.89e+00, TR length: 2.00e-01\n", + "196) Best value: -3.89e+00, TR length: 2.00e-01\n", + "200) Best value: -3.89e+00, TR length: 2.00e-01\n", + "204) Best value: -3.77e+00, TR length: 2.00e-01\n", + "208) Best value: -3.77e+00, TR length: 2.00e-01\n", + "212) Best value: -3.77e+00, TR length: 2.00e-01\n", + "216) Best value: -3.61e+00, TR length: 2.00e-01\n", + "220) Best value: -3.61e+00, TR length: 2.00e-01\n", + "224) Best value: -3.61e+00, TR length: 2.00e-01\n", + "228) Best value: -3.61e+00, TR length: 2.00e-01\n", + "232) Best value: -3.61e+00, TR length: 2.00e-01\n", + "236) Best value: -3.61e+00, TR length: 1.00e-01\n", + "240) Best value: -3.22e+00, TR length: 1.00e-01\n", + "244) Best value: -3.06e+00, TR length: 1.00e-01\n", + "248) Best value: -2.85e+00, TR length: 1.00e-01\n", + "252) Best value: -2.85e+00, TR length: 1.00e-01\n", + "256) Best value: -2.70e+00, TR length: 1.00e-01\n", + "260) Best value: -2.70e+00, TR length: 1.00e-01\n", + "264) Best value: -2.69e+00, TR length: 1.00e-01\n", + "268) Best value: -2.69e+00, TR length: 1.00e-01\n", + "272) Best value: -2.69e+00, TR length: 1.00e-01\n", + "276) Best value: -2.69e+00, TR length: 1.00e-01\n", + "280) Best value: -2.69e+00, TR length: 1.00e-01\n", + "284) Best value: -2.69e+00, TR length: 5.00e-02\n", + "288) Best value: -2.66e+00, TR length: 5.00e-02\n", + "292) Best value: 
-2.16e+00, TR length: 5.00e-02\n", + "296) Best value: -1.60e+00, TR length: 5.00e-02\n", + "300) Best value: -1.60e+00, TR length: 5.00e-02\n", + "304) Best value: -1.60e+00, TR length: 5.00e-02\n", + "308) Best value: -1.60e+00, TR length: 5.00e-02\n", + "312) Best value: -1.60e+00, TR length: 5.00e-02\n", + "316) Best value: -1.60e+00, TR length: 2.50e-02\n", + "320) Best value: -1.56e+00, TR length: 2.50e-02\n", + "324) Best value: -1.37e+00, TR length: 2.50e-02\n", + "328) Best value: -1.37e+00, TR length: 2.50e-02\n", + "332) Best value: -1.37e+00, TR length: 2.50e-02\n", + "336) Best value: -1.28e+00, TR length: 2.50e-02\n", + "340) Best value: -1.26e+00, TR length: 2.50e-02\n", + "344) Best value: -1.26e+00, TR length: 2.50e-02\n", + "348) Best value: -1.26e+00, TR length: 2.50e-02\n", + "352) Best value: -1.26e+00, TR length: 2.50e-02\n", + "356) Best value: -1.26e+00, TR length: 2.50e-02\n", + "360) Best value: -1.26e+00, TR length: 1.25e-02\n", + "364) Best value: -1.21e+00, TR length: 1.25e-02\n", + "368) Best value: -9.79e-01, TR length: 1.25e-02\n", + "372) Best value: -9.79e-01, TR length: 1.25e-02\n" ] } ], @@ -505,8 +480,10 @@ "# Initialize TuRBO state\n", "from botorch.models.transforms.outcome import Standardize\n", "\n", - "state = TurboState(dim, batch_size=batch_size)\n", - "N_CANDIDATES = min(5000, max(2000, 200 * dim)) if not SMOKE_TEST else 4\n", + "state = ScboState(dim, batch_size=batch_size)\n", + "# Note: We use 2000 candidates here to make the tutorial run faster. 
\n", + "# SCBO actually uses min(5000, max(2000, 200 * dim)) candidate points by default.\n", + "N_CANDIDATES = 2000 if not SMOKE_TEST else 4\n", "\n", "\n", "def get_fitted_model(X, Y):\n", @@ -567,22 +544,18 @@ " # Update TuRBO state\n", " state = update_state(state, Y_next, C_next)\n", "\n", - " # Append data\n", - " # Notice we append all data, even points that violate\n", - " # the constriants, this is so our constraint models\n", - " # can learn more about the constranit functions and\n", - " # gain confidence about where violation occurs\n", + " # Append data. Note that we append all data, even points that violate\n", + " # the constraints. This is so our constraint models can learn more \n", + " # about the constraint functions and gain confidence in where violations occur.\n", " train_X = torch.cat((train_X, X_next), dim=0)\n", " train_Y = torch.cat((train_Y, Y_next), dim=0)\n", " C1 = torch.cat((C1, C1_next), dim=0)\n", " C2 = torch.cat((C2, C2_next), dim=0)\n", "\n", - " # Print current status\n", - " # Note: state.best_value is always the best objective value\n", - " # found so far which meets the constraints, or in the case\n", - " # that no points have been found yet which meet the constraints,\n", - " # it is the objective value of the point with the\n", - " # minimum constraint violation\n", + " # Print current status. 
Note that state.best_value is always the best \n", + " # objective value found so far which meets the constraints, or in the case\n", + " # that no points have been found yet which meet the constraints, it is the \n", + " # objective value of the point with the minimum constraint violation.\n", " print(\n", " f\"{len(train_X)}) Best value: {state.best_value:.2e}, TR length: {state.length:.2e}\"\n", " )" @@ -590,19 +563,11 @@ }, { "cell_type": "code", - "execution_count": 12, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "With constraints, the best value we found is: -0.4209\n" - ] - } - ], + "outputs": [], "source": [ - "# Valid samples must have BOTH c1 <= 0 and c2 <= 0\n", + "# Valid samples must have BOTH c1 <= 0 and c2 <= 0\n", "constraint_vals = torch.cat([C1, C2], dim=-1)\n", "bool_tensor = constraint_vals <= 0\n", "bool_tensor = torch.all(bool_tensor, dim=-1).unsqueeze(-1)\n", @@ -617,30 +582,15 @@ "source": [ "### Plot Results\n", "\n", - "Notice that with these two simple constraints, SCBO preforms about the same as to TuRBO (see TuRBO 1 tutorial notebok)" + "With these two simple constraints, SCBO performs similarly to TuRBO (see TuRBO-1 tutorial notebook)" ] }, { "cell_type": "code", - "execution_count": 13, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": { - "needs_background": "light" - }, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ - "# Plot Optimization Results\n", - "\n", "import matplotlib.pyplot as plt\n", "import numpy as np\n", "from matplotlib import rc\n", @@ -673,7 +623,7 @@ ], "metadata": { "kernelspec": { - "display_name": "Python 3.8.8 ('base')", + "display_name": "Python 3 (ipykernel)", "language": "python", "name": "python3" }, @@ -687,9 +637,8 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.8.8" + "version": "3.9.13" }, - "orig_nbformat": 4, "vscode": { "interpreter": { "hash": "9beb4c3e6521665a47c2b1e65f245d1b2309f4194f15ed6955f5e52622a9d29e" From 48d72834784ed7f7e07e19e04f1efde8d1ece571 Mon Sep 17 00:00:00 2001 From: David Eriksson Date: Wed, 15 Mar 2023 11:13:55 -0600 Subject: [PATCH 2/2] Update scalable_constrained_bo.ipynb --- tutorials/scalable_constrained_bo.ipynb | 37 +++++++++++++++++++++---- 1 file changed, 31 insertions(+), 6 deletions(-) diff --git a/tutorials/scalable_constrained_bo.ipynb b/tutorials/scalable_constrained_bo.ipynb index 209d496929..94a56fe820 100644 --- a/tutorials/scalable_constrained_bo.ipynb +++ b/tutorials/scalable_constrained_bo.ipynb @@ -383,7 +383,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 8, "metadata": {}, "outputs": [ { @@ -472,7 +472,13 @@ "360) Best value: -1.26e+00, TR length: 1.25e-02\n", "364) Best value: -1.21e+00, TR length: 1.25e-02\n", "368) Best value: -9.79e-01, TR length: 1.25e-02\n", - "372) Best value: -9.79e-01, TR length: 1.25e-02\n" + "372) Best value: -9.79e-01, TR length: 1.25e-02\n", + "376) Best value: -9.75e-01, TR length: 1.25e-02\n", + "380) Best value: -9.75e-01, TR length: 1.25e-02\n", + "384) Best value: -9.75e-01, TR length: 1.25e-02\n", + "388) Best value: -9.75e-01, TR length: 1.25e-02\n", + "392) Best value: -9.75e-01, TR length: 1.25e-02\n", + "396) Best value: -9.75e-01, TR length: 
6.25e-03\n" ] } ], @@ -563,9 +569,17 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 9, "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "With constraints, the best value we found is: -0.9748\n" + ] + } + ], "source": [ "# Valid samples must have BOTH c1 <= 0 and c2 <= 0\n", "constraint_vals = torch.cat([C1, C2], dim=-1)\n", @@ -587,9 +601,20 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 10, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "image/png": "\n", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], "source": [ "import matplotlib.pyplot as plt\n", "import numpy as np\n",