Add Bayesian Optimization into HiOp (#711)

nychiang · thartland · web-flow · commit ff0686bcd458 · 2025-03-14T09:51:55.000-07:00
* create branch

* add submodule smt

* add files into the correct folders

* remove smt

* update url

* remove python temp files

* addressing some of Cosmin's concerns and cleaning up BODriver

---------

Co-authored-by: Tucker Hartland <tucker.hartland@gmail.com>
diff --git a/.gitignore b/.gitignore
@@ -5,3 +5,5 @@ build_*
 .DS_Store
 _dist-default-build
 _dist-DEBUG
+*hiopbbpy.egg-info
+*__pycache__
diff --git a/.gitmodules b/.gitmodules
@@ -1,3 +1,4 @@
 [submodule "tpl/eigen"]
 	path = tpl/eigen
 	url = https://gitlab.com/libeigen/eigen.git
+
diff --git a/pyproject.toml b/pyproject.toml
@@ -0,0 +1,3 @@
+[build-system]
+requires = ["setuptools", "wheel", "numpy"]
+build-backend = "setuptools.build_meta"
diff --git a/setup.py b/setup.py
@@ -0,0 +1,29 @@
+'''
+This is the setup file for installing hiopbbpy
+
+Authors:    Tucker Hartland <hartland1@llnl.gov>
+            Nai-Yuan Chiang <chiang7@llnl.gov>
+'''
+
+import sys
+import numpy as np
+from setuptools import setup, find_packages
+
+
+metadata = dict(
+        name="hiopbbpy",
+        version="0.0.1",
+        description="HiOp black box optimization (hiopbbpy)",
+        author="Tucker hartland et al.",
+        author_email="hartland1@llnl.gov",
+        license="BSD-3",
+        packages=find_packages(where="src"),
+        package_dir={"": "src"},
+        install_requires=["smt"],
+        python_requires=">=3.9",
+        zip_safe=False,
+        url="https://github.com/LLNL/hiop",
+        download_url="https://github.com/LLNL/hiop",
+)
+
+setup(**metadata)
diff --git a/src/Drivers/hiopbbpy/BODriver.py b/src/Drivers/hiopbbpy/BODriver.py
@@ -0,0 +1,42 @@
+"""
+  Code description:
+     for a 2D example LpNormProblem
+        1) randomly sample training points
+        2) define a Kriging-based Gaussian-process (smt backend)
+           trained on said data
+        3) determine the minimizer via BOAlgorithm
+"""
+
+import numpy as np
+import matplotlib.pyplot as plt
+import warnings
+warnings.filterwarnings("ignore")
+from LpNormProblem import LpNormProblem
+from hiopbbpy.surrogate_modeling import smtKRG
+from hiopbbpy.opt import BOAlgorithm
+
+
+### parameters
+n_samples = 5 # number of initial samples used to train the GP
+theta = 1.e-2 # hyperparameter for GP kernel
+
+nx = 2 # dimension of the problem
+xlimits = np.array([[-5, 5], [-5, 5]]) # bounds on optimization variable; presumably one [lower, upper] row per dimension -- TODO confirm
+
+problem = LpNormProblem(nx, xlimits)
+print(problem.name, " problem")
+
+### initial training set
+# Ask the problem for n_samples points and evaluate the objective on them
+x_train = problem.sample(n_samples)
+y_train = problem.evaluate(x_train)
+
+# Define the GP surrogate model and train it on the initial training set
+gp_model = smtKRG(theta, xlimits, nx)
+gp_model.train(x_train, y_train)
+
+# Instantiate and run Bayesian Optimization
+bo = BOAlgorithm(gp_model, x_train, y_train)
+bo.optimize(problem)
+
+# Retrieve optimal point (the values are not used further in this script)
+x_opt, y_opt = bo.getOptimalPoint()
diff --git a/src/Drivers/hiopbbpy/LpNormProblem.py b/src/Drivers/hiopbbpy/LpNormProblem.py
@@ -0,0 +1,25 @@
+"""
+Implementation of the LPNorm problem class f(x) = || x ||_p
+
+Authors:    Tucker Hartland <hartland1@llnl.gov>
+            Nai-Yuan Chiang <chiang7@llnl.gov>
+"""
+import numpy as np
+from hiopbbpy.problems.problem import Problem
+
+class LpNormProblem(Problem):
+    def __init__(self, ndim, xlimits, p=2.0):
+        name = "LpNormProblem"
+        super().__init__(ndim, xlimits, name=name)
+        self.p = p
+
+    def _evaluate(self, x):
+        ne, nx = x.shape
+        assert nx == self.ndim
+        y = np.zeros((ne, 1))
+        ytemp = np.linalg.norm(x, ord=self.p, axis=1)
+        if len(ytemp.shape) == 1:
+            y[:,0] = ytemp[:]
+        elif len(ytemp.shape) == 2:
+            y[:,:] = ytemp[:,:]
+        return y
diff --git a/src/hiopbbpy/__init__.py b/src/hiopbbpy/__init__.py
@@ -0,0 +1,4 @@
+__all__ = [
+        "problems",
+        "surrogate_modeling",
+        "opt"]
diff --git a/src/hiopbbpy/opt/__init__.py b/src/hiopbbpy/opt/__init__.py
@@ -0,0 +1,9 @@
+from .boalgorithm import (BOAlgorithmBase, BOAlgorithm)
+from .acquisition import (acquisition, LCBacquisition)
+
+__all__ = [
+        "BOAlgorithmBase"
+        "BOAlgorithm"
+        "acquisition"
+        "LCBacquisition"
+        ]
diff --git a/src/hiopbbpy/opt/acquisition.py b/src/hiopbbpy/opt/acquisition.py
@@ -0,0 +1,32 @@
+"""
+This file implements different acquisition functions, which are used in Bayesian optimization to decide where to sample next.
+
+Authors:    Tucker Hartland <hartland1@llnl.gov>
+            Nai-Yuan Chiang <chiang7@llnl.gov>
+"""
+
+import numpy as np
+from ..surrogate_modeling.gp import GaussianProcess
+
+# A base class for acquisition functions
+class acquisition(object):
+    def __init__(self, gpsurrogate):
+        assert isinstance(gpsurrogate, GaussianProcess) # add something here
+        self.gpsurrogate = gpsurrogate
+    
+    # Abstract method to evaluate the acquisition function at x.
+    def evaluate(self, x: np.ndarray) -> np.ndarray:
+        raise NotImplementedError("Child class of acquisition should implement method evaluate")
+
+
+# A subclass of acquisition, implementing the Lower Confidence Bound (LCB) acquisition function.
+class LCBacquisition(acquisition):
+    def __init__(self, gpsurrogate, beta=3.0):
+        super().__init__(gpsurrogate)
+        self.beta = beta
+
+    # Method to evaluate the acquisition function at x.
+    def evaluate(self, x : np.ndarray) -> np.ndarray:
+        mu = self.gpsurrogate.mean(x)
+        sig = self.gpsurrogate.variance(x)
+        return mu - self.beta * np.sqrt(sig)
diff --git a/src/hiopbbpy/opt/boalgorithm.py b/src/hiopbbpy/opt/boalgorithm.py
@@ -0,0 +1,173 @@
+"""
+Implementation of the Bayesian Optimization Algorithms
+
+Authors:    Tucker Hartland <hartland1@llnl.gov>
+            Nai-Yuan Chiang <chiang7@llnl.gov>
+"""
+
+import numpy as np
+from numpy.random import uniform
+from scipy.optimize import minimize
+from ..surrogate_modeling.gp import GaussianProcess
+from .acquisition import LCBacquisition
+from ..problems.problem import Problem
+
+# A base class defining a general framework for Bayesian Optimization
+class BOAlgorithmBase:
+    def __init__(self):
+        self.acquisition_type = "LCB" # Type of acquisition function (default = "LCB")
+        self.xtrain = None            # Training data
+        self.ytrain = None            # Training data
+        self.n_iter = 20              # Maximum number of optimization steps
+        self.n_start = 10             # estimating acquisition global optima by determining local optima n_start times and then determining the discrete max of that set
+        self.q = 1                    # batch size
+        # save some internal member train
+        self.y_hist = None            # History of evaluations
+        self.x_hist = None            # History of evaluations
+        self.x_opt = None             # Best observed point
+        self.y_opt = None             # Best observed value
+        self.idx_opt = None           # Index of the best observed value in the history
+
+    # Sets the acquisition function type and batch size
+    def setAcquisitionType(self, acquisition_type, q=1):
+        self.acquisition_type = acquisition_type
+        self.q = q
+
+    # Sets the training data
+    def setTrainingData(self, xtrain, ytrain):
+        self.xtrain = xtrain
+        self.ytrain = ytrain
+
+    # Method to perform Bayesian optimization
+    def optimize(self, fun):
+        assert NotImplementedError("Child class of hiopEGO should implement method optimize")
+
+    # Method to return the recorded optimization iterations and objectives
+    def getOptimizationHistory(self):
+        x_hist = np.array(self.x_hist, copy=True)
+        y_hist = np.array(self.y_hist, copy=True)
+        return x_hist, y_hist
+
+    # Method to return the optimal solution and objective
+    def getOptimalPoint(self):
+        x_opt = np.array(self.x_opt, copy=True)
+        y_opt = np.array(self.y_opt, copy=True)
+        return x_opt, y_opt
+
+# A subclass of BOAlgorithmBase implementing a full Bayesian Optimization workflow
+class BOAlgorithm(BOAlgorithmBase):
+    def __init__(self, gpsurrogate, xtrain, ytrain, acquisition_type = "LCB"):
+        super().__init__()
+        assert isinstance(gpsurrogate, GaussianProcess)
+        assert acquisition_type in ["LCB"]
+        self.setTrainingData(xtrain, ytrain)
+        self.setAcquisitionType(acquisition_type)
+        self.gpsurrogate = gpsurrogate
+        self.n_iter = 20
+        self.method = "SLSQP"
+        self.bounds = self.gpsurrogate.get_bounds()
+        self.constraints = ()
+        self.options = {"maxiter": 200}
+        self.acqf_minimizer_callback = None
+
+    # Method to set up a callback function to minimize the acquisition function
+    def _setup_acqf_minimizer_callback(self):
+        self.acqf_minimizer_callback = lambda fun, x0: pyminimize(fun, x0, self.method, self.bounds, self.constraints, self.options)
+
+    # Method to train the GP model
+    def _train_surrogate(self, x_train, y_train):
+        self.gpsurrogate.train(x_train, y_train)
+
+    # Method to find the best next sampling point via optimizing the acquisition function
+    def _find_best_point(self, x_train, y_train, x0 = None):
+        self._train_surrogate(x_train, y_train)
+
+        if self.acquisition_type == "LCB":
+            acqf = LCBacquisition(self.gpsurrogate)
+        else:
+            raise NotImplementedError("No implemented acquisition_type associated to"+self.acquisition_type)
+
+        acqf_callback = lambda x: float(np.array(acqf.evaluate(np.atleast_2d(x))).flat[0])
+        
+        x_all = []
+        y_all = []
+        for ii in range(self.n_start):
+            success = False
+            # Generate random starting point if x0 is not provided
+            if x0 is None:
+                x0 = np.array([uniform(b[0], b[1]) for b in self.bounds])
+            xopt, yout, success = self.acqf_minimizer_callback(acqf_callback, x0)
+            
+            if success:
+                x_all.append(xopt)
+                y_all.append(yout)
+        
+        best_xopt = x_all[np.argmin(np.array(y_all))]
+
+        return best_xopt
+
+    # Set the optimization method
+    def set_method(self, method):
+        self.method = method
+
+    # Set the user options for the Bayesian optimization
+    def set_options(self, options):
+        self.options = options
+
+    # Method to perform Bayesian optimization
+    def optimize(self, prob:Problem):
+      x_train = self.xtrain
+      y_train = self.ytrain
+      
+      n_init_sample = np.size(x_train,0)
+      print(f"n_init_sample: {n_init_sample}")
+      self._setup_acqf_minimizer_callback()
+
+      self.x_hist = []
+      self.y_hist = []
+
+      for i in range(self.n_iter):
+          print(f"*****************************")
+          print(f"Iteration {i+1}/{self.n_iter}")
+
+          # Get a new sample point
+          x_new = self._find_best_point(x_train, y_train)
+
+          # Evaluate the new sample point
+          y_new = prob.evaluate(np.atleast_2d(x_new))
+
+          # Update training set
+          x_train = np.vstack([x_train, x_new])
+          y_train = np.vstack([y_train, y_new])
+
+          # Save the new sample point and its observation
+          self.x_hist.append(x_new)
+          self.y_hist.append(y_new)
+
+          print(f"Sampled point X: {x_new.flatten()}, Observation Y: {y_new.flatten()}")
+
+      # Save the optimal results and all the training data
+      self.idx_opt = np.argmin(y_train)
+      self.x_opt = x_train[self.idx_opt]
+      self.y_opt = y_train[self.idx_opt]
+      self.setTrainingData(x_train, y_train)
+
+      print()
+      print()
+      if self.idx_opt < n_init_sample:
+          print(f"Optimal at initial sample: {self.idx_opt+1}")
+      else:
+          print(f"Optimal at BO iteration: {self.idx_opt-n_init_sample+1} ")
+          
+      print(f"Optimal point: {self.x_opt.flatten()}, Optimal value: {self.y_opt}")
+
+
+# Find the minimum of the input objective `fun`, using the minimize function from SciPy. 
+def pyminimize(fun, x0, method, bounds, constraints, options):
+    y = minimize(fun, x0, method=method, bounds=bounds, constraints=constraints, options=options)
+    success = y.success
+    if not success:
+        print(y.message)
+    xopt = y.x
+    yopt = y.fun
+    return xopt, yopt, success
diff --git a/src/hiopbbpy/problems/__init__.py b/src/hiopbbpy/problems/__init__.py
@@ -0,0 +1,6 @@
+from .problem import Problem
+
+__all__ = [
+        "Problem"
+        ]
+
diff --git a/src/hiopbbpy/problems/problem.py b/src/hiopbbpy/problems/problem.py
diff --git a/src/hiopbbpy/surrogate_modeling/__init__.py b/src/hiopbbpy/surrogate_modeling/__init__.py
diff --git a/src/hiopbbpy/surrogate_modeling/gp.py b/src/hiopbbpy/surrogate_modeling/gp.py
diff --git a/src/hiopbbpy/surrogate_modeling/krg.py b/src/hiopbbpy/surrogate_modeling/krg.py

Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,3 @@`
	`1`	`+[build-system]`
	`2`	`+requires = ["setuptools", "wheel", "numpy"]`
	`3`	`+build-backend = "setuptools.build_meta"`