Add bo_w_trees and tests for bo_w_tp

jungtaekkim · Oct 11, 2021 · bc92dfd · bc92dfd
1 parent 83fb915
commit bc92dfd
Show file tree

Hide file tree

Showing 6 changed files with 1,122 additions and 6 deletions.
diff --git a/bayeso/bo/base_bo.py b/bayeso/bo/base_bo.py
@@ -59,7 +59,8 @@ def __init__(self,
         assert (range_X[:, 0] <= range_X[:, 1]).all()
         assert str_surrogate in constants.ALLOWED_SURROGATE
         assert str_acq in constants.ALLOWED_BO_ACQ
-        assert str_optimizer_method_bo in constants.ALLOWED_OPTIMIZER_METHOD_BO
+        assert str_optimizer_method_bo in constants.ALLOWED_OPTIMIZER_METHOD_BO \
+            + constants.ALLOWED_OPTIMIZER_METHOD_BO_TREES
 
         self.range_X = range_X
         self.num_dim = range_X.shape[0]

diff --git a/bayeso/bo/bo_w_gp.py b/bayeso/bo/bo_w_gp.py
@@ -16,7 +16,6 @@
     import cma
 except: # pragma: no cover
     cma = None
-import qmcpy
 
 from bayeso.bo import base_bo
 from bayeso import covariance
@@ -29,7 +28,7 @@
 
 class BOwGP(base_bo.BaseBO):
     """
-    It is a Bayesian optimization class.
+    It is a Bayesian optimization class with Gaussian process regression.
 
     :param range_X: a search space. Shape: (d, 2).
     :type range_X: numpy.ndarray

diff --git a/bayeso/bo/bo_w_tp.py b/bayeso/bo/bo_w_tp.py
@@ -16,7 +16,6 @@
     import cma
 except: # pragma: no cover
     cma = None
-import qmcpy
 
 from bayeso.bo import base_bo
 from bayeso import covariance
@@ -29,7 +28,7 @@
 
 class BOwTP(base_bo.BaseBO):
     """
-    It is a Bayesian optimization class.
+    It is a Bayesian optimization class with Student-:math:`t` process regression.
 
     :param range_X: a search space. Shape: (d, 2).
     :type range_X: numpy.ndarray

diff --git a/bayeso/bo/bo_w_trees.py b/bayeso/bo/bo_w_trees.py
@@ -0,0 +1,237 @@
+#
+# author: Jungtaek Kim (jtkim@postech.ac.kr)
+# last updated: October 8, 2021
+#
+"""It defines a class of Bayesian optimization
+with tree-based surrogate models."""
+
+import numpy as np
+import time
+
+from bayeso.bo import base_bo
+from bayeso.trees import trees_common
+from bayeso import constants
+from bayeso.utils import utils_bo
+from bayeso.utils import utils_logger
+
+
+class BOwTrees(base_bo.BaseBO):
+    """
+    It is a Bayesian optimization class with tree-based surrogate models.
+
+    :param range_X: a search space. Shape: (d, 2).
+    :type range_X: numpy.ndarray
+    :param str_surrogate: the name of surrogate model.
+    :type str_surrogate: str., optional
+    :param str_acq: the name of acquisition function.
+    :type str_acq: str., optional
+    :param normalize_Y: flag for normalizing outputs.
+    :type normalize_Y: bool., optional
+    :param str_optimizer_method_bo: the name of optimization method for
+        Bayesian optimization.
+    :type str_optimizer_method_bo: str., optional
+    :param debug: flag for printing log messages.
+    :type debug: bool., optional
+
+    """
+
+    def __init__(self, range_X: np.ndarray,
+        str_surrogate: str=constants.STR_SURROGATE_TREES,
+        str_acq: str=constants.STR_BO_ACQ,
+        normalize_Y: bool=constants.NORMALIZE_RESPONSE,
+        str_optimizer_method_bo: str=constants.STR_OPTIMIZER_METHOD_AO_TREES,
+        debug: bool=False
+    ):
+        """
+        Constructor method
+
+        """
+
+        assert isinstance(range_X, np.ndarray)
+        assert isinstance(str_surrogate, str)
+        assert isinstance(str_acq, str)
+        assert isinstance(normalize_Y, bool)
+        assert isinstance(str_optimizer_method_bo, str)
+        assert isinstance(debug, bool)
+        assert len(range_X.shape) == 2
+        assert range_X.shape[1] == 2
+        assert (range_X[:, 0] <= range_X[:, 1]).all()
+        assert str_surrogate in constants.ALLOWED_SURROGATE_TREES
+        assert str_acq in constants.ALLOWED_BO_ACQ
+        assert str_optimizer_method_bo in constants.ALLOWED_OPTIMIZER_METHOD_BO_TREES
+
+        super().__init__(range_X, str_surrogate, str_acq, str_optimizer_method_bo, normalize_Y, debug)
+
+    def get_trees(self, X_train, Y_train,
+        num_trees=100,
+        depth_max=5,
+        size_min_leaf=1,
+    ):
+        num_features = int(np.sqrt(self.num_dim))
+
+        if self.str_surrogate == 'rf':
+            from bayeso.trees import trees_random_forest
+            trees = trees_random_forest.get_random_forest(
+                X_train, Y_train, num_trees, depth_max, size_min_leaf, num_features
+            )
+        else:
+            raise NotImplementedError('allowed str_surrogate, but it is not implemented.')
+
+        return trees
+
+    def compute_posteriors(self,
+        X: np.ndarray, trees: constants.TYPING_LIST
+    ) -> np.ndarray:
+        """
+        It returns posterior mean and standard deviation functions over `X`.
+
+        :param X: inputs. Shape: (l, d) or (l, m, d).
+        :type X: numpy.ndarray
+        :param cov_X_X: kernel matrix over `X_train`. Shape: (n, n).
+        :type cov_X_X: numpy.ndarray
+        :param inv_cov_X_X: kernel matrix inverse over `X_train`. Shape: (n, n).
+        :type inv_cov_X_X: numpy.ndarray
+        :param hyps: dictionary of hyperparameters for Gaussian process.
+        :type hyps: dict.
+
+        :returns: posterior mean and standard deviation functions
+            over `X`. Shape: ((l, ), (l, )).
+        :rtype: (numpy.ndarray, numpy.ndarray)
+
+        """
+
+        pred_mean, pred_std = trees_common.predict_by_trees(X, trees)
+
+        pred_mean = np.squeeze(pred_mean, axis=1)
+        pred_std = np.squeeze(pred_std, axis=1)
+
+        return pred_mean, pred_std
+
+    def compute_acquisitions(self, X: np.ndarray,
+        X_train: np.ndarray, Y_train: np.ndarray,
+        trees: constants.TYPING_LIST
+    ) -> np.ndarray:
+        """
+        It computes acquisition function values over 'X',
+        where `X_train` and `Y_train` are given.
+
+        :param X: inputs. Shape: (l, d) or (l, m, d).
+        :type X: numpy.ndarray
+        :param X_train: inputs. Shape: (n, d) or (n, m, d).
+        :type X_train: numpy.ndarray
+        :param Y_train: outputs. Shape: (n, 1).
+        :type Y_train: numpy.ndarray
+
+        :returns: acquisition function values over `X`. Shape: (l, ).
+        :rtype: numpy.ndarray
+
+        """
+
+        assert isinstance(X, np.ndarray)
+        assert isinstance(X_train, np.ndarray)
+        assert isinstance(Y_train, np.ndarray)
+        assert len(X.shape) == 1 or len(X.shape) == 2 or len(X.shape) == 3
+        assert len(X_train.shape) == 2 or len(X_train.shape) == 3
+        assert len(Y_train.shape) == 2
+        assert Y_train.shape[1] == 1
+        assert X_train.shape[0] == Y_train.shape[0]
+
+        if len(X.shape) == 1:
+            X = np.atleast_2d(X)
+
+        if len(X_train.shape) == 2:
+            assert X.shape[1] == X_train.shape[1] == self.num_dim
+        else:
+            assert X.shape[2] == X_train.shape[2] == self.num_dim
+
+        fun_acquisition = utils_bo.choose_fun_acquisition(self.str_acq, constants.GP_NOISE)
+
+        pred_mean, pred_std = self.compute_posteriors(X, trees)
+
+        acquisitions = fun_acquisition(
+            pred_mean=pred_mean, pred_std=pred_std, Y_train=Y_train
+        )
+        acquisitions *= constants.MULTIPLIER_ACQ
+
+        return acquisitions
+
+    def optimize(self, X_train: np.ndarray, Y_train: np.ndarray,
+        str_sampling_method: str=constants.STR_SAMPLING_METHOD_AO,
+        num_samples: int=constants.NUM_SAMPLES_AO_TREES,
+    ) -> constants.TYPING_TUPLE_ARRAY_DICT:
+        """
+        It computes acquired example, candidates of acquired examples,
+        acquisition function values for the candidates, covariance matrix,
+        inverse matrix of the covariance matrix, hyperparameters optimized,
+        and execution times.
+
+        :param X_train: inputs. Shape: (n, d) or (n, m, d).
+        :type X_train: numpy.ndarray
+        :param Y_train: outputs. Shape: (n, 1).
+        :type Y_train: numpy.ndarray
+        :param str_sampling_method: the name of sampling method for
+            acquisition function optimization.
+        :type str_sampling_method: str., optional
+        :param num_samples: the number of samples.
+        :type num_samples: int., optional
+
+        :returns: acquired example and dictionary of information. Shape: ((d, ), dict.).
+        :rtype: (numpy.ndarray, dict.)
+
+        :raises: AssertionError
+
+        """
+
+        assert isinstance(X_train, np.ndarray)
+        assert isinstance(Y_train, np.ndarray)
+        assert isinstance(str_sampling_method, str)
+        assert isinstance(num_samples, int)
+        assert len(X_train.shape) == 2
+        assert len(Y_train.shape) == 2
+        assert Y_train.shape[1] == 1
+        assert X_train.shape[0] == Y_train.shape[0]
+        assert X_train.shape[1] == self.num_dim
+        assert num_samples > 0
+        assert str_sampling_method in constants.ALLOWED_SAMPLING_METHOD
+
+        time_start = time.time()
+
+        if self.normalize_Y and np.max(Y_train) != np.min(Y_train):
+            Y_train = (Y_train - np.min(Y_train)) / (np.max(Y_train) - np.min(Y_train)) \
+                * constants.MULTIPLIER_RESPONSE
+
+        time_start_surrogate = time.time()
+        trees = self.get_trees(X_train, Y_train)
+        time_end_surrogate = time.time()
+
+        time_start_acq = time.time()
+        next_points = self.get_samples(
+            str_sampling_method,
+            fun_objective=None,
+            num_samples=num_samples
+        )
+
+        fun_negative_acquisition = lambda X_test: -1.0 * self.compute_acquisitions(
+            X_test, X_train, Y_train, trees
+        )
+        acquisitions = fun_negative_acquisition(next_points)
+        ind_next_point = np.argmin(acquisitions)
+        next_point = next_points[ind_next_point]
+
+        time_end_acq = time.time()
+
+        time_end = time.time()
+
+        dict_info = {
+            'next_points': next_points,
+            'acquisitions': acquisitions,
+            'trees': trees,
+            'time_surrogate': time_end_surrogate - time_start_surrogate,
+            'time_acq': time_end_acq - time_start_acq,
+            'time_overall': time_end - time_start,
+        }
+
+        if self.debug:
+            self.logger.debug('overall time consumed to acquire: %.4f sec.', time_end - time_start)
+
+        return next_point, dict_info
diff --git a/bayeso/constants.py b/bayeso/constants.py
@@ -17,18 +17,21 @@
 TOLERANCE_DUPLICATED_ACQ = 1e-4
 
 STR_SURROGATE = 'gp'
+STR_SURROGATE_TREES = 'rf'
 STR_OPTIMIZER_METHOD_GP = 'BFGS'
 STR_OPTIMIZER_METHOD_TP = 'SLSQP'
 STR_COV = 'matern52'
 STR_BO_ACQ = 'ei'
 STR_INITIALIZING_METHOD_BO = 'sobol'
 STR_OPTIMIZER_METHOD_AO = 'L-BFGS-B'
 STR_SAMPLING_METHOD_AO = 'sobol'
+STR_OPTIMIZER_METHOD_AO_TREES = 'random'
 STR_MLM_METHOD = 'regular'
 STR_MODELSELECTION_METHOD = 'ml'
 
 NUM_GRIDS_AO = 50
 NUM_SAMPLES_AO = 100
+NUM_SAMPLES_AO_TREES = 10000
 
 MULTIPLIER_ACQ = 10.0
 MULTIPLIER_RESPONSE = 10.0
@@ -56,6 +59,7 @@
 ]
 ALLOWED_OPTIMIZER_METHOD_TP = ['L-BFGS-B', 'SLSQP']
 ALLOWED_OPTIMIZER_METHOD_BO = ['L-BFGS-B', 'DIRECT', 'CMA-ES']
+ALLOWED_OPTIMIZER_METHOD_BO_TREES = ['random']
 
 # INFO: Do not use _ (underscore) in base str_cov.
 ALLOWED_COV_BASE = ['eq', 'se', 'matern32', 'matern52']
@@ -66,7 +70,8 @@
 ALLOWED_SAMPLING_METHOD = ALLOWED_INITIALIZING_METHOD_BO + ['grid']
 ALLOWED_MLM_METHOD = ['regular', 'combined', 'converged']
 ALLOWED_MODELSELECTION_METHOD = ['ml', 'loocv']
-ALLOWED_SURROGATE = ['gp', 'tp', 'rf']
+ALLOWED_SURROGATE_TREES = ['rf']
+ALLOWED_SURROGATE = ALLOWED_SURROGATE_TREES + ['gp', 'tp']
 
 COLORS = np.array([
     'red',