Skip to content
Merged
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
136 changes: 95 additions & 41 deletions libensemble/gen_funcs/persistent_gpCAM.py
Original file line number Diff line number Diff line change
@@ -1,11 +1,10 @@
"""Persistent generator exposing gpCAM functionality"""

import copy
import time

import numpy as np
from numpy.lib.recfunctions import repack_fields
from gpcam import GPOptimizer as GP
from scipy.spatial.distance import pdist, squareform

from libensemble.message_numbers import EVAL_GEN_TAG, FINISHED_PERSISTENT_GEN_TAG, PERSIS_STOP, STOP_TAG
from libensemble.tools.persistent_support import PersistentSupport
Expand Down Expand Up @@ -37,6 +36,24 @@ def _initialize_gpcAM(user_specs, libE_info):
return b, n, lb, ub, all_x, all_y, ps


def _read_testpoints(U):
"""Read numpy file containing evaluated points for measuring GP error"""
test_points_file = U.get('test_points_file')
if test_points_file is None:
return None

test_points = np.load(test_points_file)

# Remove any NaNs
nan_indices = [i for i, fval in enumerate(test_points['f']) if np.isnan(fval)]
test_points = np.delete(test_points, nan_indices, axis=0)

# In case large fields we don't need
test_points = repack_fields(test_points[["x", "f"]])

return test_points


def _generate_mesh(lb, ub, num_points=10):
"""
Generate a mesh of points in n-dimensional space over a hypercube defined by lb and ub.
Expand All @@ -54,41 +71,78 @@ def _generate_mesh(lb, ub, num_points=10):

# Convert the meshgrid to a list of points
points = np.stack(mesh, axis=-1).reshape(-1, len(lb))
D = squareform(pdist(points))
return points, D

return points


def _update_gp_and_eval_var(all_x, all_y, x_for_var):
def _update_gp_and_eval_var(all_x, all_y, x_for_var, test_points, persis_info):
"""
Update the GP using the points in all_x and their function values in
all_y. (We are assuming deterministic values in all_y, so we set the noise
to be 1e-8 when build the GP.) Then evaluates the posterior covariance at
points in x_for_var.
points in x_for_var. If we have test points, calculate mean square error
at those points.
"""
my_gp2S = GP(all_x, all_y, noise_variances=1e-8 * np.ones(len(all_y)))
my_gp2S.train(max_iter=2)
var_rand = my_gp2S.posterior_covariance(x_for_var, variance_only=True)["v(x)"]
# print(np.max(var_rand))
my_gp2S = GP(all_x, all_y, noise_variances=1e-12 * np.ones(len(all_y)))
my_gp2S.train()

# Obtain covariance in groups to prevent memory overload.
n_rows = x_for_var.shape[0]
var_vals = []
group_size = 1000

for start_idx in range(0, n_rows, group_size):
end_idx = min(start_idx + group_size, n_rows)
var_vals_group = my_gp2S.posterior_covariance(x_for_var[start_idx:end_idx], variance_only=True)["v(x)"]
var_vals.extend(var_vals_group)

return var_rand
assert len(var_vals) == n_rows, "Something wrong with the grouping"

persis_info.setdefault("max_variance", []).append(np.max(var_vals))
persis_info.setdefault("mean_variance", []).append(np.mean(var_vals))

def _find_eligible_points(sorted_indices, sorted_D, r):
if test_points is not None:
f_est = my_gp2S.posterior_mean(test_points["x"])["f(x)"]
mse = np.mean((f_est - test_points["f"])**2)
persis_info.setdefault("mean_squared_error", []).append(mse)
return np.array(var_vals)


def calculate_grid_distances(lb, ub, num_points):
    """Calculate the minimum and maximum distances between grid points.

    The minimum distance is the smallest spacing along any dimension of a
    regular grid with ``num_points`` points per dimension over ``[lb, ub]``;
    the maximum distance is the diagonal of the hypercube.
    """
    spacings = [(hi - lo) / (num_points - 1) for lo, hi in zip(lb, ub)]
    diagonal = np.sqrt(sum((hi - lo) ** 2 for lo, hi in zip(lb, ub)))
    return min(spacings), diagonal


def is_point_far_enough(point, eligible_points, r):
    """Check if point is at least r distance away from all points in eligible_points."""
    return all(np.linalg.norm(point - candidate) >= r for candidate in eligible_points)


def _find_eligible_points(x_for_var, sorted_indices, r, batch_size):
"""
Find points in X such that no point has another point within distance r with a larger F value.

:param x_for_var: positions of each point mesh
:param sorted_indices: Indices sorted based on variance (highest to lowest).
:param sorted_D: Sorted pairwise distance matrix for points in X.
:param r: Radius constraint.
:return: Indices of the eligible points in the original X.
:param batch_size: Number of points requested
:return: The eligible points in the original X.
"""

eligible_indices = []
for idx in range(len(sorted_indices)):
# Check if this point is within r distance of any point already added
if not any(sorted_D[idx, :idx] < r):
eligible_indices.append(sorted_indices[idx])
return eligible_indices
eligible_points = []
for idx in sorted_indices:
point = x_for_var[idx]
if is_point_far_enough(point, eligible_points, r):
eligible_points.append(point)
if len(eligible_points) == batch_size:
break
return np.array(eligible_points)


def persistent_gpCAM_simple(H_in, persis_info, gen_specs, libE_info):
Expand All @@ -103,60 +157,60 @@ def persistent_gpCAM_simple(H_in, persis_info, gen_specs, libE_info):
""" # noqa
U = gen_specs["user"]

test_points = _read_testpoints(U)

batch_size, n, lb, ub, all_x, all_y, ps = _initialize_gpcAM(U, libE_info)

# Send batches until manager sends stop tag
tag = None
persis_info["max_variance"] = []

if U.get("use_grid"):
x_for_var, D = _generate_mesh(lb, ub)
vals_above_diagonal = D[np.triu_indices(len(x_for_var), 1)]
r_high_init = np.max(vals_above_diagonal)
r_low_init = np.min(vals_above_diagonal)
num_points = 10
x_for_var = _generate_mesh(lb, ub, num_points)
r_low_init, r_high_init = calculate_grid_distances(lb, ub, num_points)

while tag not in [STOP_TAG, PERSIS_STOP]:
if all_x.shape[0] == 0:
x_new = persis_info["rand_stream"].uniform(lb, ub, (batch_size, n))
else:
if not U.get("use_grid"):
x_for_var = persis_info["rand_stream"].uniform(lb, ub, (10 * batch_size, n))
var_rand = _update_gp_and_eval_var(all_x, all_y, x_for_var)
persis_info["max_variance"].append(np.max(var_rand))
var_vals = _update_gp_and_eval_var(all_x, all_y, x_for_var, test_points, persis_info)

if U.get("use_grid"):
r_high = r_high_init
r_low = r_low_init
new_inds = []
x_new = []
r_cand = r_high # Let's start with a large radius and stop when we have batchsize points

sorted_indices = np.argsort(-var_rand)
sorted_D = D[:, sorted_indices][sorted_indices]
while len(new_inds) < batch_size:
new_inds = _find_eligible_points(sorted_indices, sorted_D, r_cand)
if len(new_inds) < batch_size:
sorted_indices = np.argsort(-var_vals)
while len(x_new) < batch_size:
x_new = _find_eligible_points(x_for_var, sorted_indices, r_cand, batch_size)
if len(x_new) < batch_size:
r_high = r_cand
r_cand = (r_high + r_low) / 2.0

x_new = x_for_var[new_inds[:batch_size]]
else:
x_new = x_for_var[np.argsort(var_rand)[-batch_size:]]
x_new = x_for_var[np.argsort(var_vals)[-batch_size:]]

H_o = np.zeros(batch_size, dtype=gen_specs["out"])
H_o["x"] = x_new
tag, Work, calc_in = ps.send_recv(H_o)

if calc_in is not None:
y_new = np.atleast_2d(calc_in["f"]).T
nan_indices = [i for i, fval in enumerate(y_new) if np.isnan(fval)]
x_new = np.delete(x_new, nan_indices, axis=0)
y_new = np.delete(y_new, nan_indices, axis=0)
all_x = np.vstack((all_x, x_new))
all_y = np.vstack((all_y, np.atleast_2d(calc_in["f"]).T))
all_y = np.vstack((all_y, y_new))

# If final points are sent with PERSIS_STOP, update model and get final var_rand
# If final points are sent with PERSIS_STOP, update model and get final var_vals
if calc_in is not None:
# H_o not updated by default - is persis_info
if not use_grid:
if not U.get("use_grid"):
x_for_var = persis_info["rand_stream"].uniform(lb, ub, (10 * batch_size, n))
var_rand = _update_gp_and_eval_var(all_x, all_y, x_for_var)
persis_info["max_variance"].append(np.max(var_rand))
var_vals = _update_gp_and_eval_var(all_x, all_y, x_for_var, test_points, persis_info)

return H_o, persis_info, FINISHED_PERSISTENT_GEN_TAG

Expand Down