Commit 85a1efe

Merge remote-tracking branch 'upstream/master' into value_function

saitcakmak committed Nov 8, 2020
2 parents: b4a823d + dc868cc
Showing 9 changed files with 1,093 additions and 14 deletions.
88 changes: 88 additions & 0 deletions botorch/models/contextual.py
@@ -0,0 +1,88 @@
#!/usr/bin/env python3
# Copyright (c) Facebook, Inc. and its affiliates.
#
# This source code is licensed under the MIT license found in the
# LICENSE file in the root directory of this source tree.

from typing import Dict, List, Optional

from botorch.models.gp_regression import FixedNoiseGP
from botorch.models.kernels.contextual_lcea import LCEAKernel
from botorch.models.kernels.contextual_sac import SACKernel
from torch import Tensor


class SACGP(FixedNoiseGP):
    r"""A GP using the Structural Additive Contextual (SAC) kernel.

    Args:
        train_X: (n x d) X training data.
        train_Y: (n x 1) Y training data.
        train_Yvar: (n x 1) Noise variances of each training Y.
        decomposition: Keys are context names. Values are the indexes of the
            parameters belonging to the context. The parameter indexes are in
            the same order across contexts.
    """

    def __init__(
        self,
        train_X: Tensor,
        train_Y: Tensor,
        train_Yvar: Tensor,
        decomposition: Dict[str, List[int]],
    ) -> None:
        super().__init__(train_X=train_X, train_Y=train_Y, train_Yvar=train_Yvar)
        self.covar_module = SACKernel(
            decomposition=decomposition, batch_shape=self._aug_batch_shape
        )
        self.decomposition = decomposition
        self.to(train_X)


class LCEAGP(FixedNoiseGP):
    r"""A GP with the Latent Context Embedding Additive (LCE-A) kernel.

    Note that the model does not support batch training; input training
    data sets should have dim = 2.

    Args:
        train_X: (n x d) X training data.
        train_Y: (n x 1) Y training data.
        train_Yvar: (n x 1) Noise variance of Y.
        decomposition: Keys are context names. Values are the indexes of the
            parameters belonging to the context. The parameter indexes are in
            the same order across contexts.
        train_embedding: Whether to train the context embeddings
            (default: True).
        cat_feature_dict: Keys are context names and values are lists of
            categorical features, i.e. {"context_name": [cat_0, ..., cat_k]}.
            k equals the number of categorical variables. If None, the
            context names in the decomposition are used as the only
            categorical feature, i.e. k = 1.
        embs_feature_dict: Pre-trained continuous embedding features of each
            context.
        embs_dim_list: Embedding dimension for each categorical variable. The
            length equals the number of categorical features k. If None, the
            embedding dimension is set to 1 for each categorical variable.
        context_weight_dict: Known population weights of each context.
    """

    def __init__(
        self,
        train_X: Tensor,
        train_Y: Tensor,
        train_Yvar: Tensor,
        decomposition: Dict[str, List[int]],
        train_embedding: bool = True,
        cat_feature_dict: Optional[Dict] = None,
        embs_feature_dict: Optional[Dict] = None,
        embs_dim_list: Optional[List[int]] = None,
        context_weight_dict: Optional[Dict] = None,
    ) -> None:
        super().__init__(train_X=train_X, train_Y=train_Y, train_Yvar=train_Yvar)
        self.covar_module = LCEAKernel(
            decomposition=decomposition,
            batch_shape=self._aug_batch_shape,
            train_embedding=train_embedding,
            cat_feature_dict=cat_feature_dict,
            embs_feature_dict=embs_feature_dict,
            embs_dim_list=embs_dim_list,
            context_weight_dict=context_weight_dict,
        )
        self.decomposition = decomposition
        self.to(train_X)
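
For a sense of the intended API, here is a minimal usage sketch of SACGP, assuming hypothetical training data and a two-context decomposition of a 4-parameter space; LCEAGP is constructed analogously with its extra embedding arguments. It uses BoTorch's standard model-fitting utilities.

import torch
from botorch.fit import fit_gpytorch_model
from botorch.models.contextual import SACGP
from gpytorch.mlls import ExactMarginalLogLikelihood

# Hypothetical data: 10 observations over 4 parameters, with two contexts
# of two parameters each (parameter indexes in the same order per context).
train_X = torch.rand(10, 4)
train_Y = torch.rand(10, 1)
train_Yvar = torch.full_like(train_Y, 0.01)
decomposition = {"context_a": [0, 1], "context_b": [2, 3]}

model = SACGP(train_X, train_Y, train_Yvar, decomposition)
mll = ExactMarginalLogLikelihood(model.likelihood, model)
fit_gpytorch_model(mll)

# Posterior at 5 hypothetical test points.
posterior = model.posterior(torch.rand(5, 4))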
178 changes: 178 additions & 0 deletions botorch/models/contextual_multioutput.py
@@ -0,0 +1,178 @@
#!/usr/bin/env python3
# Copyright (c) Facebook, Inc. and its affiliates.
#
# This source code is licensed under the MIT license found in the
# LICENSE file in the root directory of this source tree.

from typing import List, Optional

import torch
from botorch.models.multitask import MultiTaskGP
from gpytorch.distributions.multivariate_normal import MultivariateNormal
from gpytorch.kernels.rbf_kernel import RBFKernel
from gpytorch.lazy import InterpolatedLazyTensor, LazyTensor
from gpytorch.likelihoods.gaussian_likelihood import FixedNoiseGaussianLikelihood
from gpytorch.priors.torch_priors import UniformPrior
from torch import Tensor
from torch.nn import ModuleList


class LCEMGP(MultiTaskGP):
    r"""The multi-task GP with the latent context embedding multioutput
    (LCE-M) kernel.

    Args:
        train_X: (n x d) X training data.
        train_Y: (n x 1) Y training data.
        task_feature: Column index of train_X to get context indices.
        context_cat_feature: (n_contexts x k) one-hot encoded context
            features. Rows are ordered by context indices. k equals the
            number of categorical variables. If None, task indices are
            used and k = 1.
        context_emb_feature: (n_contexts x m) pre-given continuous
            embedding features. Rows are ordered by context indices.
        embs_dim_list: Embedding dimension for each categorical variable.
            The length equals k. If None, the embedding dimension is set
            to 1 for each categorical variable.
        output_tasks: A list of task indices for which to compute model
            outputs. If omitted, return outputs for all task indices.
    """

    def __init__(
        self,
        train_X: Tensor,
        train_Y: Tensor,
        task_feature: int,
        context_cat_feature: Optional[Tensor] = None,
        context_emb_feature: Optional[Tensor] = None,
        embs_dim_list: Optional[List[int]] = None,
        output_tasks: Optional[List[int]] = None,
    ) -> None:
        super().__init__(
            train_X=train_X,
            train_Y=train_Y,
            task_feature=task_feature,
            output_tasks=output_tasks,
        )
        # context indices
        all_tasks = train_X[:, task_feature].unique()
        self.all_tasks = all_tasks.to(dtype=torch.long).tolist()
        self.all_tasks.sort()  # unique() returns sorted values; sort again for safety

        if context_cat_feature is None:
            context_cat_feature = all_tasks.unsqueeze(-1)
        self.context_cat_feature = context_cat_feature  # row indices = context indices
        self.context_emb_feature = context_emb_feature

        # construct emb_dims based on categorical features
        if embs_dim_list is None:
            # set embedding_dim = 1 for each categorical variable
            embs_dim_list = [1 for _i in range(context_cat_feature.size(1))]
        n_embs = sum(embs_dim_list)
        self.emb_dims = [
            (len(context_cat_feature[:, i].unique()), embs_dim_list[i])
            for i in range(context_cat_feature.size(1))
        ]
        # construct an embedding layer for each categorical feature
        self.emb_layers = ModuleList(
            [
                torch.nn.Embedding(num_embeddings=x, embedding_dim=y, max_norm=1.0)
                for x, y in self.emb_dims
            ]
        )
        self.task_covar_module = RBFKernel(
            ard_num_dims=n_embs, lengthscale_prior=UniformPrior(0.0, 2.0)
        )
        self.to(train_X)

    def _eval_context_covar(self) -> LazyTensor:
        """Obtain the context covariance matrix (num_contexts x num_contexts)."""
        all_embs = self._task_embeddings()
        return self.task_covar_module(all_embs)

    def _task_embeddings(self) -> Tensor:
        """Generate embedding features for all contexts."""
        embeddings = [
            emb_layer(
                self.context_cat_feature[:, i].to(dtype=torch.long)  # pyre-ignore
            )
            for i, emb_layer in enumerate(self.emb_layers)
        ]
        embeddings = torch.cat(embeddings, dim=1)

        # append pre-given continuous embedding features, if any
        if self.context_emb_feature is not None:
            embeddings = torch.cat(
                [embeddings, self.context_emb_feature], dim=1  # pyre-ignore
            )
        return embeddings

    def task_covar_matrix(self, task_idcs: Tensor) -> Tensor:
        """Compute the covariance matrix for the given task indices.

        Args:
            task_idcs: (n x 1) or (b x n x 1) task indices tensor.
        """
        covar_matrix = self._eval_context_covar()
        return InterpolatedLazyTensor(
            base_lazy_tensor=covar_matrix,
            left_interp_indices=task_idcs,
            right_interp_indices=task_idcs,
        ).evaluate()

    def forward(self, x: Tensor) -> MultivariateNormal:
        x_basic, task_idcs = self._split_inputs(x)
        # Compute base mean and covariance
        mean_x = self.mean_module(x_basic)
        covar_x = self.covar_module(x_basic)
        # Compute task covariances
        covar_i = self.task_covar_matrix(task_idcs)
        covar = covar_x.mul(covar_i)
        return MultivariateNormal(mean_x, covar)


class FixedNoiseLCEMGP(LCEMGP):
    r"""The multi-task GP with the latent context embedding multioutput
    (LCE-M) kernel, with known observation noise.

    Args:
        train_X: (n x d) X training data.
        train_Y: (n x 1) Y training data.
        train_Yvar: (n x 1) Noise variances of each training Y.
        task_feature: Column index of train_X to get context indices.
        context_cat_feature: (n_contexts x k) one-hot encoded context
            features. Rows are ordered by context indices. k equals the
            number of categorical variables. If None, task indices are
            used and k = 1.
        context_emb_feature: (n_contexts x m) pre-given continuous
            embedding features. Rows are ordered by context indices.
        embs_dim_list: Embedding dimension for each categorical variable.
            The length equals k. If None, the embedding dimension is set
            to 1 for each categorical variable.
        output_tasks: A list of task indices for which to compute model
            outputs. If omitted, return outputs for all task indices.
    """

    def __init__(
        self,
        train_X: Tensor,
        train_Y: Tensor,
        train_Yvar: Tensor,
        task_feature: int,
        context_cat_feature: Optional[Tensor] = None,
        context_emb_feature: Optional[Tensor] = None,
        embs_dim_list: Optional[List[int]] = None,
        output_tasks: Optional[List[int]] = None,
    ) -> None:
        self._validate_tensor_args(X=train_X, Y=train_Y, Yvar=train_Yvar)
        super().__init__(
            train_X=train_X,
            train_Y=train_Y,
            task_feature=task_feature,
            context_cat_feature=context_cat_feature,
            context_emb_feature=context_emb_feature,
            embs_dim_list=embs_dim_list,
            output_tasks=output_tasks,
        )
        self.likelihood = FixedNoiseGaussianLikelihood(noise=train_Yvar)
        self.to(train_X)
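
Similarly, a minimal sketch for LCEMGP with hypothetical data, where the last column of train_X carries the context (task) index; FixedNoiseLCEMGP takes the same arguments plus train_Yvar.

import torch
from botorch.models.contextual_multioutput import LCEMGP

# Hypothetical data: 20 observations over 2 parameters and 3 contexts; the
# task index is appended as the last column of train_X.
x = torch.rand(20, 2)
task = torch.randint(0, 3, (20, 1)).to(x)
train_X = torch.cat([x, task], dim=-1)
train_Y = torch.rand(20, 1)

model = LCEMGP(train_X=train_X, train_Y=train_Y, task_feature=2)

# (20 x 20) covariance between the tasks of each pair of observations.
task_covar = model.task_covar_matrix(task.to(dtype=torch.long))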
