@@ -21,6 +21,7 @@
     arXiv:1901.08275v1, 2019
 """
 
+from copy import deepcopy
 from math import log
 from typing import Callable, Optional
 
@@ -297,7 +298,6 @@ def _compute_information_gain(
         H1_hat = H1_bar - beta * (H0_bar - H0)
         ig = H0 - H1_hat  # batch_shape x num_fantasies
         ig = ig.permute(-1, *range(ig.dim() - 1))  # num_fantasies x batch_shape
-
         return ig
 
 
@@ -382,13 +382,29 @@ def __init__(
         self.cost_aware_utility = cost_aware_utility
         self.expand = expand
         self.project = project
+        self._cost_sampler = None
+
         # @TODO make sure fidelity_dims align in project, expand & cost_aware_utility
         # It seems very difficult due to the current way of handling project/expand
 
         # resample max values after initializing self.project
         # so that the max value samples are at the highest fidelity
         self._sample_max_values()
 
+    @property
+    def cost_sampler(self):
+        if self._cost_sampler is None:
+            # Note: Using the deepcopy here is essential. Removing it poses a
+            # problem if the base model and the cost model have a different
+            # number of outputs or test points (this would be caused by
+            # expand), as that would trigger re-sampling the base samples in
+            # the fantasy sampler. By cloning the sampler here, the right
+            # thing happens if the sizes are compatible; if they are not,
+            # samples will be drawn using different base samples, but at
+            # least the state of the fantasy sampler is left unchanged.
+            self._cost_sampler = deepcopy(self.fantasies_sampler)
+        return self._cost_sampler
+
     @t_batch_mode_transform(expected_q=1)
     def forward(self, X: Tensor) -> Tensor:
         r"""Evaluates `qMultifidelityMaxValueEntropy` at the design points `X`
@@ -422,8 +438,8 @@ def forward(self, X: Tensor) -> Tensor:
         ig = self._compute_information_gain(
             X=X_expand, mean_M=mean_M, variance_M=variance_M, covar_mM=covar_mM
         )
-
-        return self.cost_aware_utility(X, ig).mean(dim=0)  # average over the fantasies
+        ig = self.cost_aware_utility(X=X, deltas=ig, sampler=self.cost_sampler)
+        return ig.mean(dim=0)  # average over the fantasies
 
 
 def _sample_max_value_Thompson(
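The rewritten return path re-weights the per-fantasy information gain by cost before averaging over the fantasy dimension (dim=0, after the permute in _compute_information_gain). A hedged sketch of that composition, writing an inverse-cost weighting out directly instead of calling a cost model (the helper name and the precomputed expected_cost tensor are assumptions for illustration):

import torch


def cost_weighted_gain(ig: torch.Tensor, expected_cost: torch.Tensor) -> torch.Tensor:
    # ig: num_fantasies x batch_shape information gain (the `deltas`);
    # expected_cost: positive expected evaluation cost, broadcastable to ig.
    weighted = ig / expected_cost.clamp_min(1e-6)
    return weighted.mean(dim=0)  # average over the fantasies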