Epistimio · Thomsch · Jun 12, 2020 · May 8, 2020 · May 12, 2020 · May 23, 2020
diff --git a/docs/src/user/algorithms.rst b/docs/src/user/algorithms.rst
@@ -210,6 +210,10 @@ the most promising point among the candidates.
 .. _Tree-structured Parzen Estimator:
     https://papers.nips.cc/paper/4443-algorithms-for-hyper-parameter-optimization.pdf
 
+.. note::
+
+   Current implementation only supports uniform, uniform discrete and choices as prior.
+   As for choices prior, the probabilities if any given will be ignored.
 
 Configuration
 ~~~~~~~~~~~~~

diff --git a/src/orion/algo/tpe.py b/src/orion/algo/tpe.py
@@ -36,6 +36,23 @@ def compute_max_ei_point(points, below_likelis, above_likelis):
     return points[point_index]
 
 
+def ramp_up_weights(total_num, flat_num, equal_weight):
+    """Adjust weights of observed trials.
+
+    :param total_num: total number of observed trials.
+    :param flat_num: the number of the most recent trials which
+        get the full weight where the others will be applied with a linear ramp
+        from 0 to 1.0. It will only take effect if equal_weight is False.
+    :param equal_weight: whether all the observed trails share the same weights.
+    """
+    if total_num < flat_num or equal_weight:
+        return numpy.ones(total_num)
+
+    ramp_weights = numpy.linspace(1.0 / total_num, 1.0, num=total_num - flat_num)
+    flat_weights = numpy.ones(flat_num)
+    return numpy.concatenate([ramp_weights, flat_weights])
+
+
 # pylint:disable=assignment-from-no-return
 def adaptive_parzen_estimator(mus, low, high,
                               prior_weight=1.0,
@@ -56,15 +73,6 @@ def adaptive_parzen_estimator(mus, low, high,
         get the full weight where the others will be applied with a linear ramp
         from 0 to 1.0. It will only take effect if equal_weight is False.
     """
-    def update_weights(total_num):
-        """Generate weights for all components"""
-        if total_num < flat_num or equal_weight:
-            return numpy.ones(total_num)
-
-        ramp_weights = numpy.linspace(1.0 / total_num, 1.0, num=total_num - flat_num)
-        flat_weights = numpy.ones(flat_num)
-        return numpy.concatenate([ramp_weights, flat_weights])
-
     mus = numpy.asarray(mus)
 
     prior_mu = (low + high) * 0.5
@@ -76,7 +84,7 @@ def update_weights(total_num):
         sorted_mus = mus[order]
         prior_mu_pos = numpy.searchsorted(sorted_mus, prior_mu)
 
-        weights = update_weights(size)
+        weights = ramp_up_weights(size, flat_num, equal_weight)
 
         mixture_mus = numpy.zeros(size + 1)
         mixture_mus[:prior_mu_pos] = sorted_mus[:prior_mu_pos]
@@ -163,7 +171,7 @@ class TPE(BaseAlgorithm):
 
     # pylint:disable=too-many-arguments
     def __init__(self, space, seed=None,
-                 n_initial_points=20, n_ei_candidates=24,
+                 n_initial_points=5, n_ei_candidates=24,
                  gamma=0.25, equal_weight=False,
                  prior_weight=1.0, full_weight_num=25):
 
@@ -177,12 +185,13 @@ def __init__(self, space, seed=None,
                                   full_weight_num=full_weight_num)
 
         for dimension in self.space.values():
+            if dimension.type not in ['real', 'integer', 'categorical']:
+                raise ValueError("TPE now only supports Real, Integer "
+                                 "and Categorical Dimension.")
 
-            if dimension.type not in ['real']:
-                raise ValueError("TPE now only supports Real Dimension.")
-
-            if dimension.prior_name not in ['uniform']:
-                raise ValueError("TPE now only supports uniform as prior.")
+            if dimension.prior_name not in ['uniform', 'int_uniform', 'choices']:
+                raise ValueError("TPE now only supports uniform, uniform discrete "
+                                 "and choices as prior.")
 
             shape = dimension.shape
             if shape and len(shape) != 1:
@@ -245,8 +254,11 @@ def suggest(self, num=1):
         else:
             point = []
             below_points, above_points = self.split_trials()
-            below_points = numpy.array([flatten_dims(point, self.space) for point in below_points])
-            above_points = numpy.array([flatten_dims(point, self.space) for point in above_points])
+
+            below_points = [flatten_dims(point, self.space) for point in below_points]
+            above_points = [flatten_dims(point, self.space) for point in above_points]
+            below_points = list(map(list, zip(*below_points)))
+            above_points = list(map(list, zip(*above_points)))
 
             idx = 0
             for dimension in self.space.values():
@@ -255,12 +267,23 @@ def suggest(self, num=1):
                 if not shape:
                     shape = (1,)
 
-                if dimension.type == 'real':
-                    points = self.sample_real_dimension(dimension, shape[0],
-                                                        below_points[:, idx: idx + shape[0]],
-                                                        above_points[:, idx: idx + shape[0]])
+                if dimension.type == 'real' and dimension.prior_name == 'uniform':
+                    points = self.sample_one_dimension(dimension, shape[0],
+                                                       below_points[idx: idx + shape[0]],
+                                                       above_points[idx: idx + shape[0]],
+                                                       self._sample_real_point)
+                elif dimension.type == 'integer' and dimension.prior_name == 'int_uniform':
+                    points = self.sample_one_dimension(dimension, shape[0],
+                                                       below_points[idx: idx + shape[0]],
+                                                       above_points[idx: idx + shape[0]],
+                                                       self._sample_int_point)
+                elif dimension.type == 'categorical' and dimension.prior_name == 'choices':
+                    points = self.sample_one_dimension(dimension, shape[0],
+                                                       below_points[idx: idx + shape[0]],
+                                                       above_points[idx: idx + shape[0]],
+                                                       self._sample_categorical_point)
                 else:
-                    raise ValueError("TPE now only support Real Dimension.")
+                    raise NotImplementedError()
 
                 if len(points) < shape[0]:
                     logger.warning('TPE failed to sample new point with configuration %s',
@@ -275,25 +298,27 @@ def suggest(self, num=1):
 
         return samples
 
-    def sample_real_dimension(self, dimension, shape_size, below_points, above_points):
-        """Sample values for a real dimension
+    # pylint:disable=no-self-use
+    def sample_one_dimension(self, dimension, shape_size, below_points, above_points, sampler):
+        """Sample values for a dimension
 
-        :param dimension: Real Dimension.
+        :param dimension: Dimension.
         :param shape_size: 1D Shape Size of the Real Dimension.
         :param below_points: good points with shape (m, n), n=shape_size.
         :param above_points: bad points with shape (m, n), n=shape_size.
+        :param sampler: method to sample one value for upon the dimension.
         """
         points = []
 
         for j in range(shape_size):
-            new_point = self._sample_real_point(dimension, below_points[:, j], above_points[:, j])
-            if new_point:
+            new_point = sampler(dimension, below_points[j], above_points[j])
+            if new_point is not None:
                 points.append(new_point)
 
         return points
 
     def _sample_real_point(self, dimension, below_points, above_points):
-        """Sample one value for a real dimension based on the observed good and bad points"""
+        """Sample one value for real dimension based on the observed good and bad points"""
         low, high = dimension.interval()
         below_mus, below_sigmas, below_weights = \
             adaptive_parzen_estimator(below_points, low, high, self.prior_weight,
@@ -314,6 +339,51 @@ def _sample_real_point(self, dimension, below_points, above_points):
 
         return None
 
+    def _sample_int_point(self, dimension, below_points, above_points):
+        """Sample one value for integer dimension based on the observed good and bad points"""
+        low, high = dimension.interval()
+        choices = range(low, high)
+
+        below_points = numpy.array(below_points).astype(int) - low
+        above_points = numpy.array(above_points).astype(int) - low
+
+        sampler_below = CategoricalSampler(self, below_points, choices)
+        candidate_points = sampler_below.sample(self.n_ei_candidates)
+
+        if list(candidate_points):
+            sampler_above = CategoricalSampler(self, above_points, choices)
+
+            lik_blow = sampler_below.get_loglikelis(candidate_points)
-            lik_blow = sampler_below.get_loglikelis(candidate_points)
+            lik_below = sampler_below.get_loglikelis(candidate_points)
-            lik_blow = sampler_below.get_loglikelis(candidate_points)
+            lik_below = sampler_below.get_loglikelis(candidate_points)
+            lik_above = sampler_above.get_loglikelis(candidate_points)
+
+            new_point = compute_max_ei_point(candidate_points, lik_blow, lik_above)
-            new_point = compute_max_ei_point(candidate_points, lik_blow, lik_above)
+            new_point = compute_max_ei_point(candidate_points, lik_below, lik_above)
-            new_point = compute_max_ei_point(candidate_points, lik_blow, lik_above)
+            new_point = compute_max_ei_point(candidate_points, lik_below, lik_above)
+            new_point = new_point + low
+            return new_point
+
+        return None
+
+    def _sample_categorical_point(self, dimension, below_points, above_points):
+        """Sample one value for categorical dimension based on the observed good and bad points"""
+        choices = dimension.categories
+
+        below_points = [choices.index(point) for point in below_points]
+        above_points = [choices.index(point) for point in above_points]
+
+        sampler_below = CategoricalSampler(self, below_points, choices)
+        candidate_points = sampler_below.sample(self.n_ei_candidates)
+
+        if list(candidate_points):
+            sampler_above = CategoricalSampler(self, above_points, choices)
+
+            lik_blow = sampler_below.get_loglikelis(candidate_points)
-            lik_blow = sampler_below.get_loglikelis(candidate_points)
+            lik_below = sampler_below.get_loglikelis(candidate_points)
-            lik_blow = sampler_below.get_loglikelis(candidate_points)
+            lik_below = sampler_below.get_loglikelis(candidate_points)
+            lik_above = sampler_above.get_loglikelis(candidate_points)
+
+            new_point_index = compute_max_ei_point(candidate_points, lik_blow, lik_above)
-            new_point_index = compute_max_ei_point(candidate_points, lik_blow, lik_above)
+            new_point_index = compute_max_ei_point(candidate_points, lik_below, lik_above)
-            new_point_index = compute_max_ei_point(candidate_points, lik_blow, lik_above)
+            new_point_index = compute_max_ei_point(candidate_points, lik_below, lik_above)
+            new_point = choices[new_point_index]
+
+            return new_point
+        return None
+
     def split_trials(self):
         """Split the observed trials into good and bad ones based on the ratio `gamma``"""
         sorted_trials = sorted(self._trials_info.values(), key=lambda x: x[1]['objective'])
@@ -402,3 +472,48 @@ def get_loglikelis(self, points):
                                                axis=1))
 
         return point_likeli
+
+
+class CategoricalSampler():
+    """Categorical Sampler for discrete integer and categorical choices
+
+    Parameters
+    ----------
+    tpe: `TPE` algorithm
+        The tpe algorithm object which this sampler will be part of.
+    observations: list
+        Observed values in the dimension
+    choices: list
+        Candidate values for the dimension
+
+    """
+
+    def __init__(self, tpe, observations, choices):
+        self.tpe = tpe
+        self.obs = observations
+        self.choices = choices
+
+        self._build_multinomial_weights()
+
+    def _build_multinomial_weights(self):
+        """Build weights for categorical distribution based on observations"""
+        weights_obs = ramp_up_weights(len(self.obs),
+                                      self.tpe.full_weight_num, self.tpe.equal_weight)
+        counts_obs = numpy.bincount(self.obs, minlength=len(self.choices), weights=weights_obs)
+        counts_obs = counts_obs + self.tpe.prior_weight
+        self.weights = counts_obs / counts_obs.sum()
+
+    def sample(self, num=1):
+        """Sample required number of points"""
+        samples = self.tpe.rng.multinomial(n=1, pvals=self.weights, size=num)
+
+        assert samples.shape == (num,) + (len(self.weights),)
+
+        samples_index = samples.argmax(-1)
+        assert samples_index.shape == (num,)
+
+        return samples_index
+
+    def get_loglikelis(self, points):
+        """Return the log likelihood for the points"""
+        return numpy.log(numpy.asarray(self.weights)[points])
diff --git a/tests/functional/algos/test_algos.py b/tests/functional/algos/test_algos.py
@@ -71,11 +71,9 @@ def test_simple(monkeypatch, config_file):
 
 @pytest.mark.usefixtures("clean_db")
 @pytest.mark.usefixtures("null_db_instances")
-def test_random_stop(monkeypatch):
+@pytest.mark.parametrize('config_file', config_files)
+def test_random_stop(monkeypatch, config_file):
     """Test a simple usage scenario."""
-    # TODO: TPE should support this case once discrete is added,
-    #  then parametrized config_file should be used
-    config_file = 'random_config.yaml'
     monkeypatch.chdir(os.path.dirname(os.path.abspath(__file__)))
     orion.core.cli.main(["hunt", "--config", config_file,
                          "./black_box.py", "-x~uniform(-10, 5, discrete=True)"])