consider num_samples in bs thread priority (#207)

* consider num_samples in bs thread priority * continue search for bs
2021-09-14 18:36:10 -07:00 · 2021-09-14 18:36:10 -07:00 · a9d39b71da
parent ea6c6ded2f
commit a9d39b71da
3 changed files with 376 additions and 231 deletions
--- a/flaml/searcher/blendsearch.py
+++ b/flaml/searcher/blendsearch.py
@ -1,9 +1,9 @@
-'''!
- * Copyright (c) 2020-2021 Microsoft Corporation. All rights reserved.
+"""!
+ * Copyright (c) Microsoft Corporation. All rights reserved.
 * Licensed under the MIT License. See LICENSE file in the
 * project root for license information.
-'''
-from typing import Dict, Optional, List, Tuple, Callable
+"""
+from typing import Dict, Optional, List, Tuple, Callable, Union
 import numpy as np
 import time
 import pickle
@ -11,7 +11,8 @@ import pickle

 try:
    from ray import __version__ as ray_version
-    assert ray_version >= '1.0.0'
+
+    assert ray_version >= "1.0.0"
    from ray.tune.suggest import Searcher
    from ray.tune.suggest.optuna import OptunaSearch as GlobalSearch
 except (ImportError, AssertionError):
@ -20,42 +21,45 @@ except (ImportError, AssertionError):
 from ..tune.trial import unflatten_dict, flatten_dict
 from .search_thread import SearchThread
 from .flow2 import FLOW2
-from ..tune.space import (
-    add_cost_to_space, indexof, normalize, define_by_run_func)
+from ..tune.space import add_cost_to_space, indexof, normalize, define_by_run_func

 import logging
+
 logger = logging.getLogger(__name__)


 class BlendSearch(Searcher):
-    '''class for BlendSearch algorithm
-    '''
+    """class for BlendSearch algorithm"""

    cost_attr = "time_total_s"  # cost attribute in result
-    lagrange = '_lagrange'      # suffix for lagrange-modified metric
-    penalty = 1e+10             # penalty term for constraints
+    lagrange = "_lagrange"  # suffix for lagrange-modified metric
+    penalty = 1e10  # penalty term for constraints
    LocalSearch = FLOW2

-    def __init__(self,
-                 metric: Optional[str] = None,
-                 mode: Optional[str] = None,
-                 space: Optional[dict] = None,
-                 low_cost_partial_config: Optional[dict] = None,
-                 cat_hp_cost: Optional[dict] = None,
-                 points_to_evaluate: Optional[List[dict]] = None,
-                 evaluated_rewards: Optional[List] = None,
-                 prune_attr: Optional[str] = None,
-                 min_resource: Optional[float] = None,
-                 max_resource: Optional[float] = None,
-                 reduction_factor: Optional[float] = None,
-                 global_search_alg: Optional[Searcher] = None,
-                 config_constraints: Optional[
-                     List[Tuple[Callable[[dict], float], str, float]]] = None,
-                 metric_constraints: Optional[
-                     List[Tuple[str, str, float]]] = None,
-                 seed: Optional[int] = 20,
-                 experimental: Optional[bool] = False):
-        '''Constructor
+    def __init__(
+        self,
+        metric: Optional[str] = None,
+        mode: Optional[str] = None,
+        space: Optional[dict] = None,
+        low_cost_partial_config: Optional[dict] = None,
+        cat_hp_cost: Optional[dict] = None,
+        points_to_evaluate: Optional[List[dict]] = None,
+        evaluated_rewards: Optional[List] = None,
+        time_budget_s: Union[int, float] = None,
+        num_samples: Optional[int] = None,
+        prune_attr: Optional[str] = None,
+        min_resource: Optional[float] = None,
+        max_resource: Optional[float] = None,
+        reduction_factor: Optional[float] = None,
+        global_search_alg: Optional[Searcher] = None,
+        config_constraints: Optional[
+            List[Tuple[Callable[[dict], float], str, float]]
+        ] = None,
+        metric_constraints: Optional[List[Tuple[str, str, float]]] = None,
+        seed: Optional[int] = 20,
+        experimental: Optional[bool] = False,
+    ):
+        """Constructor

        Args:
            metric: A string of the metric name to optimize for.
@ -87,6 +91,8 @@ class BlendSearch(Searcher):
                as a list so the optimiser can be told the results without
                needing to re-compute the trial. Must be the same length as
                points_to_evaluate.
+            time_budget_s: int or float | Time budget in seconds.
+            num_samples: int | The number of configs to try.
            prune_attr: A string of the attribute used for pruning.
                Not necessarily in space.
                When prune_attr is in space, it is a hyperparameter, e.g.,
@ -119,7 +125,7 @@ class BlendSearch(Searcher):
                e.g., `['precision', '>=', 0.9]`
            seed: An integer of the random seed.
            experimental: A bool of whether to use experimental features.
-        '''
+        """
        self._metric, self._mode = metric, mode
        init_config = low_cost_partial_config or {}
        if not init_config:
@ -132,8 +138,7 @@ class BlendSearch(Searcher):
        if evaluated_rewards and mode:
            self._points_to_evaluate = []
            self._evaluated_rewards = []
-            best = max(evaluated_rewards) if mode == 'max' else min(
-                evaluated_rewards)
+            best = max(evaluated_rewards) if mode == "max" else min(evaluated_rewards)
            # only keep the best points as start points
            for i, r in enumerate(evaluated_rewards):
                if r == best:
@ -152,51 +157,78 @@ class BlendSearch(Searcher):
        if space:
            add_cost_to_space(space, init_config, self._cat_hp_cost)
        self._ls = self.LocalSearch(
-            init_config, metric, mode, space, prune_attr,
-            min_resource, max_resource, reduction_factor, self.cost_attr, seed)
+            init_config,
+            metric,
+            mode,
+            space,
+            prune_attr,
+            min_resource,
+            max_resource,
+            reduction_factor,
+            self.cost_attr,
+            seed,
+        )
        if global_search_alg is not None:
            self._gs = global_search_alg
-        elif getattr(self, '__name__', None) != 'CFO':
+        elif getattr(self, "__name__", None) != "CFO":
            if space and self._ls.hierarchical:
                from functools import partial
+
                gs_space = partial(define_by_run_func, space=space)
-                evaluated_rewards = None    # not supproted by define-by-run
+                evaluated_rewards = None  # not supproted by define-by-run
            else:
                gs_space = space
            gs_seed = seed - 10 if (seed - 10) >= 0 else seed - 11 + (1 << 32)
            if experimental:
                import optuna as ot
+
                sampler = ot.samplers.TPESampler(
-                    seed=seed, multivariate=True, group=True)
+                    seed=seed, multivariate=True, group=True
+                )
            else:
                sampler = None
            try:
                self._gs = GlobalSearch(
-                    space=gs_space, metric=metric, mode=mode, seed=gs_seed,
-                    sampler=sampler, points_to_evaluate=points_to_evaluate,
-                    evaluated_rewards=evaluated_rewards)
+                    space=gs_space,
+                    metric=metric,
+                    mode=mode,
+                    seed=gs_seed,
+                    sampler=sampler,
+                    points_to_evaluate=points_to_evaluate,
+                    evaluated_rewards=evaluated_rewards,
+                )
            except ValueError:
                self._gs = GlobalSearch(
-                    space=gs_space, metric=metric, mode=mode, seed=gs_seed,
-                    sampler=sampler)
+                    space=gs_space,
+                    metric=metric,
+                    mode=mode,
+                    seed=gs_seed,
+                    sampler=sampler,
+                )
            self._gs.space = space
        else:
            self._gs = None
        self._experimental = experimental
-        if getattr(self, '__name__', None) == 'CFO' and points_to_evaluate and len(
-           self._points_to_evaluate) > 1:
+        if (
+            getattr(self, "__name__", None) == "CFO"
+            and points_to_evaluate
+            and len(self._points_to_evaluate) > 1
+        ):
            # use the best config in points_to_evaluate as the start point
            self._candidate_start_points = {}
            self._started_from_low_cost = not low_cost_partial_config
        else:
            self._candidate_start_points = None
+        self._time_budget_s, self._num_samples = time_budget_s, num_samples
        if space:
            self._init_search()

-    def set_search_properties(self,
-                              metric: Optional[str] = None,
-                              mode: Optional[str] = None,
-                              config: Optional[Dict] = None) -> bool:
+    def set_search_properties(
+        self,
+        metric: Optional[str] = None,
+        mode: Optional[str] = None,
+        config: Optional[Dict] = None,
+    ) -> bool:
        metric_changed = mode_changed = False
        if metric and self._metric != metric:
            metric_changed = True
@ -216,34 +248,54 @@ class BlendSearch(Searcher):
                self._gs.set_search_properties(metric, mode, config)
                self._gs.space = config
            if config:
-                add_cost_to_space(
-                    config, self._ls.init_config, self._cat_hp_cost)
+                add_cost_to_space(config, self._ls.init_config, self._cat_hp_cost)
            self._ls.set_search_properties(metric, mode, config)
            self._init_search()
-        elif metric_changed or mode_changed:
-            # reset search when metric or mode changed
-            self._ls.set_search_properties(metric, mode)
-            if self._gs is not None:
-                self._gs = GlobalSearch(
-                    space=self._gs._space, metric=metric, mode=mode,
-                    sampler=self._gs._sampler)
-                self._gs.space = self._ls.space
-            self._init_search()
-        if config:
-            if 'time_budget_s' in config:
-                time_budget_s = config['time_budget_s']
-                if time_budget_s is not None:
-                    self._deadline = time_budget_s + time.time()
-                    SearchThread.set_eps(time_budget_s)
-            if 'metric_target' in config:
-                self._metric_target = config.get('metric_target')
+        else:
+            if metric_changed or mode_changed:
+                # reset search when metric or mode changed
+                self._ls.set_search_properties(metric, mode)
+                if self._gs is not None:
+                    self._gs = GlobalSearch(
+                        space=self._gs._space,
+                        metric=metric,
+                        mode=mode,
+                        sampler=self._gs._sampler,
+                    )
+                    self._gs.space = self._ls.space
+                self._init_search()
+            if config:
+                # CFO doesn't need these settings
+                if "time_budget_s" in config:
+                    self._time_budget_s = config["time_budget_s"]  # budget from now
+                    now = time.time()
+                    self._time_used += now - self._start_time
+                    self._start_time = now
+                    self._set_deadline()
+                if "metric_target" in config:
+                    self._metric_target = config.get("metric_target")
+                if "num_samples" in config:
+                    self._num_samples = (
+                        config["num_samples"]
+                        + len(self._result)
+                        + len(self._trial_proposed_by)
+                    )
        return True

+    def _set_deadline(self):
+        if self._time_budget_s is not None:
+            self._deadline = self._time_budget_s + self._start_time
+            SearchThread.set_eps(self._time_budget_s)
+        else:
+            self._deadline = np.inf
+
    def _init_search(self):
-        '''initialize the search
-        '''
+        """initialize the search"""
+        self._start_time = time.time()
+        self._time_used = 0
+        self._set_deadline()
        self._is_ls_ever_converged = False
-        self._subspace = {}     # the subspace for each trial id
+        self._subspace = {}  # the subspace for each trial id
        self._metric_target = np.inf * self._ls.metric_op
        self._search_thread_pool = {
            # id: int -> thread: SearchThread
@ -253,35 +305,41 @@ class BlendSearch(Searcher):
        self._init_used = self._ls.init_config is None
        self._trial_proposed_by = {}  # trial_id: str -> thread_id: int
        self._ls_bound_min = normalize(
-            self._ls.init_config.copy(), self._ls.space, self._ls.init_config,
-            {}, recursive=True)
+            self._ls.init_config.copy(),
+            self._ls.space,
+            self._ls.init_config,
+            {},
+            recursive=True,
+        )
        self._ls_bound_max = self._ls_bound_min.copy()
        self._gs_admissible_min = self._ls_bound_min.copy()
        self._gs_admissible_max = self._ls_bound_max.copy()
        self._result = {}  # config_signature: tuple -> result: Dict
-        self._deadline = np.inf
        if self._metric_constraints:
            self._metric_constraint_satisfied = False
            self._metric_constraint_penalty = [
-                self.penalty for _ in self._metric_constraints]
+                self.penalty for _ in self._metric_constraints
+            ]
        else:
            self._metric_constraint_satisfied = True
            self._metric_constraint_penalty = None
        self.best_resource = self._ls.min_resource

    def save(self, checkpoint_path: str):
-        ''' save states to a checkpoint path
-        '''
+        """save states to a checkpoint path"""
+        self._time_used += time.time() - self._start_time
+        self._start_time = time.time()
        save_object = self
        with open(checkpoint_path, "wb") as outputFile:
            pickle.dump(save_object, outputFile)

    def restore(self, checkpoint_path: str):
-        ''' restore states from checkpoint
-        '''
+        """restore states from checkpoint"""
        with open(checkpoint_path, "rb") as inputFile:
            state = pickle.load(inputFile)
        self.__dict__ = state.__dict__
+        self._start_time = time.time()
+        self._set_deadline()

    @property
    def metric_target(self):
@ -291,10 +349,10 @@ class BlendSearch(Searcher):
    def is_ls_ever_converged(self):
        return self._is_ls_ever_converged

-    def on_trial_complete(self, trial_id: str, result: Optional[Dict] = None,
-                          error: bool = False):
-        ''' search thread updater and cleaner
-        '''
+    def on_trial_complete(
+        self, trial_id: str, result: Optional[Dict] = None, error: bool = False
+    ):
+        """search thread updater and cleaner"""
        metric_constraint_satisfied = True
        if result and not error and self._metric_constraints:
            # account for metric constraints if any
@ -304,12 +362,15 @@ class BlendSearch(Searcher):
                value = result.get(metric_constraint)
                if value:
                    # sign is <= or >=
-                    sign_op = 1 if sign == '<=' else -1
+                    sign_op = 1 if sign == "<=" else -1
                    violation = (value - threshold) * sign_op
                    if violation > 0:
                        # add penalty term to the metric
-                        objective += self._metric_constraint_penalty[
-                            i] * violation * self._ls.metric_op
+                        objective += (
+                            self._metric_constraint_penalty[i]
+                            * violation
+                            * self._ls.metric_op
+                        )
                        metric_constraint_satisfied = False
                        if self._metric_constraint_penalty[i] < self.penalty:
                            self._metric_constraint_penalty[i] += violation
@ -321,16 +382,18 @@ class BlendSearch(Searcher):
        thread_id = self._trial_proposed_by.get(trial_id)
        if thread_id in self._search_thread_pool:
            self._search_thread_pool[thread_id].on_trial_complete(
-                trial_id, result, error)
+                trial_id, result, error
+            )
            del self._trial_proposed_by[trial_id]
        if result:
-            config = result.get('config', {})
+            config = result.get("config", {})
            if not config:
                for key, value in result.items():
-                    if key.startswith('config/'):
+                    if key.startswith("config/"):
                        config[key[7:]] = value
            signature = self._ls.config_signature(
-                config, self._subspace.get(trial_id, {}))
+                config, self._subspace.get(trial_id, {})
+            )
            if error:  # remove from result cache
                del self._result[signature]
            else:  # add to result cache
@ -345,28 +408,34 @@ class BlendSearch(Searcher):
                    if not self._metric_constraint_satisfied:
                        # no point has been found to satisfy metric constraint
                        self._expand_admissible_region(
-                            self._ls_bound_min, self._ls_bound_max,
-                            self._subspace.get(trial_id, self._ls.space))
-                    if self._gs is not None and self._experimental and (
-                       not self._ls.hierarchical):
-                        self._gs.add_evaluated_point(
-                            flatten_dict(config), objective)
+                            self._ls_bound_min,
+                            self._ls_bound_max,
+                            self._subspace.get(trial_id, self._ls.space),
+                        )
+                    if (
+                        self._gs is not None
+                        and self._experimental
+                        and (not self._ls.hierarchical)
+                    ):
+                        self._gs.add_evaluated_point(flatten_dict(config), objective)
                        # TODO: recover when supported
                        # converted = convert_key(config, self._gs.space)
                        # logger.info(converted)
                        # self._gs.add_evaluated_point(converted, objective)
-                elif metric_constraint_satisfied and self._create_condition(
-                        result):
+                elif metric_constraint_satisfied and self._create_condition(result):
                    # thread creator
                    thread_id = self._thread_count
-                    self._started_from_given = self._candidate_start_points \
+                    self._started_from_given = (
+                        self._candidate_start_points
                        and trial_id in self._candidate_start_points
+                    )
                    if self._started_from_given:
                        del self._candidate_start_points[trial_id]
                    else:
                        self._started_from_low_cost = True
-                    self._create_thread(config, result, self._subspace.get(
-                        trial_id, self._ls.space))
+                    self._create_thread(
+                        config, result, self._subspace.get(trial_id, self._ls.space)
+                    )
                # reset admissible region to ls bounding box
                self._gs_admissible_min.update(self._ls_bound_min)
                self._gs_admissible_max.update(self._ls_bound_max)
@ -374,26 +443,38 @@ class BlendSearch(Searcher):
        if thread_id and thread_id in self._search_thread_pool:
            # local search thread
            self._clean(thread_id)
-        if trial_id in self._subspace and not (self._candidate_start_points
-           and trial_id in self._candidate_start_points):
+        if trial_id in self._subspace and not (
+            self._candidate_start_points and trial_id in self._candidate_start_points
+        ):
            del self._subspace[trial_id]

    def _create_thread(self, config, result, space):
        self._search_thread_pool[self._thread_count] = SearchThread(
            self._ls.mode,
            self._ls.create(
-                config, result[self._ls.metric],
-                cost=result.get(self.cost_attr, 1), space=space),
-            self.cost_attr
+                config,
+                result[self._ls.metric],
+                cost=result.get(self.cost_attr, 1),
+                space=space,
+            ),
+            self.cost_attr,
        )
        self._thread_count += 1
        self._update_admissible_region(
-            unflatten_dict(config), self._ls_bound_min, self._ls_bound_max, space,
-            self._ls.space)
+            unflatten_dict(config),
+            self._ls_bound_min,
+            self._ls_bound_max,
+            space,
+            self._ls.space,
+        )

    def _update_admissible_region(
-        self, config, admissible_min, admissible_max, subspace: Dict = {},
-        space: Dict = {}
+        self,
+        config,
+        admissible_min,
+        admissible_max,
+        subspace: Dict = {},
+        space: Dict = {},
    ):
        # update admissible region
        normalized_config = normalize(config, subspace, config, {})
@ -404,13 +485,19 @@ class BlendSearch(Searcher):
                choice = indexof(domain, value)
                self._update_admissible_region(
                    value,
-                    admissible_min[key][choice], admissible_max[key][choice],
-                    subspace[key], domain[choice]
+                    admissible_min[key][choice],
+                    admissible_max[key][choice],
+                    subspace[key],
+                    domain[choice],
                )
            elif isinstance(value, dict):
                self._update_admissible_region(
-                    value, admissible_min[key], admissible_max[key],
-                    subspace[key], space[key])
+                    value,
+                    admissible_min[key],
+                    admissible_max[key],
+                    subspace[key],
+                    space[key],
+                )
            else:
                if value > admissible_max[key]:
                    admissible_max[key] = value
@ -418,19 +505,18 @@ class BlendSearch(Searcher):
                    admissible_min[key] = value

    def _create_condition(self, result: Dict) -> bool:
-        ''' create thread condition
-        '''
+        """create thread condition"""
        if len(self._search_thread_pool) < 2:
            return True
        obj_median = np.median(
-            [thread.obj_best1 for id, thread in self._search_thread_pool.items()
-             if id])
+            [thread.obj_best1 for id, thread in self._search_thread_pool.items() if id]
+        )
        return result[self._ls.metric] * self._ls.metric_op < obj_median

    def _clean(self, thread_id: int):
-        ''' delete thread and increase admissible region if converged,
+        """delete thread and increase admissible region if converged,
        merge local threads if they are close
-        '''
+        """
        assert thread_id
        todelete = set()
        for id in self._search_thread_pool:
@ -447,8 +533,10 @@ class BlendSearch(Searcher):
            self._is_ls_ever_converged = True
            todelete.add(thread_id)
            self._expand_admissible_region(
-                self._ls_bound_min, self._ls_bound_max,
-                self._search_thread_pool[thread_id].space)
+                self._ls_bound_min,
+                self._ls_bound_max,
+                self._search_thread_pool[thread_id].space,
+            )
            if self._candidate_start_points:
                if not self._started_from_given:
                    # remove start points whose perf is worse than the converged
@ -456,7 +544,8 @@ class BlendSearch(Searcher):
                    worse = [
                        trial_id
                        for trial_id, r in self._candidate_start_points.items()
-                        if r and r[self._ls.metric] * self._ls.metric_op >= obj]
+                        if r and r[self._ls.metric] * self._ls.metric_op >= obj
+                    ]
                    # logger.info(f"remove candidate start points {worse} than {obj}")
                    for trial_id in worse:
                        del self._candidate_start_points[trial_id]
@ -472,8 +561,10 @@ class BlendSearch(Searcher):
        best_trial_id = None
        obj_best = None
        for trial_id, r in self._candidate_start_points.items():
-            if r and (best_trial_id is None
-                      or r[self._ls.metric] * self._ls.metric_op < obj_best):
+            if r and (
+                best_trial_id is None
+                or r[self._ls.metric] * self._ls.metric_op < obj_best
+            ):
                best_trial_id = trial_id
                obj_best = r[self._ls.metric] * self._ls.metric_op
        if best_trial_id:
@ -481,20 +572,22 @@ class BlendSearch(Searcher):
            config = {}
            result = self._candidate_start_points[best_trial_id]
            for key, value in result.items():
-                if key.startswith('config/'):
+                if key.startswith("config/"):
                    config[key[7:]] = value
            self._started_from_given = True
            del self._candidate_start_points[best_trial_id]
-            self._create_thread(config, result, self._subspace.get(
-                best_trial_id, self._ls.space))
+            self._create_thread(
+                config, result, self._subspace.get(best_trial_id, self._ls.space)
+            )

    def _expand_admissible_region(self, lower, upper, space):
        for key in upper:
            ub = upper[key]
            if isinstance(ub, list):
-                choice = space[key]['_choice_']
+                choice = space[key]["_choice_"]
                self._expand_admissible_region(
-                    lower[key][choice], upper[key][choice], space[key])
+                    lower[key][choice], upper[key][choice], space[key]
+                )
            elif isinstance(ub, dict):
                self._expand_admissible_region(lower[key], ub, space[key])
            else:
@ -502,8 +595,7 @@ class BlendSearch(Searcher):
                lower[key] -= self._ls.STEPSIZE

    def _inferior(self, id1: int, id2: int) -> bool:
-        ''' whether thread id1 is inferior to id2
-        '''
+        """whether thread id1 is inferior to id2"""
        t1 = self._search_thread_pool[id1]
        t2 = self._search_thread_pool[id2]
        if t1.obj_best1 < t2.obj_best2:
@ -515,8 +607,7 @@ class BlendSearch(Searcher):
        return False

    def on_trial_result(self, trial_id: str, result: Dict):
-        ''' receive intermediate result
-        '''
+        """receive intermediate result"""
        if trial_id not in self._trial_proposed_by:
            return
        thread_id = self._trial_proposed_by[trial_id]
@ -527,8 +618,7 @@ class BlendSearch(Searcher):
        self._search_thread_pool[thread_id].on_trial_result(trial_id, result)

    def suggest(self, trial_id: str) -> Optional[Dict]:
-        ''' choose thread, suggest a valid config
-        '''
+        """choose thread, suggest a valid config"""
        if self._init_used and not self._points_to_evaluate:
            choice, backup = self._select_thread()
            # if choice < 0:  # timeout
@ -540,8 +630,10 @@ class BlendSearch(Searcher):
                # local search thread finishes
                if self._search_thread_pool[choice].converged:
                    self._expand_admissible_region(
-                        self._ls_bound_min, self._ls_bound_max,
-                        self._search_thread_pool[choice].space)
+                        self._ls_bound_min,
+                        self._ls_bound_max,
+                        self._search_thread_pool[choice].space,
+                    )
                    del self._search_thread_pool[choice]
                return None
            # preliminary check; not checking config validation
@ -558,8 +650,12 @@ class BlendSearch(Searcher):
                    return None
                use_rs = 1
            if choice or self._valid(
-               config, self._ls.space, space, self._gs_admissible_min,
-               self._gs_admissible_max):
+                config,
+                self._ls.space,
+                space,
+                self._gs_admissible_min,
+                self._gs_admissible_max,
+            ):
                # LS or valid or no backup choice
                self._trial_proposed_by[trial_id] = choice
                self._search_thread_pool[choice].running += use_rs
@ -568,7 +664,8 @@ class BlendSearch(Searcher):
                    # use CFO's init point
                    init_config = self._ls.init_config
                    config, space = self._ls.complete_config(
-                        init_config, self._ls_bound_min, self._ls_bound_max)
+                        init_config, self._ls_bound_min, self._ls_bound_max
+                    )
                    self._trial_proposed_by[trial_id] = choice
                    self._search_thread_pool[choice].running += 1
                else:
@ -583,12 +680,20 @@ class BlendSearch(Searcher):
            if not choice:  # global search
                # temporarily relax admissible region for parallel proposals
                self._update_admissible_region(
-                    config, self._gs_admissible_min, self._gs_admissible_max,
-                    space, self._ls.space)
+                    config,
+                    self._gs_admissible_min,
+                    self._gs_admissible_max,
+                    space,
+                    self._ls.space,
+                )
            else:
                self._update_admissible_region(
-                    config, self._ls_bound_min, self._ls_bound_max, space,
-                    self._ls.space)
+                    config,
+                    self._ls_bound_min,
+                    self._ls_bound_max,
+                    space,
+                    self._ls.space,
+                )
                self._gs_admissible_min.update(self._ls_bound_min)
                self._gs_admissible_max.update(self._ls_bound_max)
            signature = self._ls.config_signature(config, space)
@ -605,7 +710,8 @@ class BlendSearch(Searcher):
            else:
                init_config = self._ls.init_config
            config, space = self._ls.complete_config(
-                init_config, self._ls_bound_min, self._ls_bound_max)
+                init_config, self._ls_bound_min, self._ls_bound_max
+            )
            if reward is None:
                config_signature = self._ls.config_signature(config, space)
                result = self._result.get(config_signature)
@ -620,18 +726,15 @@ class BlendSearch(Searcher):
            self._search_thread_pool[0].running += 1
            self._subspace[trial_id] = space
            if reward is not None:
-                result = {
-                    self._metric: reward, self.cost_attr: 1,
-                    'config': config
-                }
+                result = {self._metric: reward, self.cost_attr: 1, "config": config}
                self.on_trial_complete(trial_id, result)
                return None
        return config

    def _should_skip(self, choice, trial_id, config, space) -> bool:
-        ''' if config is None or config's result is known or constraints are violated
-            return True; o.w. return False
-        '''
+        """if config is None or config's result is known or constraints are violated
+        return True; o.w. return False
+        """
        if config is None:
            return True
        config_signature = self._ls.config_signature(config, space)
@ -641,11 +744,15 @@ class BlendSearch(Searcher):
            for constraint in self._config_constraints:
                func, sign, threshold = constraint
                value = func(config)
-                if (sign == '<=' and value > threshold
-                        or sign == '>=' and value < threshold):
+                if (
+                    sign == "<="
+                    and value > threshold
+                    or sign == ">="
+                    and value < threshold
+                ):
                    self._result[config_signature] = {
                        self._metric: np.inf * self._ls.metric_op,
-                        'time_total_s': 1,
+                        "time_total_s": 1,
                    }
                    exists = True
                    break
@ -654,7 +761,8 @@ class BlendSearch(Searcher):
                result = self._result.get(config_signature)
                if result:  # finished
                    self._search_thread_pool[choice].on_trial_complete(
-                        trial_id, result, error=False)
+                        trial_id, result, error=False
+                    )
                    if choice:
                        # local search thread
                        self._clean(choice)
@ -666,14 +774,23 @@ class BlendSearch(Searcher):
        return False

    def _select_thread(self) -> Tuple:
-        ''' thread selector; use can_suggest to check LS availability
-        '''
+        """thread selector; use can_suggest to check LS availability"""
        # update priority
-        min_eci = self._deadline - time.time()
+        now = time.time()
+        min_eci = self._deadline - now
        if min_eci <= 0:
            # return -1, -1
            # keep proposing new configs assuming no budget left
            min_eci = 0
+        elif self._num_samples and self._num_samples > 0:
+            # estimate time left according to num_samples limitation
+            num_finished = len(self._result)
+            num_proposed = num_finished + len(self._trial_proposed_by)
+            num_left = max(self._num_samples - num_proposed, 0)
+            if num_proposed > 0:
+                time_used = now - self._start_time + self._time_used
+                min_eci = min(min_eci, time_used / num_finished * num_left)
+            # print(f"{min_eci}, {time_used / num_finished * num_left}, {num_finished}, {num_left}")
        max_speed = 0
        for thread in self._search_thread_pool.values():
            if thread.speed > max_speed:
@ -698,10 +815,10 @@ class BlendSearch(Searcher):
                    backup_thread_id = thread_id
        return top_thread_id, backup_thread_id

-    def _valid(self, config: Dict, space: Dict, subspace: Dict,
-               lower: Dict, upper: Dict) -> bool:
-        ''' config validator
-        '''
+    def _valid(
+        self, config: Dict, space: Dict, subspace: Dict, lower: Dict, upper: Dict
+    ) -> bool:
+        """config validator"""
        normalized_config = normalize(config, subspace, config, {})
        for key, lb in lower.items():
            if key in config:
@ -719,114 +836,143 @@ class BlendSearch(Searcher):
                else:
                    nestedspace = None
                if nestedspace:
-                    valid = self._valid(
-                        value, domain, nestedspace, lb, ub)
+                    valid = self._valid(value, domain, nestedspace, lb, ub)
                    if not valid:
                        return False
-                elif (value + self._ls.STEPSIZE < lower[key]
-                      or value > upper[key] + self._ls.STEPSIZE):
+                elif (
+                    value + self._ls.STEPSIZE < lower[key]
+                    or value > upper[key] + self._ls.STEPSIZE
+                ):
                    return False
        return True


 try:
    from ray import __version__ as ray_version
-    assert ray_version >= '1.0.0'
-    from ray.tune import (uniform, quniform, choice, randint, qrandint, randn,
-                          qrandn, loguniform, qloguniform)
+
+    assert ray_version >= "1.0.0"
+    from ray.tune import (
+        uniform,
+        quniform,
+        choice,
+        randint,
+        qrandint,
+        randn,
+        qrandn,
+        loguniform,
+        qloguniform,
+    )
 except (ImportError, AssertionError):
-    from ..tune.sample import (uniform, quniform, choice, randint, qrandint, randn,
-                               qrandn, loguniform, qloguniform)
+    from ..tune.sample import (
+        uniform,
+        quniform,
+        choice,
+        randint,
+        qrandint,
+        randn,
+        qrandn,
+        loguniform,
+        qloguniform,
+    )

 try:
    from nni.tuner import Tuner as NNITuner
    from nni.utils import extract_scalar_reward
 except ImportError:
+
    class NNITuner:
        pass

    def extract_scalar_reward(x: Dict):
-        return x.get('reward')
+        return x.get("reward")


 class BlendSearchTuner(BlendSearch, NNITuner):
-    '''Tuner class for NNI
-    '''
+    """Tuner class for NNI"""

-    def receive_trial_result(self, parameter_id, parameters, value,
-                             **kwargs):
-        '''
+    def receive_trial_result(self, parameter_id, parameters, value, **kwargs):
+        """
        Receive trial's final result.
        parameter_id: int
        parameters: object created by 'generate_parameters()'
        value: final metrics of the trial, including default metric
-        '''
+        """
        result = {
-            'config': parameters, self._metric: extract_scalar_reward(value),
-            self.cost_attr: 1 if isinstance(value, float) else value.get(
-                self.cost_attr, value.get('sequence', 1))
+            "config": parameters,
+            self._metric: extract_scalar_reward(value),
+            self.cost_attr: 1
+            if isinstance(value, float)
+            else value.get(self.cost_attr, value.get("sequence", 1))
            # if nni does not report training cost,
            # using sequence as an approximation.
            # if no sequence, using a constant 1
        }
        self.on_trial_complete(str(parameter_id), result)
+
    ...

    def generate_parameters(self, parameter_id, **kwargs) -> Dict:
-        '''
+        """
        Returns a set of trial (hyper-)parameters, as a serializable object
        parameter_id: int
-        '''
+        """
        return self.suggest(str(parameter_id))
+
    ...

    def update_search_space(self, search_space):
-        '''
+        """
        Tuners are advised to support updating search space at run-time.
        If a tuner can only set search space once before generating first hyper-parameters,
        it should explicitly document this behaviour.
        search_space: JSON object created by experiment owner
-        '''
+        """
        config = {}
        for key, value in search_space.items():
            v = value.get("_value")
-            _type = value['_type']
-            if _type == 'choice':
+            _type = value["_type"]
+            if _type == "choice":
                config[key] = choice(v)
-            elif _type == 'randint':
+            elif _type == "randint":
                config[key] = randint(*v)
-            elif _type == 'uniform':
+            elif _type == "uniform":
                config[key] = uniform(*v)
-            elif _type == 'quniform':
+            elif _type == "quniform":
                config[key] = quniform(*v)
-            elif _type == 'loguniform':
+            elif _type == "loguniform":
                config[key] = loguniform(*v)
-            elif _type == 'qloguniform':
+            elif _type == "qloguniform":
                config[key] = qloguniform(*v)
-            elif _type == 'normal':
+            elif _type == "normal":
                config[key] = randn(*v)
-            elif _type == 'qnormal':
+            elif _type == "qnormal":
                config[key] = qrandn(*v)
            else:
-                raise ValueError(
-                    f'unsupported type in search_space {_type}')
+                raise ValueError(f"unsupported type in search_space {_type}")
        add_cost_to_space(config, {}, {})
        self._ls = self.LocalSearch(
-            {}, self._ls.metric, self._mode, config, cost_attr=self.cost_attr,
-            seed=self._ls.seed)
+            {},
+            self._ls.metric,
+            self._mode,
+            config,
+            cost_attr=self.cost_attr,
+            seed=self._ls.seed,
+        )
        if self._gs is not None:
            self._gs = GlobalSearch(
-                space=config, metric=self._metric, mode=self._mode,
-                sampler=self._gs._sampler)
+                space=config,
+                metric=self._metric,
+                mode=self._mode,
+                sampler=self._gs._sampler,
+            )
            self._gs.space = config
        self._init_search()


 class CFO(BlendSearchTuner):
-    ''' class for CFO algorithm
-    '''
+    """class for CFO algorithm"""

-    __name__ = 'CFO'
+    __name__ = "CFO"

    def suggest(self, trial_id: str) -> Optional[Dict]:
        # Number of threads is 1 or 2. Thread 0 is a vacuous thread
@ -843,8 +989,7 @@ class CFO(BlendSearchTuner):
                return key, key

    def _create_condition(self, result: Dict) -> bool:
-        ''' create thread condition
-        '''
+        """create thread condition"""
        if self._points_to_evaluate:
            # still evaluating user-specified init points
            # we evaluate all candidate start points before we
@ -856,16 +1001,18 @@ class CFO(BlendSearchTuner):
            # result needs to match or exceed the best candidate start point
            obj_best = min(
                self._ls.metric_op * r[self._ls.metric]
-                for r in self._candidate_start_points.values() if r)
+                for r in self._candidate_start_points.values()
+                if r
+            )
            return result[self._ls.metric] * self._ls.metric_op <= obj_best
        else:
            return True

-    def on_trial_complete(self, trial_id: str, result: Optional[Dict] = None,
-                          error: bool = False):
+    def on_trial_complete(
+        self, trial_id: str, result: Optional[Dict] = None, error: bool = False
+    ):
        super().on_trial_complete(trial_id, result, error)
-        if self._candidate_start_points \
-           and trial_id in self._candidate_start_points:
+        if self._candidate_start_points and trial_id in self._candidate_start_points:
            # the trial is a candidate start point
            self._candidate_start_points[trial_id] = result
            if len(self._search_thread_pool) < 2 and not self._points_to_evaluate:
--- a/flaml/tune/tune.py
+++ b/flaml/tune/tune.py
@ -83,8 +83,6 @@ def report(_metric=None, **kwargs):
        return tune.report(_metric, **kwargs)
    else:
        result = kwargs
-        if _verbose == 2:
-            logger.info(f"result: {kwargs}")
        if _metric:
            result[DEFAULT_METRIC] = _metric
        trial = _runner.running_trial
@ -114,7 +112,7 @@ def run(
    cat_hp_cost: Optional[dict] = None,
    metric: Optional[str] = None,
    mode: Optional[str] = None,
-    time_budget_s: Union[int, float, datetime.timedelta] = None,
+    time_budget_s: Union[int, float] = None,
    points_to_evaluate: Optional[List[dict]] = None,
    evaluated_rewards: Optional[List] = None,
    prune_attr: Optional[str] = None,
@ -184,7 +182,7 @@ def run(
        metric: A string of the metric name to optimize for.
        mode: A string in ['min', 'max'] to specify the objective as
            minimization or maximization.
-        time_budget_s: A float of the time budget in seconds.
+        time_budget_s: int or float | The time budget in seconds.
        points_to_evaluate: A list of initial hyperparameter
            configurations to run first.
        evaluated_rewards (list): If you have previously evaluated the
@ -291,6 +289,8 @@ def run(
            evaluated_rewards=evaluated_rewards,
            low_cost_partial_config=low_cost_partial_config,
            cat_hp_cost=cat_hp_cost,
+            time_budget_s=time_budget_s,
+            num_samples=num_samples,
            prune_attr=prune_attr,
            min_resource=min_resource,
            max_resource=max_resource,
@ -303,10 +303,12 @@ def run(
        if metric is None or mode is None:
            metric = metric or search_alg.metric
            mode = mode or search_alg.mode
-    if time_budget_s:
-        search_alg.set_search_properties(
-            None, None, config={"time_budget_s": time_budget_s}
-        )
+        if time_budget_s or num_samples > 0:
+            search_alg.set_search_properties(
+                None,
+                None,
+                config={"time_budget_s": time_budget_s, "num_samples": num_samples},
+            )
    scheduler = None
    if report_intermediate_result:
        params = {}
--- a/test/test_restore.py
+++ b/test/test_restore.py
@ -6,7 +6,6 @@ import numpy as np
 from flaml.searcher.suggestion import ConcurrencyLimiter
 from flaml import tune
 from flaml import CFO
-from flaml import BlendSearch


 class AbstractWarmStartTest:
@ -27,28 +26,24 @@ class AbstractWarmStartTest:
        search_alg, cost = self.set_basic_conf()
        search_alg = ConcurrencyLimiter(search_alg, 1)
        results_exp_1 = tune.run(
-            cost,
-            num_samples=5,
-            search_alg=search_alg,
-            verbose=0,
-            local_dir=self.tmpdir)
+            cost, num_samples=5, search_alg=search_alg, verbose=0, local_dir=self.tmpdir
+        )
        checkpoint_path = os.path.join(self.tmpdir, self.experiment_name)
        search_alg.save(checkpoint_path)
        return results_exp_1, np.random.get_state(), checkpoint_path

    def run_explicit_restore(self, random_state, checkpoint_path):
-        np.random.set_state(random_state)
        search_alg2, cost = self.set_basic_conf()
        search_alg2 = ConcurrencyLimiter(search_alg2, 1)
        search_alg2.restore(checkpoint_path)
+        np.random.set_state(random_state)
        return tune.run(cost, num_samples=5, search_alg=search_alg2, verbose=0)

    def run_full(self):
        np.random.seed(162)
        search_alg3, cost = self.set_basic_conf()
        search_alg3 = ConcurrencyLimiter(search_alg3, 1)
-        return tune.run(
-            cost, num_samples=10, search_alg=search_alg3, verbose=0)
+        return tune.run(cost, num_samples=10, search_alg=search_alg3, verbose=0)

    def testReproduce(self):
        results_exp_1, _, _ = self.run_part_from_scratch()
@ -75,7 +70,7 @@ class CFOWarmStartTest(AbstractWarmStartTest, unittest.TestCase):
        }

        def cost(param):
-            tune.report(loss=(param["height"] - 14)**2 - abs(param["width"] - 3))
+            tune.report(loss=(param["height"] - 14) ** 2 - abs(param["width"] - 3))

        search_alg = CFO(
            space=space,
@ -86,6 +81,7 @@ class CFOWarmStartTest(AbstractWarmStartTest, unittest.TestCase):

        return search_alg, cost

+
 # # # Not doing test for BS because of problems with random seed in OptunaSearch
 # class BlendsearchWarmStartTest(AbstractWarmStartTest, unittest.TestCase):
 #     def set_basic_conf(self):