feat: add asynchronous decentralized bayesian optimization (#145)

mlr-org · Nov 15, 2024 · bbb91c3 · bbb91c3
1 parent ddbb5ef
commit bbb91c3
Show file tree

Hide file tree

Showing 86 changed files with 3,665 additions and 184 deletions.
diff --git a/.lintr b/.lintr
@@ -5,5 +5,6 @@ linters: linters_with_defaults(
     object_name_linter = object_name_linter(c("snake_case", "CamelCase")), # only allow snake case and camel case object names
     cyclocomp_linter = NULL, # do not check function complexity
     commented_code_linter = NULL, # allow code in comments
-    line_length_linter = line_length_linter(120)
+    line_length_linter = line_length_linter(120),
+    indentation_linter(indent = 2L, hanging_indent_style = "never")
     )
diff --git a/DESCRIPTION b/DESCRIPTION
@@ -39,16 +39,16 @@ License: LGPL-3
 URL: https://mlr3mbo.mlr-org.com, https://github.com/mlr-org/mlr3mbo
 BugReports: https://github.com/mlr-org/mlr3mbo/issues
 Depends:
+    mlr3tuning (>= 1.1.0),
     R (>= 3.1.0)
 Imports:
     bbotk (>= 1.2.0),
     checkmate (>= 2.0.0),
     data.table,
     lgr (>= 0.3.4),
-    mlr3 (>= 0.21.0),
+    mlr3 (>= 0.21.1),
     mlr3misc (>= 0.11.0),
-    mlr3tuning (>= 1.0.2),
-    paradox (>= 1.0.0),
+    paradox (>= 1.0.1),
     spacefillr,
     R6 (>= 2.4.1)
 Suggests:
@@ -62,6 +62,8 @@ Suggests:
     ranger,
     rgenoud,
     rpart,
+    redux,
+    rush,
     stringi,
     testthat (>= 3.0.0)
 ByteCompile: no
@@ -85,8 +87,12 @@ Collate:
     'AcqFunctionPI.R'
     'AcqFunctionSD.R'
     'AcqFunctionSmsEgo.R'
+    'AcqFunctionStochasticCB.R'
+    'AcqFunctionStochasticEI.R'
     'AcqOptimizer.R'
     'aaa.R'
+    'OptimizerADBO.R'
+    'OptimizerAsyncMbo.R'
     'OptimizerMbo.R'
     'mlr_result_assigners.R'
     'ResultAssigner.R'
@@ -95,6 +101,8 @@ Collate:
     'Surrogate.R'
     'SurrogateLearner.R'
     'SurrogateLearnerCollection.R'
+    'TunerADBO.R'
+    'TunerAsyncMbo.R'
     'TunerMbo.R'
     'mlr_loop_functions.R'
     'bayesopt_ego.R'

diff --git a/NAMESPACE b/NAMESPACE
@@ -16,14 +16,20 @@ export(AcqFunctionMulti)
 export(AcqFunctionPI)
 export(AcqFunctionSD)
 export(AcqFunctionSmsEgo)
+export(AcqFunctionStochasticCB)
+export(AcqFunctionStochasticEI)
 export(AcqOptimizer)
+export(OptimizerADBO)
+export(OptimizerAsyncMbo)
 export(OptimizerMbo)
 export(ResultAssigner)
 export(ResultAssignerArchive)
 export(ResultAssignerSurrogate)
 export(Surrogate)
 export(SurrogateLearner)
 export(SurrogateLearnerCollection)
+export(TunerADBO)
+export(TunerAsyncMbo)
 export(TunerMbo)
 export(acqf)
 export(acqfs)
@@ -58,6 +64,7 @@ importFrom(R6,R6Class)
 importFrom(stats,dnorm)
 importFrom(stats,pnorm)
 importFrom(stats,quantile)
+importFrom(stats,rexp)
 importFrom(stats,runif)
 importFrom(stats,setNames)
 importFrom(utils,bibentry)

diff --git a/NEWS.md b/NEWS.md
@@ -1,5 +1,11 @@
 # mlr3mbo (development version)
 
+* refactor: refactored `SurrogateLearner` and `SurrogateLearnerCollection` to allow updating on an asynchronous `Archive`
+* feat: added experimental `OptimizerAsyncMbo`, `OptimizerADBO`, `TunerAsyncMbo`, and `TunerADBO` that allow for asynchronous optimization
+* feat: added `AcqFunctionStochasticCB` and `AcqFunctionStochasticEI` that are useful for asynchronous optimization
+* doc: minor changes to highlight differences between batch and asynchronous objects related to asynchronous support
+* refactor: `AcqFunction`s and `AcqOptimizer` gained a `reset()` method.
+
 # mlr3mbo 0.2.6
 
 * refactor: Extract internal tuned values in instance.

diff --git a/R/AcqFunction.R b/R/AcqFunction.R
@@ -73,6 +73,14 @@ AcqFunction = R6Class("AcqFunction",
       # FIXME: at some point we may want to make this an AB to a private$.update
     },
 
+    #' @description
+    #' Reset the acquisition function.
+    #'
+    #' Can be implemented by subclasses.
+    reset = function() {
+      # FIXME: at some point we may want to make this an AB to a private$.reset
+    },
+
     #' @description
     #' Evaluates multiple input values on the objective function.
     #'

diff --git a/R/AcqFunctionMulti.R b/R/AcqFunctionMulti.R
@@ -16,7 +16,7 @@
 #' If acquisition functions have not been initialized with a surrogate, the surrogate passed during construction or lazy initialization
 #' will be used for all acquisition functions.
 #'
-#' For optimization, [AcqOptimizer] can be used as for any other [AcqFunction], however, the [bbotk::Optimizer] wrapped within the [AcqOptimizer]
+#' For optimization, [AcqOptimizer] can be used as for any other [AcqFunction], however, the [bbotk::OptimizerBatch] wrapped within the [AcqOptimizer]
 #' must support multi-objective optimization as indicated via the `multi-crit` property.
 #'
 #' @family Acquisition Function

diff --git a/R/AcqFunctionSmsEgo.R b/R/AcqFunctionSmsEgo.R
@@ -18,6 +18,11 @@
 #'   In the case of being `NULL`, an epsilon vector is maintained dynamically as
 #'   described in Horn et al. (2015).
 #'
+#' @section Note:
+#' * This acquisition function always also returns its current epsilon values in a list column (`acq_epsilon`).
+#'   These values will be logged into the [bbotk::ArchiveBatch] of the [bbotk::OptimInstanceBatch] of the [AcqOptimizer] and
+#'   therefore also in the [bbotk::Archive] of the actual [bbotk::OptimInstance] that is to be optimized.
+#'
 #' @references
 #' * `r format_bib("ponweiser_2008")`
 #' * `r format_bib("horn_2015")`
@@ -78,7 +83,7 @@ AcqFunctionSmsEgo = R6Class("AcqFunctionSmsEgo",
 
     #' @field progress (`numeric(1)`)\cr
     #'   Optimization progress (typically, the number of function evaluations left).
-    #'   Note that this requires the [bbotk::OptimInstance] to be terminated via a [bbotk::TerminatorEvals].
+    #'   Note that this requires the [bbotk::OptimInstanceBatch] to be terminated via a [bbotk::TerminatorEvals].
     progress = NULL,
 
     #' @description
@@ -94,7 +99,7 @@ AcqFunctionSmsEgo = R6Class("AcqFunctionSmsEgo",
 
       constants = ps(
         lambda = p_dbl(lower = 0, default = 1),
-        epsilon = p_dbl(lower = 0, default = NULL, special_vals = list(NULL))  # for NULL, it will be calculated dynamically
+        epsilon = p_dbl(lower = 0, default = NULL, special_vals = list(NULL))  # if NULL, it will be calculated dynamically
       )
       constants$values$lambda = lambda
       constants$values$epsilon = epsilon
@@ -140,6 +145,13 @@ AcqFunctionSmsEgo = R6Class("AcqFunctionSmsEgo",
       } else {
         self$epsilon = self$constants$values$epsilon
       }
+    },
+
+    #' @description
+    #' Reset the acquisition function.
+    #' Resets `epsilon`.
+    reset = function() {
+      self$epsilon = NULL
     }
   ),
 
@@ -163,7 +175,7 @@ AcqFunctionSmsEgo = R6Class("AcqFunctionSmsEgo",
       # allocate memory for adding points to front for HV calculation in C
       front2 = t(rbind(self$ys_front, 0))
       sms = .Call("c_sms_indicator", PACKAGE = "mlr3mbo", cbs, self$ys_front, front2, self$epsilon, self$ref_point)  # note that the negative indicator is returned from C
-      data.table(acq_smsego = sms)
+      data.table(acq_smsego = sms, acq_epsilon = list(self$epsilon))
     }
   )
 )

diff --git a/R/AcqFunctionStochasticCB.R b/R/AcqFunctionStochasticCB.R
@@ -0,0 +1,188 @@
+#' @title Acquisition Function Stochastic Confidence Bound
+#'
+#' @include AcqFunction.R
+#' @name mlr_acqfunctions_stochastic_cb
+#'
+#' @templateVar id stochastic_cb
+#' @template section_dictionary_acqfunctions
+#'
+#' @description
+#' Lower / Upper Confidence Bound with lambda sampling and decay.
+#' The initial \eqn{\lambda} is drawn from an uniform distribution between `min_lambda` and `max_lambda` or from an exponential distribution with rate `1 / lambda`.
+#' \eqn{\lambda} is updated after each update by the formula `lambda * exp(-rate * (t %% period))`, where `t` is the number of times the acquisition function has been updated.
+#'
+#' While this acquisition function usually would be used within an asynchronous optimizer, e.g., [OptimizerAsyncMbo],
+#' it can in principle also be used in synchronous optimizers, e.g., [OptimizerMbo].
+#'
+#' @section Parameters:
+#' * `"lambda"` (`numeric(1)`)\cr
+#'   \eqn{\lambda} value for sampling from the exponential distribution.
+#'   Defaults to `1.96`.
+#' * `"min_lambda"` (`numeric(1)`)\cr
+#'   Minimum value of \eqn{\lambda}for sampling from the uniform distribution.
+#'   Defaults to `0.01`.
+#' * `"max_lambda"` (`numeric(1)`)\cr
+#'   Maximum value of \eqn{\lambda} for sampling from the uniform distribution.
+#'   Defaults to `10`.
+#' * `"distribution"` (`character(1)`)\cr
+#'   Distribution to sample \eqn{\lambda} from.
+#'   One of `c("uniform", "exponential")`.
+#'   Defaults to `uniform`.
+#' * `"rate"` (`numeric(1)`)\cr
+#'   Rate of the exponential decay.
+#'   Defaults to `0` i.e. no decay.
+#' * `"period"` (`integer(1)`)\cr
+#'   Period of the exponential decay.
+#'   Defaults to `NULL`, i.e., the decay has no period.
+#'
+#' @section Note:
+#' * This acquisition function always also returns its current (`acq_lambda`) and original (`acq_lambda_0`) \eqn{\lambda}.
+#'   These values will be logged into the [bbotk::ArchiveBatch] of the [bbotk::OptimInstanceBatch] of the [AcqOptimizer] and
+#'   therefore also in the [bbotk::Archive] of the actual [bbotk::OptimInstance] that is to be optimized.
+#'
+#' @references
+#' * `r format_bib("snoek_2012")`
+#' * `r format_bib("egele_2023")`
+#'
+#' @family Acquisition Function
+#' @export
+#' @examples
+#' if (requireNamespace("mlr3learners") &
+#'     requireNamespace("DiceKriging") &
+#'     requireNamespace("rgenoud")) {
+#'   library(bbotk)
+#'   library(paradox)
+#'   library(mlr3learners)
+#'   library(data.table)
+#'
+#'   fun = function(xs) {
+#'     list(y = xs$x ^ 2)
+#'   }
+#'   domain = ps(x = p_dbl(lower = -10, upper = 10))
+#'   codomain = ps(y = p_dbl(tags = "minimize"))
+#'   objective = ObjectiveRFun$new(fun = fun, domain = domain, codomain = codomain)
+#'
+#'   instance = OptimInstanceBatchSingleCrit$new(
+#'     objective = objective,
+#'     terminator = trm("evals", n_evals = 5))
+#'
+#'   instance$eval_batch(data.table(x = c(-6, -5, 3, 9)))
+#'
+#'   learner = default_gp()
+#'
+#'   surrogate = srlrn(learner, archive = instance$archive)
+#'
+#'   acq_function = acqf("stochastic_cb", surrogate = surrogate, lambda = 3)
+#'
+#'   acq_function$surrogate$update()
+#'   acq_function$update()
+#'   acq_function$eval_dt(data.table(x = c(-1, 0, 1)))
+#' }
+AcqFunctionStochasticCB = R6Class("AcqFunctionStochasticCB",
+  inherit = AcqFunction,
+
+  public = list(
+
+    #' @description
+    #' Creates a new instance of this [R6][R6::R6Class] class.
+    #'
+    #' @param surrogate (`NULL` | [SurrogateLearner]).
+    #' @param lambda (`numeric(1)`).
+    #' @param min_lambda (`numeric(1)`).
+    #' @param max_lambda (`numeric(1)`).
+    #' @param distribution (`character(1)`).
+    #' @param rate (`numeric(1)`).
+    #' @param period (`NULL` | `integer(1)`).
+    initialize = function(
+      surrogate = NULL,
+      lambda = 1.96,
+      min_lambda = 0.01,
+      max_lambda = 10,
+      distribution = "uniform",
+      rate = 0,
+      period = NULL
+      ) {
+      assert_r6(surrogate, "SurrogateLearner", null.ok = TRUE)
+      private$.lambda = assert_number(lambda, lower = .Machine$double.neg.eps, null.ok = TRUE)
+      private$.min_lambda = assert_number(min_lambda, lower = .Machine$double.neg.eps, null.ok = TRUE)
+      private$.max_lambda = assert_number(max_lambda, lower = .Machine$double.neg.eps, null.ok = TRUE)
+      private$.distribution = assert_choice(distribution, choices = c("uniform", "exponential"))
+
+      if (private$.distribution == "uniform" && (is.null(private$.min_lambda) || is.null(private$.max_lambda))) {
+        stop('If `distribution` is "uniform", `min_lambda` and `max_lambda` must be set.')
+      }
+
+      if (private$.distribution == "exponential" && is.null(private$.lambda)) {
+        stop('If `distribution` is "exponential", `lambda` must be set.')
+      }
+
+      private$.rate = assert_number(rate, lower = 0)
+      private$.period = assert_int(period, lower = 1, null.ok = TRUE)
+
+      constants = ps(lambda = p_dbl(lower = 0))
+
+      super$initialize("acq_cb",
+        constants = constants,
+        surrogate = surrogate,
+        requires_predict_type_se = TRUE,
+        direction = "same",
+        label = "Stochastic Lower / Upper Confidence Bound",
+        man = "mlr3mbo::mlr_acqfunctions_stochastic_cb")
+    },
+
+    #' @description
+    #' Update the acquisition function.
+    #' Samples and decays lambda.
+    update = function() {
+      # sample lambda
+      if (is.null(self$constants$values$lambda)) {
+
+        if (private$.distribution == "uniform") {
+          lambda = runif(1, private$.min_lambda, private$.max_lambda)
+        } else {
+          lambda = rexp(1, 1 / private$.lambda)
+        }
+
+        private$.lambda_0 = lambda
+        self$constants$values$lambda = lambda
+      }
+
+      # decay lambda
+      if (private$.rate > 0) {
+        lambda_0 = private$.lambda_0
+        period = private$.period
+        t = if (is.null(period)) private$.t else private$.t %% period
+        rate = private$.rate
+
+        self$constants$values$lambda = lambda_0 * exp(-rate * t)
+        private$.t = t + 1L
+      }
+    },
+
+    #' @description
+    #' Reset the acquisition function.
+    #' Resets the private update counter `.t` used within the epsilon decay.
+    reset = function() {
+      private$.t = 0L
+    }
+  ),
+
+  private = list(
+    .lambda = NULL,
+    .min_lambda = NULL,
+    .max_lambda = NULL,
+    .distribution = NULL,
+    .rate = NULL,
+    .period = NULL,
+    .lambda_0 = NULL,
+    .t = 0L,
+    .fun = function(xdt, lambda) {
+      p = self$surrogate$predict(xdt)
+      cb = p$mean - self$surrogate_max_to_min * lambda * p$se
+      data.table(acq_cb = cb,  acq_lambda = lambda, acq_lambda_0 = private$.lambda_0)
+    }
+  )
+)
+
+mlr_acqfunctions$add("stochastic_cb", AcqFunctionStochasticCB)
+