|
| 1 | +//! Egor optimizer implements EGO algorithm with basic handling of constraints. |
| 2 | +//! |
| 3 | +//! ```no_run |
| 4 | +//! # use ndarray::{array, Array2, ArrayView1, ArrayView2, Zip}; |
| 5 | +//! # use egobox_doe::{Lhs, SamplingMethod}; |
| 6 | +//! # use egobox_ego::{EgorBuilder, InfillStrategy, InfillOptimizer}; |
| 7 | +//! |
| 8 | +//! # use rand_xoshiro::Xoshiro256Plus; |
| 9 | +//! # use ndarray_rand::rand::SeedableRng; |
| 10 | +//! use argmin_testfunctions::rosenbrock; |
| 11 | +//! |
| 12 | +//! // Rosenbrock test function: minimum y_opt = 0 at x_opt = (1, 1) |
| 13 | +//! fn rosenb(x: &ArrayView2<f64>) -> Array2<f64> { |
| 14 | +//! let mut y: Array2<f64> = Array2::zeros((x.nrows(), 1)); |
| 15 | +//! Zip::from(y.rows_mut()) |
| 16 | +//! .and(x.rows()) |
| 17 | +//! .par_for_each(|mut yi, xi| yi.assign(&array![rosenbrock(&xi.to_vec(), 1., 100.)])); |
| 18 | +//! y |
| 19 | +//! } |
| 20 | +//! |
| 21 | +//! let xlimits = array![[-2., 2.], [-2., 2.]]; |
| 22 | +//! let res = EgorBuilder::optimize(rosenb) |
| 23 | +//! .min_within(&xlimits) |
| 24 | +//! .infill_strategy(InfillStrategy::EI) |
| 25 | +//! .n_doe(10) |
| 26 | +//! .target(1e-1) |
| 27 | +//! .n_iter(30) |
| 28 | +//! .run() |
| 29 | +//! .expect("Rosenbrock minimization"); |
| 30 | +//! println!("Rosenbrock min result = {:?}", res); |
| 31 | +//! ``` |
| 32 | +//! |
| 33 | +//! Constraints are expected to be evaluated with the objective function |
| 34 | +//! meaning that the function passed to the optimizer has to return |
| 35 | +//! a vector consisting of [obj, cstr_1, ..., cstr_n] and the cstr values |
| 36 | +//! are intended to be negative at the end of the optimization. |
| 37 | +//! Constraint number should be declared with `n_cstr` setter. |
//! A tolerance can be adjusted with the `cstr_tol` setter to relax constraint violation:
//! when specified, cstr values should be < `cstr_tol` (instead of < 0).
| 40 | +//! |
| 41 | +//! ```no_run |
| 42 | +//! # use ndarray::{array, Array2, ArrayView1, ArrayView2, Zip}; |
| 43 | +//! # use egobox_doe::{Lhs, SamplingMethod}; |
| 44 | +//! # use egobox_ego::{EgorBuilder, InfillStrategy, InfillOptimizer}; |
| 45 | +//! # use rand_xoshiro::Xoshiro256Plus; |
| 46 | +//! # use ndarray_rand::rand::SeedableRng; |
| 47 | +//! |
| 48 | +//! // Function G24: 1 global optimum y_opt = -5.5080 at x_opt =(2.3295, 3.1785) |
| 49 | +//! fn g24(x: &ArrayView1<f64>) -> f64 { |
| 50 | +//! -x[0] - x[1] |
| 51 | +//! } |
| 52 | +//! |
| 53 | +//! // Constraints < 0 |
| 54 | +//! fn g24_c1(x: &ArrayView1<f64>) -> f64 { |
| 55 | +//! -2.0 * x[0].powf(4.0) + 8.0 * x[0].powf(3.0) - 8.0 * x[0].powf(2.0) + x[1] - 2.0 |
| 56 | +//! } |
| 57 | +//! |
| 58 | +//! fn g24_c2(x: &ArrayView1<f64>) -> f64 { |
| 59 | +//! -4.0 * x[0].powf(4.0) + 32.0 * x[0].powf(3.0) |
| 60 | +//! - 88.0 * x[0].powf(2.0) + 96.0 * x[0] + x[1] |
| 61 | +//! - 36.0 |
| 62 | +//! } |
| 63 | +//! |
//! // Grouped function: objective + constraints
| 65 | +//! fn f_g24(x: &ArrayView2<f64>) -> Array2<f64> { |
| 66 | +//! let mut y = Array2::zeros((x.nrows(), 3)); |
| 67 | +//! Zip::from(y.rows_mut()) |
| 68 | +//! .and(x.rows()) |
| 69 | +//! .for_each(|mut yi, xi| { |
| 70 | +//! yi.assign(&array![g24(&xi), g24_c1(&xi), g24_c2(&xi)]); |
| 71 | +//! }); |
| 72 | +//! y |
| 73 | +//! } |
| 74 | +//! |
| 75 | +//! let xlimits = array![[0., 3.], [0., 4.]]; |
| 76 | +//! let doe = Lhs::new(&xlimits).sample(10); |
| 77 | +//! let res = EgorBuilder::optimize(f_g24) |
| 78 | +//! .min_within(&xlimits) |
| 79 | +//! .n_cstr(2) |
| 80 | +//! .infill_strategy(InfillStrategy::EI) |
| 81 | +//! .infill_optimizer(InfillOptimizer::Cobyla) |
| 82 | +//! .doe(&doe) |
| 83 | +//! .n_iter(40) |
| 84 | +//! .target(-5.5080) |
| 85 | +//! .run() |
| 86 | +//! .expect("g24 minimized"); |
| 87 | +//! println!("G24 min result = {:?}", res); |
| 88 | +//! ``` |
| 89 | +//! |
| 90 | +use crate::egor_solver::*; |
| 91 | +use crate::mixint::*; |
| 92 | +use crate::types::*; |
| 93 | + |
| 94 | +use egobox_moe::{CorrelationSpec, MoeParams, RegressionSpec}; |
| 95 | +use ndarray::Array1; |
| 96 | +use ndarray::{Array2, ArrayBase, Data, Ix2}; |
| 97 | +use ndarray_rand::rand::SeedableRng; |
| 98 | +use rand_xoshiro::Xoshiro256Plus; |
| 99 | + |
/// EGO optimizer service builder allowing to use Egor optimizer
/// with an ask-and-tell interface.
///
/// The builder only records an optional RNG seed; the optimization domain is
/// supplied later through `min_within` or `min_within_mixint_space`.
pub struct EgorServiceBuilder {
    // Optional seed for the random number generator; when set, runs are reproducible.
    seed: Option<u64>,
}
| 106 | + |
| 107 | +impl EgorServiceBuilder { |
| 108 | + /// Function to be minimized domain should be basically R^nx -> R^ny |
| 109 | + /// where nx is the dimension of input x and ny the output dimension |
| 110 | + /// equal to 1 (obj) + n (cstrs). |
| 111 | + /// But function has to be able to evaluate several points in one go |
| 112 | + /// hence take an (p, nx) matrix and return an (p, ny) matrix |
| 113 | + pub fn optimize() -> Self { |
| 114 | + EgorServiceBuilder { seed: None } |
| 115 | + } |
| 116 | + |
| 117 | + /// Allow to specify a seed for random number generator to allow |
| 118 | + /// reproducible runs. |
| 119 | + pub fn random_seed(mut self, seed: u64) -> Self { |
| 120 | + self.seed = Some(seed); |
| 121 | + self |
| 122 | + } |
| 123 | + |
| 124 | + /// Build an Egor optimizer to minimize the function within |
| 125 | + /// the continuous `xlimits` specified as [[lower, upper], ...] array where the |
| 126 | + /// number of rows gives the dimension of the inputs (continuous optimization) |
| 127 | + /// and the ith row is the interval of the ith component of the input x. |
| 128 | + pub fn min_within( |
| 129 | + self, |
| 130 | + xlimits: &ArrayBase<impl Data<Elem = f64>, Ix2>, |
| 131 | + ) -> EgorService<MoeParams<f64, Xoshiro256Plus>> { |
| 132 | + let rng = if let Some(seed) = self.seed { |
| 133 | + Xoshiro256Plus::seed_from_u64(seed) |
| 134 | + } else { |
| 135 | + Xoshiro256Plus::from_entropy() |
| 136 | + }; |
| 137 | + EgorService { |
| 138 | + solver: EgorSolver::new(xlimits, rng), |
| 139 | + } |
| 140 | + } |
| 141 | + |
| 142 | + /// Build an Egor optimizer to minimize the function R^n -> R^p taking |
| 143 | + /// inputs specified with given xtypes where some of components may be |
| 144 | + /// discrete variables (mixed-integer optimization). |
| 145 | + pub fn min_within_mixint_space(self, xtypes: &[XType]) -> EgorService<MixintMoeParams> { |
| 146 | + let rng = if let Some(seed) = self.seed { |
| 147 | + Xoshiro256Plus::seed_from_u64(seed) |
| 148 | + } else { |
| 149 | + Xoshiro256Plus::from_entropy() |
| 150 | + }; |
| 151 | + EgorService { |
| 152 | + solver: EgorSolver::new_with_xtypes(xtypes, rng), |
| 153 | + } |
| 154 | + } |
| 155 | +} |
| 156 | + |
/// EGO optimizer service wrapping an `EgorSolver` configuration and
/// exposing an ask-and-tell interface through `EgorService::suggest`.
///
/// Built via `EgorServiceBuilder`; setters delegate to the underlying solver.
#[derive(Clone)]
pub struct EgorService<SB: SurrogateBuilder> {
    // Underlying EGO solver holding the configuration and surrogate builder.
    solver: EgorSolver<SB>,
}
| 163 | + |
impl<SB: SurrogateBuilder> EgorService<SB> {
    /// Sets the allowed number of evaluations of the function under optimization.
    pub fn n_iter(mut self, n_iter: usize) -> Self {
        self.solver = self.solver.n_iter(n_iter);
        self
    }

    /// Sets the number of runs of infill strategy optimizations (best result taken).
    pub fn n_start(mut self, n_start: usize) -> Self {
        self.solver = self.solver.n_start(n_start);
        self
    }

    /// Sets the number of parallel evaluations of the function under optimization.
    pub fn q_points(mut self, q_points: usize) -> Self {
        self.solver = self.solver.q_points(q_points);
        self
    }

    /// Number of samples of initial LHS sampling (used when DOE not provided by the user).
    ///
    /// When 0 a number of points is computed automatically regarding the number of input variables
    /// of the function under optimization.
    pub fn n_doe(mut self, n_doe: usize) -> Self {
        self.solver = self.solver.n_doe(n_doe);
        self
    }

    /// Sets the number of constraint functions.
    pub fn n_cstr(mut self, n_cstr: usize) -> Self {
        self.solver = self.solver.n_cstr(n_cstr);
        self
    }

    /// Sets the tolerance on constraints violation (cstr < tol), one value per constraint.
    pub fn cstr_tol(mut self, tol: &Array1<f64>) -> Self {
        self.solver = self.solver.cstr_tol(tol);
        self
    }

    /// Sets an initial DOE of shape \[`ns`, `nt`\] containing `ns` samples.
    ///
    /// Either `nt` = `nx` then only `x` input values are specified and `ns` evals are done to get y output doe values,
    /// or `nt = nx + ny` then `x = doe\[:, :nx\]` and `y = doe\[:, nx:\]` are specified.
    pub fn doe(mut self, doe: &Array2<f64>) -> Self {
        self.solver = self.solver.doe(doe);
        self
    }

    /// Sets the parallel infill strategy.
    ///
    /// Parallel infill criterion to get virtual next promising points in order to allow
    /// n parallel evaluations of the function under optimization.
    pub fn qei_strategy(mut self, q_ei: QEiStrategy) -> Self {
        self.solver = self.solver.qei_strategy(q_ei);
        self
    }

    /// Sets the infill strategy.
    pub fn infill_strategy(mut self, infill: InfillStrategy) -> Self {
        self.solver = self.solver.infill_strategy(infill);
        self
    }

    /// Sets the infill optimizer.
    pub fn infill_optimizer(mut self, optimizer: InfillOptimizer) -> Self {
        self.solver = self.solver.infill_optimizer(optimizer);
        self
    }

    /// Sets the allowed regression models used in gaussian processes.
    pub fn regression_spec(mut self, regression_spec: RegressionSpec) -> Self {
        self.solver = self.solver.regression_spec(regression_spec);
        self
    }

    /// Sets the allowed correlation models used in gaussian processes.
    pub fn correlation_spec(mut self, correlation_spec: CorrelationSpec) -> Self {
        self.solver = self.solver.correlation_spec(correlation_spec);
        self
    }

    /// Sets the number of components to be used when specifying PLS projection is used (a.k.a KPLS method).
    ///
    /// This is used to address high-dimensional problems typically when `nx` > 9 where `nx` is the dimension of `x`.
    pub fn kpls_dim(mut self, kpls_dim: usize) -> Self {
        self.solver = self.solver.kpls_dim(kpls_dim);
        self
    }

    /// Sets the number of clusters used by the mixture of surrogate experts.
    ///
    /// When set to 0, the number of clusters is determined automatically
    /// (warning in this case the optimizer runs slower).
    pub fn n_clusters(mut self, n_clusters: usize) -> Self {
        self.solver = self.solver.n_clusters(n_clusters);
        self
    }

    /// Sets a known target minimum to be used as a stopping criterion.
    pub fn target(mut self, target: f64) -> Self {
        self.solver = self.solver.target(target);
        self
    }

    /// Sets a directory to write optimization history and used as search path for hot start doe.
    pub fn outdir(mut self, outdir: impl Into<String>) -> Self {
        self.solver = self.solver.outdir(outdir);
        self
    }

    /// Whether we start by loading last DOE saved in `outdir` as initial DOE.
    pub fn hot_start(mut self, hot_start: bool) -> Self {
        self.solver = self.solver.hot_start(hot_start);
        self
    }

    /// Given an evaluated doe (x, y) data, returns the next promising x point
    /// where the optimum may occur regarding the infill criterion.
    /// This function inverts the control of the optimization and enables
    /// the ask-and-tell interface to the EGO optimizer.
    pub fn suggest(
        &self,
        x_data: &ArrayBase<impl Data<Elem = f64>, Ix2>,
        y_data: &ArrayBase<impl Data<Elem = f64>, Ix2>,
    ) -> Array2<f64> {
        self.solver.suggest(x_data, y_data)
    }
}
| 293 | + |
#[cfg(test)]
mod tests {
    use super::*;
    use approx::assert_abs_diff_eq;
    use ndarray::{array, concatenate, ArrayView2, Axis};

    use ndarray_stats::QuantileExt;

    use serial_test::serial;

    // Classic 1D EGO test function on [0, 25]; known minimum around -15.1.
    fn xsinx(x: &ArrayView2<f64>) -> Array2<f64> {
        (x - 3.5) * ((x - 3.5) / std::f64::consts::PI).mapv(|v| v.sin())
    }

    #[test]
    #[serial]
    fn test_xsinx_egor_builder() {
        // Fixed seed so the ask-and-tell loop is reproducible.
        let service = EgorServiceBuilder::optimize()
            .random_seed(42)
            .min_within(&array![[0., 25.]])
            .regression_spec(RegressionSpec::ALL)
            .correlation_spec(CorrelationSpec::ALL)
            .infill_strategy(InfillStrategy::EI);

        // Start from a small hand-picked DOE, then run 10 suggest/evaluate rounds.
        let mut x_doe = array![[0.], [7.], [20.], [25.]];
        let mut y_doe = xsinx(&x_doe.view());
        for _ in 0..10 {
            let x_next = service.suggest(&x_doe, &y_doe);
            x_doe = concatenate![Axis(0), x_doe, x_next];
            y_doe = xsinx(&x_doe.view());
        }

        // Best observed value should be close to the known minimum.
        let y_opt = *y_doe.min().unwrap();
        assert_abs_diff_eq!(-15.1, y_opt, epsilon = 1e-1);
    }
}
0 commit comments