From c851ef0de4167b37477ee8322c939efa949bb05d Mon Sep 17 00:00:00 2001 From: Marc Becker <33069354+be-marc@users.noreply.github.com> Date: Wed, 9 Nov 2022 19:41:54 +0100 Subject: [PATCH] refactor: rewrite auto fselector function and class (#58) * refactor: rewrite auto fselector function and class * fix: task clone * fix: parameters * docs: rebuild --- NEWS.md | 3 + R/AutoFSelector.R | 310 ++++++++++++++------- R/auto_fselector.R | 21 +- man-roxygen/param_learner.R | 3 +- man-roxygen/param_measure.R | 2 +- man-roxygen/param_resampling.R | 5 +- man-roxygen/param_store_fselect_instance.R | 3 + man-roxygen/param_terminator.R | 3 +- man/AutoFSelector.Rd | 214 ++++++++++---- man/FSelectInstanceMultiCrit.Rd | 11 +- man/FSelectInstanceSingleCrit.Rd | 13 +- man/ObjectiveFSelect.Rd | 8 +- man/auto_fselector.Rd | 66 ++++- man/fselect.Rd | 8 +- man/fselect_nested.Rd | 5 +- tests/testthat/test_AutoFSelector.R | 66 ++--- tests/testthat/test_FSelectorRFE.R | 2 +- 17 files changed, 522 insertions(+), 221 deletions(-) create mode 100644 man-roxygen/param_store_fselect_instance.R diff --git a/NEWS.md b/NEWS.md index d89c16d5..c5a43846 100644 --- a/NEWS.md +++ b/NEWS.md @@ -1,6 +1,9 @@ # mlr3fselect 0.7.2.9000 * refactor: `FSelectorRFE` throws an error if the learner does not support the `$importance()` method. +* refactor: The `AutoFSelector` stores the instance and benchmark result if `store_models = TRUE`. +* refactor: The `AutoFSelector` stores the instance if `store_benchmark_result = TRUE`. +* feat: Add missing parameters from `AutoFSelector` to `auto_fselect()`. # mlr3fselect 0.7.2 diff --git a/R/AutoFSelector.R b/R/AutoFSelector.R index 1aaf0e03..63187d0e 100644 --- a/R/AutoFSelector.R +++ b/R/AutoFSelector.R @@ -1,24 +1,32 @@ #' @title AutoFSelector #' #' @description -#' The `AutoFSelector` is a [mlr3::Learner] which wraps another [mlr3::Learner] -#' and performs the following steps during `$train()`: +#' The [AutoFSelector] wraps a [mlr3::Learner] and augments it with an automatic feature selection. +#' The [auto_fselector()] function creates an [AutoFSelector] object. #' -#' 1. The wrapped (inner) learner is trained on the feature subsets via -#' resampling. The feature selection can be specified by providing a -#' [FSelector], a [bbotk::Terminator], a [mlr3::Resampling] and a -#' [mlr3::Measure]. -#' 2. A final model is fit on the complete training data with the best found -#' feature subset. +#' @details +#' The [AutoFSelector] is a [mlr3::Learner] which wraps another [mlr3::Learner] and performs the following steps during `$train()`: #' -#' During `$predict()` the `AutoFSelector` just calls the predict method of the -#' wrapped (inner) learner. +#' 1. The wrapped (inner) learner is trained on the feature subsets via resampling. +#' The feature selection can be specified by providing a [FSelector], a [bbotk::Terminator], a [mlr3::Resampling] and a [mlr3::Measure]. +#' 2. A final model is fit on the complete training data with the best found feature subset. #' -#' Note that this approach allows to perform nested resampling by passing an -#' [AutoFSelector] object to [mlr3::resample()] or [mlr3::benchmark()]. -#' To access the inner resampling results, set `store_fselect_instance = TRUE` -#' and execute [mlr3::resample()] or [mlr3::benchmark()] with -#' `store_models = TRUE`. +#' During `$predict()` the [AutoFSelector] just calls the predict method of the wrapped (inner) learner. +#' +#' @section Resources: +#' * [book chapter](https://mlr3book.mlr-org.com/feature-selection.html#autofselect) on automatic feature selection. +#' +#' @section Nested Resampling: +#' Nested resampling can be performed by passing an [AutoFSelector] object to [mlr3::resample()] or [mlr3::benchmark()]. +#' To access the inner resampling results, set `store_fselect_instance = TRUE` and execute [mlr3::resample()] or [mlr3::benchmark()] with `store_models = TRUE` (see examples). +#' The [mlr3::Resampling] passed to the [AutoFSelector] is meant to be the inner resampling, operating on the training set of an arbitrary outer resampling. +#' For this reason it is not feasible to pass an instantiated [mlr3::Resampling] here. +#' +#' @template param_learner +#' @template param_resampling +#' @template param_measure +#' @template param_terminator +#' @template param_store_fselect_instance #' #' @template param_store_models #' @template param_check_values @@ -26,80 +34,85 @@ #' #' @export #' @examples -#' library(mlr3) +#' # Automafsic Feafsure Selection +#' +#' task = tsk("penguins") +#' train_set = sample(task$nrow, 0.8 * task$nrow) +#' test_set = setdiff(seq_len(task$nrow), train_set) #' -#' task = tsk("iris") -#' learner = lrn("classif.rpart") -#' resampling = rsmp("holdout") -#' measure = msr("classif.ce") +#' afs = auto_fselector( +#' method = fs("random_search"), +#' learner = lrn("classif.rpart"), +#' resampling = rsmp ("holdout"), +#' measure = msr("classif.ce"), +#' term_evals = 4) #' -#' terminator = trm("evals", n_evals = 3) -#' fselector = fs("exhaustive_search") -#' afs = AutoFSelector$new(learner, resampling, measure, terminator, fselector, -#' store_fselect_instance = TRUE) +#' # optimize feafsure subset and fit final model +#' afs$train(task, row_ids = train_set) #' -#' afs$train(task) +#' # predict with final model +#' afs$predict(task, row_ids = test_set) +#' +#' # show fselect result +#' afs$fselect_result +#' +#' # model slot contains trained learner and fselect instance #' afs$model +#' +#' # shortcut trained learner #' afs$learner +#' +#' # shortcut fselect instance +#' afs$tuning_instance +#' +#' +#' # Nested Resampling +#' +#' afs = auto_fselector( +#' method = fs("random_search"), +#' learner = lrn("classif.rpart"), +#' resampling = rsmp ("holdout"), +#' measure = msr("classif.ce"), +#' term_evals = 4) +#' +#' resampling_outer = rsmp("cv", folds = 3) +#' rr = resample(task, afs, resampling_outer, store_models = TRUE) +#' +#' # retrieve inner tuning results. +#' extract_inner_fselect_results(rr) +#' +#' # performance scores estimated on the outer resampling +#' rr$score() +#' +#' # unbiased performance of the final model trained on the full dafsa set +#' rr$aggregate() AutoFSelector = R6Class("AutoFSelector", inherit = Learner, public = list( #' @field instance_args (`list()`)\cr - #' All arguments from construction to create the - #' [FSelectInstanceSingleCrit]. + #' All arguments from construction to create the [FSelectInstanceSingleCrit]. instance_args = NULL, #' @field fselector ([FSelector])\cr - #' Stores the feature selection algorithm. + #' Optimization algorithm. fselector = NULL, #' @description #' Creates a new instance of this [R6][R6::R6Class] class. #' - #' @param learner ([mlr3::Learner])\cr - #' Learner to optimize the feature subset for, see - #' [FSelectInstanceSingleCrit]. - #' - #' @param resampling ([mlr3::Resampling])\cr - #' Resampling strategy during feature selection, see - #' [FSelectInstanceSingleCrit]. This [mlr3::Resampling] is meant to be the - #' **inner** resampling, operating on the training set of an arbitrary outer - #' resampling. For this reason it is not feasible to pass an instantiated - #' [mlr3::Resampling] here. - #' - #' @param measure ([mlr3::Measure])\cr - #' Performance measure to optimize. - #' - #' @param terminator ([bbotk::Terminator])\cr - #' When to stop feature selection, see [FSelectInstanceSingleCrit]. - #' #' @param fselector ([FSelector])\cr - #' Feature selection algorithm to run. - #' - #' @param store_fselect_instance (`logical(1)`)\cr - #' If `TRUE` (default), stores the internally created - #' [FSelectInstanceSingleCrit] with all intermediate results in slot - #' `$fselect_instance`. - initialize = function(learner, resampling, measure, terminator, fselector, - store_fselect_instance = TRUE, store_benchmark_result = TRUE, - store_models = FALSE, check_values = FALSE) { + #' Optimization algorithm. + initialize = function(learner, resampling, measure = NULL, terminator, fselector, store_fselect_instance = TRUE, store_benchmark_result = TRUE, store_models = FALSE, check_values = FALSE) { ia = list() ia$learner = assert_learner(as_learner(learner, clone = TRUE)) - ia$resampling = assert_resampling(resampling, - instantiated = FALSE)$clone() - ia$measure = assert_measure(as_measure(measure), learner = learner) + ia$resampling = assert_resampling(resampling, instantiated = FALSE)$clone() + if (!is.null(measure)) ia$measure = assert_measure(as_measure(measure), learner = learner) ia$terminator = assert_terminator(terminator)$clone() - private$.store_fselect_instance = assert_flag(store_fselect_instance) - ia$store_benchmark_result = assert_flag(store_benchmark_result) - ia$store_models = assert_flag(store_models) - if (!private$.store_fselect_instance && ia$store_benchmark_result) { - stop("Benchmark results can only be stored if store_fselect_instance is set to TRUE") - } - if (ia$store_models && !ia$store_benchmark_result) { - stop("Models can only be stored if store_benchmark_result is set to TRUE") - } + ia$store_models = assert_flag(store_models) + ia$store_benchmark_result = assert_flag(store_benchmark_result) || ia$store_models + private$.store_fselect_instance = assert_flag(store_fselect_instance) || ia$store_benchmark_result ia$check_values = assert_flag(check_values) self$instance_args = ia @@ -111,7 +124,6 @@ AutoFSelector = R6Class("AutoFSelector", packages = c("mlr3fselect", learner$packages), feature_types = learner$feature_types, predict_types = learner$predict_types, - param_set = learner$param_set, properties = learner$properties ) @@ -120,52 +132,96 @@ AutoFSelector = R6Class("AutoFSelector", }, #' @description - #' Extracts the base learner from nested learner objects like - #' `GraphLearner` in \CRANpkg{mlr3pipelines}. If `recursive = 0`, the (tuned) - #' learner is returned. + #' Extracts the base learner from nested learner objects like `GraphLearner` in \CRANpkg{mlr3pipelines}. + #' If `recursive = 0`, the (tuned) learner is returned. #' #' @param recursive (`integer(1)`)\cr #' Depth of recursion for multiple nested objects. #' #' @return [Learner]. base_learner = function(recursive = Inf) { - if(recursive == 0) self$learner else self$learner$base_learner(recursive -1) - } - ), - - private = list( - - .train = function(task) { - - ia = self$instance_args - ia$task = task$clone() - instance = invoke(FSelectInstanceSingleCrit$new, .args = ia) - self$fselector$optimize(instance) - - feat = task$feature_names[as.logical(instance$result_x_search_space)] - ia$task$select(feat) + if (recursive == 0L) self$learner else self$learner$base_learner(recursive - 1L) + }, - learner = ia$learner$clone(deep = TRUE) - learner$train(ia$task) + #' @description + #' The importance scores of the final model. + #' + #' @return Named `numeric()`. + importance = function() { + if ("importance" %nin% self$instance_args$learner$properties) { + stopf("Learner ''%s' cannot calculate important scores.", self$instance_args$learner$id) + } + if (is.null(self$model$learner$model)) { + self$instance_args$learner$importance() + } else { + self$model$learner$importance() + } + }, - result_model = list(learner = learner, features = feat) - if (isTRUE(private$.store_fselect_instance)) { - result_model$fselect_instance = instance + #' @description + #' The selected features of the final model. + #' These features are selected internally by the learner. + #' + #' @return `character()`. + selected_features = function() { + if ("selected_features" %nin% self$instance_args$learner$properties) { + stopf("Learner ''%s' cannot select features.", self$instance_args$learner$id) + } + if (is.null(self$model$learner$model)) { + self$instance_args$learner$selected_features() + } else { + self$model$learner$selected_features() } - return(result_model) }, - .predict = function(task) { - task = task$clone(deep = TRUE) - task$select(self$model$features) - self$model$learner$predict(task) + #' @description + #' The out-of-bag error of the final model. + #' + #' @return `numeric(1)`. + oob_error = function() { + if ("oob_error" %nin% self$instance_args$learner$properties) { + stopf("Learner '%s' cannot calculate the out-of-bag error.", self$instance_args$learner$id) + } + if (is.null(self$model$learner$model)) { + self$instance_args$learner$oob_error() + } else { + self$model$learner$oob_error() + } }, - .base_learner = function(recursive = Inf) { - if (recursive == 0L) self$learner else self$learner$base_learner(recursive - 1L) + #' @description + #' The log-likelihood of the final model. + #' + #' @return `logLik`. + loglik = function() { + if ("loglik" %nin% self$instance_args$learner$properties) { + stopf("Learner '%s' cannot calculate the log-likelihood.", self$instance_args$learner$id) + } + if (is.null(self$model$learner$model)) { + self$instance_args$learner$loglik() + } else { + self$model$learner$loglik() + } }, - .store_fselect_instance = NULL + #' Printer. + #' @param ... (ignored). + print = function() { + catf(format(self)) + catf(str_indent("* Model:", if (is.null(self$model)) "-" else class(self$model)[1L])) + catf(str_indent("* Packages:", self$packages)) + catf(str_indent("* Predict Type:", self$predict_type)) + catf(str_indent("* Feature Types:", self$feature_types)) + catf(str_indent("* Properties:", self$properties)) + w = self$warnings + e = self$errors + if (length(w)) { + catf(str_indent("* Warnings:", w)) + } + if (length(e)) { + catf(str_indent("* Errors:", e)) + } + } ), active = list( @@ -178,7 +234,7 @@ AutoFSelector = R6Class("AutoFSelector", #' Trained learner. learner = function() { # if there is no trained learner, we return the one in instance args - if (is.null(self$model)) { + if (is.null(self$model$learner$model)) { self$instance_args$learner } else { self$model$learner @@ -186,14 +242,32 @@ AutoFSelector = R6Class("AutoFSelector", }, #' @field fselect_instance ([FSelectInstanceSingleCrit])\cr - #' Internally created feature selection instance with all intermediate - #' results. + #' Internally created feature selection instance with all intermediate results. fselect_instance = function() self$model$fselect_instance, #' @field fselect_result ([data.table::data.table])\cr #' Short-cut to `$result` from [FSelectInstanceSingleCrit]. fselect_result = function() self$fselect_instance$result, + #' @field predict_type (`character(1)`)\cr + #' Stores the currently active predict type, e.g. `"response"`. + #' Must be an element of `$predict_types`. + predict_type = function(rhs) { + if (missing(rhs)) { + return(private$.predict_type) + } + if (rhs %nin% self$predict_types) { + stopf("Learner '%s' does not support predict type '%s'", self$id, rhs) + } + + # Catches 'Error: Field/Binding is read-only' bug + tryCatch({ + self$model$learner$predict_type = rhs + }, error = function(cond){}) + + private$.predict_type = rhs + }, + #' @field hash (`character(1)`)\cr #' Hash (unique identifier) for this object. hash = function(rhs) { @@ -201,5 +275,39 @@ AutoFSelector = R6Class("AutoFSelector", calculate_hash(class(self), self$id, self$param_set$values, private$.predict_type, self$fallback$hash, self$instance_args, private$.store_fselect_instance) } + ), + + private = list( + .train = function(task) { + # construct instance from args; then tune + ia = self$instance_args + ia$task = task$clone() + instance = invoke(FSelectInstanceSingleCrit$new, .args = ia) + self$fselector$optimize(instance) + learner = ia$learner$clone(deep = TRUE) + task = task$clone() + + # disable timeout to allow train on full data set without time limit + # timeout during tuning is not affected + learner$timeout = c(train = Inf, predict = Inf) + + # fit final model + feat = task$feature_names[as.logical(instance$result_x_search_space)] + task$select(feat) + learner$train(task) + + # the return model is a list of "learner", "features" and "fselect_instance" + result_model = list(learner = learner, features = feat) + if (private$.store_fselect_instance) result_model$fselect_instance = instance + result_model + }, + + .predict = function(task) { + task = task$clone(deep = TRUE) + task$select(self$model$features) + self$model$learner$predict(task) + }, + + .store_fselect_instance = NULL ) ) diff --git a/R/auto_fselector.R b/R/auto_fselector.R index ecbe7c61..49f01dfe 100644 --- a/R/auto_fselector.R +++ b/R/auto_fselector.R @@ -1,7 +1,9 @@ -#' @title Syntactic Sugar for Automatic Feature Selection +#' @title Function for Automatic Feature Selection #' -#' @description -#' Function to create an [AutoFSelector] object. +#' @inherit AutoFSelector description +#' @inheritSection AutoFSelector Resources +#' @inherit AutoFSelector details +#' @inheritSection AutoFSelector Nested Resampling #' #' @param method (`character(1)` | [FSelector])\cr #' Key to retrieve fselector from [mlr_fselectors] dictionary or [FSelector] object. @@ -12,11 +14,16 @@ #' @param ... (named `list()`)\cr #' Named arguments to be set as parameters of the fselector. #' -#' @return [AutoFSelector] +#' @return [AutoFSelector]. #' #' @template param_learner #' @template param_resampling #' @template param_measure +#' @template param_terminator +#' @template param_store_fselect_instance +#' @template param_store_benchmark_result +#' @template param_store_models +#' @template param_check_values #' #' @export #' @examples @@ -28,14 +35,14 @@ #' term_evals = 4) #' #' at$train(tsk("pima")) -auto_fselector = function(method, learner, resampling, measure, term_evals = NULL, term_time = NULL, ...) { +auto_fselector = function(method, learner, resampling, measure = NULL, term_evals = NULL, term_time = NULL, terminator = NULL, store_fselect_instance = TRUE, store_benchmark_result = TRUE, store_models = FALSE, check_values = FALSE, ...) { fselector = if (is.character(method)) { assert_choice(method, mlr_fselectors$keys()) fs(method, ...) } else { assert_fselector(method) } - terminator = terminator_selection(term_evals, term_time) + terminator = terminator %??% terminator_selection(term_evals, term_time) - AutoFSelector$new(learner, resampling, measure, terminator, fselector) + AutoFSelector$new(learner = learner, resampling = resampling, measure = measure, terminator = terminator, fselector = fselector, store_fselect_instance = store_fselect_instance, store_benchmark_result = store_benchmark_result, store_models = store_models, check_values = check_values) } diff --git a/man-roxygen/param_learner.R b/man-roxygen/param_learner.R index c6e624ba..2703ebf8 100644 --- a/man-roxygen/param_learner.R +++ b/man-roxygen/param_learner.R @@ -1 +1,2 @@ -#' @param learner ([mlr3::Learner]). +#' @param learner ([mlr3::Learner])\cr +#' Learner to optimize the feature subset for. diff --git a/man-roxygen/param_measure.R b/man-roxygen/param_measure.R index c397e1bb..fcb0a2e4 100644 --- a/man-roxygen/param_measure.R +++ b/man-roxygen/param_measure.R @@ -1,2 +1,2 @@ #' @param measure ([mlr3::Measure])\cr -#' Measure to optimize. +#' Measure to optimize. If `NULL`, default measure is used. diff --git a/man-roxygen/param_resampling.R b/man-roxygen/param_resampling.R index 8f6bb2d6..e0bd515f 100644 --- a/man-roxygen/param_resampling.R +++ b/man-roxygen/param_resampling.R @@ -1,3 +1,4 @@ #' @param resampling ([mlr3::Resampling])\cr -#' Uninstantiated resamplings are instantiated during construction -#' so that all configurations are evaluated on the same data splits. +#' Resampling that is used to evaluated the performance of the feature subsets. +#' Uninstantiated resamplings are instantiated during construction so that all feature subsets are evaluated on the same data splits. +#' Already instantiated resamplings are kept unchanged. diff --git a/man-roxygen/param_store_fselect_instance.R b/man-roxygen/param_store_fselect_instance.R new file mode 100644 index 00000000..a6a569e8 --- /dev/null +++ b/man-roxygen/param_store_fselect_instance.R @@ -0,0 +1,3 @@ +#' @param store_fselect_instance (`logical(1)`)\cr +#' If `TRUE` (default), stores the internally created [FSelectInstanceSingleCrit] with all intermediate results in slot `$fselect_instance`. +#' Is set to `TRUE`, if `store_models = TRUE` diff --git a/man-roxygen/param_terminator.R b/man-roxygen/param_terminator.R index 676fb1fb..66f298f1 100644 --- a/man-roxygen/param_terminator.R +++ b/man-roxygen/param_terminator.R @@ -1 +1,2 @@ -#' @param terminator ([bbotk::Terminator]). +#' @param terminator ([Terminator])\cr +#' Stop criterion of the feature selection. diff --git a/man/AutoFSelector.Rd b/man/AutoFSelector.Rd index a9c2ea0e..ed1cf498 100644 --- a/man/AutoFSelector.Rd +++ b/man/AutoFSelector.Rd @@ -4,42 +4,87 @@ \alias{AutoFSelector} \title{AutoFSelector} \description{ -The \code{AutoFSelector} is a \link[mlr3:Learner]{mlr3::Learner} which wraps another \link[mlr3:Learner]{mlr3::Learner} -and performs the following steps during \verb{$train()}: +The \link{AutoFSelector} wraps a \link[mlr3:Learner]{mlr3::Learner} and augments it with an automatic feature selection. +The \code{\link[=auto_fselector]{auto_fselector()}} function creates an \link{AutoFSelector} object. +} +\details{ +The \link{AutoFSelector} is a \link[mlr3:Learner]{mlr3::Learner} which wraps another \link[mlr3:Learner]{mlr3::Learner} and performs the following steps during \verb{$train()}: \enumerate{ -\item The wrapped (inner) learner is trained on the feature subsets via -resampling. The feature selection can be specified by providing a -\link{FSelector}, a \link[bbotk:Terminator]{bbotk::Terminator}, a \link[mlr3:Resampling]{mlr3::Resampling} and a -\link[mlr3:Measure]{mlr3::Measure}. -\item A final model is fit on the complete training data with the best found -feature subset. +\item The wrapped (inner) learner is trained on the feature subsets via resampling. +The feature selection can be specified by providing a \link{FSelector}, a \link[bbotk:Terminator]{bbotk::Terminator}, a \link[mlr3:Resampling]{mlr3::Resampling} and a \link[mlr3:Measure]{mlr3::Measure}. +\item A final model is fit on the complete training data with the best found feature subset. +} + +During \verb{$predict()} the \link{AutoFSelector} just calls the predict method of the wrapped (inner) learner. +} +\section{Resources}{ + +\itemize{ +\item \href{https://mlr3book.mlr-org.com/feature-selection.html#autofselect}{book chapter} on automatic feature selection. +} } -During \verb{$predict()} the \code{AutoFSelector} just calls the predict method of the -wrapped (inner) learner. +\section{Nested Resampling}{ -Note that this approach allows to perform nested resampling by passing an -\link{AutoFSelector} object to \code{\link[mlr3:resample]{mlr3::resample()}} or \code{\link[mlr3:benchmark]{mlr3::benchmark()}}. -To access the inner resampling results, set \code{store_fselect_instance = TRUE} -and execute \code{\link[mlr3:resample]{mlr3::resample()}} or \code{\link[mlr3:benchmark]{mlr3::benchmark()}} with -\code{store_models = TRUE}. +Nested resampling can be performed by passing an \link{AutoFSelector} object to \code{\link[mlr3:resample]{mlr3::resample()}} or \code{\link[mlr3:benchmark]{mlr3::benchmark()}}. +To access the inner resampling results, set \code{store_fselect_instance = TRUE} and execute \code{\link[mlr3:resample]{mlr3::resample()}} or \code{\link[mlr3:benchmark]{mlr3::benchmark()}} with \code{store_models = TRUE} (see examples). +The \link[mlr3:Resampling]{mlr3::Resampling} passed to the \link{AutoFSelector} is meant to be the inner resampling, operating on the training set of an arbitrary outer resampling. +For this reason it is not feasible to pass an instantiated \link[mlr3:Resampling]{mlr3::Resampling} here. } + \examples{ -library(mlr3) +# Automafsic Feafsure Selection -task = tsk("iris") -learner = lrn("classif.rpart") -resampling = rsmp("holdout") -measure = msr("classif.ce") +task = tsk("penguins") +train_set = sample(task$nrow, 0.8 * task$nrow) +test_set = setdiff(seq_len(task$nrow), train_set) -terminator = trm("evals", n_evals = 3) -fselector = fs("exhaustive_search") -afs = AutoFSelector$new(learner, resampling, measure, terminator, fselector, - store_fselect_instance = TRUE) +afs = auto_fselector( + method = fs("random_search"), + learner = lrn("classif.rpart"), + resampling = rsmp ("holdout"), + measure = msr("classif.ce"), + term_evals = 4) -afs$train(task) +# optimize feafsure subset and fit final model +afs$train(task, row_ids = train_set) + +# predict with final model +afs$predict(task, row_ids = test_set) + +# show fselect result +afs$fselect_result + +# model slot contains trained learner and fselect instance afs$model + +# shortcut trained learner afs$learner + +# shortcut fselect instance +afs$tuning_instance + + +# Nested Resampling + +afs = auto_fselector( + method = fs("random_search"), + learner = lrn("classif.rpart"), + resampling = rsmp ("holdout"), + measure = msr("classif.ce"), + term_evals = 4) + +resampling_outer = rsmp("cv", folds = 3) +rr = resample(task, afs, resampling_outer, store_models = TRUE) + +# retrieve inner tuning results. +extract_inner_fselect_results(rr) + +# performance scores estimated on the outer resampling +rr$score() + +# unbiased performance of the final model trained on the full dafsa set +rr$aggregate() } \section{Super class}{ \code{\link[mlr3:Learner]{mlr3::Learner}} -> \code{AutoFSelector} @@ -48,11 +93,10 @@ afs$learner \if{html}{\out{
mlr3::Learner$help()
mlr3::Learner$predict()
mlr3::Learner$predict_newdata()
mlr3::Learner$print()
mlr3::Learner$reset()
mlr3::Learner$train()