Skip to contents

Feature selection using the Genetic Algorithm from the package genalg.

Dictionary

This FSelector can be instantiated with the associated sugar function fs():

fs("genetic_search")

Control Parameters

For the meaning of the control parameters, see genalg::rbga.bin(). genalg::rbga.bin() internally terminates after iters iteration. We set ìters = 100000 to allow the termination via our terminators. If more iterations are needed, set ìters to a higher value in the parameter set.

Super class

mlr3fselect::FSelector -> FSelectorGeneticSearch

Methods

Inherited methods


Method new()

Creates a new instance of this R6 class.


Method clone()

The objects of this class are cloneable with this method.

Usage

FSelectorGeneticSearch$clone(deep = FALSE)

Arguments

deep

Whether to make a deep clone.

Examples

# Feature Selection
# \donttest{

# retrieve task and load learner
task = tsk("penguins")
learner = lrn("classif.rpart")

# run feature selection on the Palmer Penguins data set
instance = fselect(
  method = "genetic_search",
  task = task,
  learner = learner,
  resampling = rsmp("holdout"),
  measure = msr("classif.ce"),
  term_evals = 10
)

# best performing feature set
instance$result
#>    bill_depth bill_length body_mass flipper_length island   sex  year
#> 1:       TRUE       FALSE      TRUE          FALSE   TRUE FALSE FALSE
#>                       features classif.ce
#> 1: bill_depth,body_mass,island  0.1391304

# all evaluated feature sets
as.data.table(instance$archive)
#>     bill_depth bill_length body_mass flipper_length island   sex  year
#>  1:      FALSE       FALSE     FALSE           TRUE  FALSE FALSE FALSE
#>  2:       TRUE       FALSE      TRUE          FALSE   TRUE FALSE FALSE
#>  3:       TRUE       FALSE     FALSE          FALSE  FALSE FALSE FALSE
#>  4:      FALSE       FALSE      TRUE          FALSE  FALSE FALSE FALSE
#>  5:      FALSE       FALSE      TRUE          FALSE  FALSE FALSE FALSE
#>  6:      FALSE       FALSE     FALSE          FALSE  FALSE FALSE  TRUE
#>  7:      FALSE       FALSE     FALSE          FALSE   TRUE FALSE FALSE
#>  8:      FALSE        TRUE     FALSE          FALSE  FALSE FALSE FALSE
#>  9:      FALSE        TRUE     FALSE          FALSE  FALSE FALSE FALSE
#> 10:      FALSE        TRUE     FALSE          FALSE  FALSE FALSE FALSE
#>     classif.ce runtime_learners           timestamp batch_nr warnings errors
#>  1:  0.2086957            0.068 2022-11-25 12:09:48        1        0      0
#>  2:  0.1391304            0.081 2022-11-25 12:09:48        2        0      0
#>  3:  0.2608696            0.059 2022-11-25 12:09:48        3        0      0
#>  4:  0.2956522            0.067 2022-11-25 12:09:48        4        0      0
#>  5:  0.2956522            0.060 2022-11-25 12:09:48        5        0      0
#>  6:  0.5826087            0.058 2022-11-25 12:09:49        6        0      0
#>  7:  0.3565217            0.066 2022-11-25 12:09:49        7        0      0
#>  8:  0.2521739            0.083 2022-11-25 12:09:49        8        0      0
#>  9:  0.2521739            0.059 2022-11-25 12:09:49        9        0      0
#> 10:  0.2521739            0.061 2022-11-25 12:09:49       10        0      0
#>          resample_result
#>  1: <ResampleResult[21]>
#>  2: <ResampleResult[21]>
#>  3: <ResampleResult[21]>
#>  4: <ResampleResult[21]>
#>  5: <ResampleResult[21]>
#>  6: <ResampleResult[21]>
#>  7: <ResampleResult[21]>
#>  8: <ResampleResult[21]>
#>  9: <ResampleResult[21]>
#> 10: <ResampleResult[21]>

# subset the task and fit the final model
task$select(instance$result_feature_set)
learner$train(task)
# }