From 1adefb501b9e49521719d028e2176c58e6dc6cf9 Mon Sep 17 00:00:00 2001
From: "Anthony D. Blaom"
Date: Wed, 10 Jul 2024 21:09:35 +1200
Subject: [PATCH 1/2] bump 0.17.3

---
 Project.toml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/Project.toml b/Project.toml
index 58b2563..5babd59 100644
--- a/Project.toml
+++ b/Project.toml
@@ -1,7 +1,7 @@
 name = "MLJModels"
 uuid = "d491faf4-2d78-11e9-2867-c94bc002c0b7"
 authors = ["Anthony D. Blaom "]
-version = "0.17.2"
+version = "0.17.3"
 
 [deps]
 CategoricalArrays = "324d7699-5711-5eae-9e2f-1d82baa6b597"

From 2c511f0362b08eb93997b3d014035762f7129667 Mon Sep 17 00:00:00 2001
From: "Anthony D. Blaom"
Date: Wed, 10 Jul 2024 21:13:48 +1200
Subject: [PATCH 2/2] update model registry

---
 src/MLJModels.jl           |   2 +-
 src/registry/Metadata.toml | 326 ++++++++++++++++++++++++++++++++++---
 src/registry/Models.toml   |   2 +-
 3 files changed, 304 insertions(+), 26 deletions(-)

diff --git a/src/MLJModels.jl b/src/MLJModels.jl
index 36b2c1a..daad124 100755
--- a/src/MLJModels.jl
+++ b/src/MLJModels.jl
@@ -1,4 +1,4 @@
-module MLJModels
+module MLJModels
 
 import MLJModelInterface
 import MLJModelInterface: Model, metadata_pkg, metadata_model, @mlj_model, info,

diff --git a/src/registry/Metadata.toml b/src/registry/Metadata.toml
index 9c8f122..3ed0464 100644
--- a/src/registry/Metadata.toml
+++ b/src/registry/Metadata.toml
@@ -7,6 +7,7 @@
 ":predict_scitype" = "`AbstractVector{<:ScientificTypesBase.Continuous}`"
 ":transform_scitype" = "`ScientificTypesBase.Unknown`"
 ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`"
+":target_in_fit" = "`true`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "BetaML"
 ":package_license" = "MIT"
@@ -42,6 +43,7 @@
 ":predict_scitype" = "`ScientificTypesBase.Unknown`"
 ":transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`"
 ":inverse_transform_scitype" = "`Union{ScientificTypesBase.Table{<:AbstractVector{<:Union{Missing, ScientificTypesBase.Continuous}}}, AbstractMatrix{<:Union{Missing, ScientificTypesBase.Continuous}}}`"
+":target_in_fit" = "`false`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "BetaML"
 ":package_license" = "MIT"
@@ -77,6 +79,7 @@
 ":predict_scitype" = "`ScientificTypesBase.Unknown`"
 ":transform_scitype" = "`ScientificTypesBase.Unknown`"
 ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`"
+":target_in_fit" = "`true`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "BetaML"
 ":package_license" = "MIT"
@@ -112,6 +115,7 @@
 ":predict_scitype" = "`ScientificTypesBase.Unknown`"
 ":transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Known}}`"
 ":inverse_transform_scitype" = "`Union{ScientificTypesBase.Table{<:AbstractVector{<:Union{Missing, ScientificTypesBase.Known}}}, AbstractMatrix{<:Union{Missing, ScientificTypesBase.Known}}}`"
+":target_in_fit" = "`false`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "BetaML"
 ":package_license" = "MIT"
@@ -147,6 +151,7 @@
 ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`"
 ":transform_scitype" = "`ScientificTypesBase.Unknown`"
 ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`"
+":target_in_fit" = "`true`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "BetaML"
 ":package_license" = "MIT"
@@ -182,6 +187,7 @@
 ":predict_scitype" = "`ScientificTypesBase.Unknown`"
 ":transform_scitype" = "`AbstractMatrix{<:Union{ScientificTypesBase.Continuous, ScientificTypesBase.Count}}`"
 ":inverse_transform_scitype" = "`Union{ScientificTypesBase.Table{<:AbstractVector{<:Union{ScientificTypesBase.Continuous, ScientificTypesBase.Count}}}, AbstractMatrix{<:Union{ScientificTypesBase.Continuous, ScientificTypesBase.Count}}}`"
+":target_in_fit" = "`false`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "BetaML"
 ":package_license" = "MIT"
@@ -217,6 +223,7 @@
 ":predict_scitype" = "`AbstractVector{<:ScientificTypesBase.Continuous}`"
 ":transform_scitype" = "`ScientificTypesBase.Unknown`"
 ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`"
+":target_in_fit" = "`true`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "BetaML"
 ":package_license" = "MIT"
@@ -252,6 +259,7 @@
 ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`"
 ":transform_scitype" = "`ScientificTypesBase.Unknown`"
 ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`"
+":target_in_fit" = "`true`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "BetaML"
 ":package_license" = "MIT"
@@ -287,6 +295,7 @@
 ":predict_scitype" = "`ScientificTypesBase.Unknown`"
 ":transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`"
 ":inverse_transform_scitype" = "`Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}, AbstractMatrix{<:ScientificTypesBase.Continuous}}`"
+":target_in_fit" = "`false`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "BetaML"
 ":package_license" = "MIT"
@@ -322,6 +331,7 @@
 ":predict_scitype" = "`AbstractVector{<:Union{ScientificTypesBase.Continuous, ScientificTypesBase.Count}}`"
 ":transform_scitype" = "`ScientificTypesBase.Unknown`"
 ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`"
+":target_in_fit" = "`true`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "BetaML"
 ":package_license" = "MIT"
@@ -357,6 +367,7 @@
 ":predict_scitype" = "`AbstractMatrix{<:ScientificTypesBase.Continuous}`"
 ":transform_scitype" = "`ScientificTypesBase.Unknown`"
 ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`"
+":target_in_fit" = "`true`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "BetaML"
 ":package_license" = "MIT"
@@ -392,6 +403,7 @@
 ":predict_scitype" = "`AbstractVector{<:ScientificTypesBase.Continuous}`"
 ":transform_scitype" = "`ScientificTypesBase.Unknown`"
 ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`"
+":target_in_fit" = "`true`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "BetaML"
 ":package_license" = "MIT"
@@ -427,6 +439,7 @@
 ":predict_scitype" = "`AbstractMatrix{<:Union{ScientificTypesBase.Continuous, ScientificTypesBase.Count}}`"
 ":transform_scitype" = "`ScientificTypesBase.Unknown`"
 ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`"
+":target_in_fit" = "`true`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "BetaML"
 ":package_license" = "MIT"
@@ -462,6 +475,7 @@
 ":predict_scitype" = "`ScientificTypesBase.Unknown`"
 ":transform_scitype" = "`ScientificTypesBase.Unknown`"
 ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`"
+":target_in_fit" = "`true`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "BetaML"
 ":package_license" = "MIT"
@@ -497,6 +511,7 @@
 ":predict_scitype" = "`ScientificTypesBase.Unknown`"
 ":transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Known}}`"
 ":inverse_transform_scitype" = "`Union{ScientificTypesBase.Table{<:AbstractVector{<:Union{Missing, ScientificTypesBase.Known}}}, AbstractMatrix{<:Union{Missing, ScientificTypesBase.Known}}}`"
+":target_in_fit" = "`false`"
 ":is_pure_julia" = "`true`"
":package_name" = "BetaML" ":package_license" = "MIT" @@ -532,6 +547,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "BetaML" ":package_license" = "MIT" @@ -567,6 +583,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`Union{ScientificTypesBase.Table{<:AbstractVector{<:Union{Missing, ScientificTypesBase.Continuous}}}, AbstractMatrix{<:Union{Missing, ScientificTypesBase.Continuous}}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "BetaML" ":package_license" = "MIT" @@ -602,6 +619,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`AbstractArray{<:ScientificTypesBase.Multiclass}`" ":inverse_transform_scitype" = "`Union{ScientificTypesBase.Table{<:AbstractVector{<:Union{Missing, ScientificTypesBase.Continuous}}}, AbstractMatrix{<:Union{Missing, ScientificTypesBase.Continuous}}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "BetaML" ":package_license" = "MIT" @@ -637,6 +655,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "BetaML" ":package_license" = "MIT" @@ -672,6 +691,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}, AbstractMatrix{<:ScientificTypesBase.Continuous}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "BetaML" ":package_license" = "MIT" @@ -707,6 +727,7 @@ ":predict_scitype" = "`AbstractVector{<:ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "CatBoost" ":package_license" = "MIT" @@ -742,6 +763,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "CatBoost" ":package_license" = "MIT" @@ -777,6 +799,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "NearestNeighborModels" ":package_license" = "MIT" @@ -812,6 +835,7 @@ ":predict_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Density{<:ScientificTypesBase.Finite}}}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = 
"NearestNeighborModels" ":package_license" = "MIT" @@ -847,6 +871,7 @@ ":predict_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "NearestNeighborModels" ":package_license" = "MIT" @@ -882,6 +907,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "NearestNeighborModels" ":package_license" = "MIT" @@ -917,6 +943,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -952,6 +979,7 @@ ":predict_scitype" = "`AbstractVector{<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -987,6 +1015,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1022,6 +1051,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1057,6 +1087,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1092,6 +1123,7 @@ ":predict_scitype" = "`AbstractVector{<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1127,6 +1159,7 @@ ":predict_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1162,6 +1195,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = 
"MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1197,6 +1231,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1232,6 +1267,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1267,6 +1303,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1302,6 +1339,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1337,6 +1375,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1372,6 +1411,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1407,6 +1447,7 @@ ":predict_scitype" = "`AbstractVector{<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1442,6 +1483,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1477,6 +1519,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1512,6 +1555,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" 
":package_license" = "BSD" @@ -1547,6 +1591,7 @@ ":predict_scitype" = "`AbstractVector{<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1582,6 +1627,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1617,6 +1663,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1652,6 +1699,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1687,6 +1735,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1722,6 +1771,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1757,6 +1807,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1792,6 +1843,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1827,6 +1879,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1862,6 +1915,7 @@ ":predict_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" 
":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1897,6 +1951,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1932,6 +1987,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -1967,6 +2023,7 @@ ":predict_scitype" = "`AbstractVector{<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2002,6 +2059,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2037,6 +2095,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2072,6 +2131,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2107,6 +2167,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2142,6 +2203,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2177,6 +2239,7 @@ ":predict_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2212,6 +2275,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" 
= "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2247,6 +2311,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2282,6 +2347,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2317,6 +2383,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2352,6 +2419,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2387,6 +2455,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2422,6 +2491,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2457,6 +2527,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2492,6 +2563,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2527,6 +2599,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2562,6 +2635,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" 
":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2597,6 +2671,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2632,6 +2707,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2667,6 +2743,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2702,6 +2779,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2737,6 +2815,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2772,6 +2851,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2807,6 +2887,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2842,6 +2923,7 @@ ":predict_scitype" = "`AbstractVector{<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2877,6 +2959,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ 
-2912,6 +2995,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2947,6 +3031,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -2982,6 +3067,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -3017,6 +3103,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -3052,6 +3139,7 @@ ":predict_scitype" = "`AbstractVector{<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -3087,6 +3175,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -3122,6 +3211,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -3157,6 +3247,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -3192,6 +3283,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -3227,6 +3319,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" 
+":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -3262,6 +3355,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -3297,6 +3391,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -3332,6 +3427,7 @@ ":predict_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -3367,6 +3463,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -3402,6 +3499,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -3437,6 +3535,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -3472,6 +3571,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -3507,6 +3607,7 @@ ":predict_scitype" = "`AbstractVector{<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJScikitLearnInterface" ":package_license" = "BSD" @@ -3542,6 +3643,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "OutlierDetectionNeighbors" ":package_license" = "MIT" @@ -3577,6 +3679,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = 
"`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "OutlierDetectionNeighbors" ":package_license" = "MIT" @@ -3612,6 +3715,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "OutlierDetectionNeighbors" ":package_license" = "MIT" @@ -3647,6 +3751,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "OutlierDetectionNeighbors" ":package_license" = "MIT" @@ -3682,6 +3787,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "OutlierDetectionNeighbors" ":package_license" = "MIT" @@ -3717,6 +3823,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "SIRUS" ":package_license" = "MIT" @@ -3752,6 +3859,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "SIRUS" ":package_license" = "MIT" @@ -3787,6 +3895,7 @@ ":predict_scitype" = "`AbstractVector{<:ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "SIRUS" ":package_license" = "MIT" @@ -3822,6 +3931,7 @@ ":predict_scitype" = "`AbstractVector{<:ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "SIRUS" ":package_license" = "MIT" @@ -3857,6 +3967,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJIteration" ":package_license" = "MIT" @@ -3892,6 +4003,7 @@ ":predict_scitype" = "`Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" 
":package_name" = "PartialLeastSquaresRegressor" ":package_license" = "MIT" @@ -3927,6 +4039,7 @@ ":predict_scitype" = "`Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "PartialLeastSquaresRegressor" ":package_license" = "MIT" @@ -3962,6 +4075,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "PartitionedLS" ":package_license" = "MIT" @@ -3997,6 +4111,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "MLJLinearModels" ":package_license" = "MIT" @@ -4032,6 +4147,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "MLJLinearModels" ":package_license" = "MIT" @@ -4067,6 +4183,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "MLJLinearModels" ":package_license" = "MIT" @@ -4102,6 +4219,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "MLJLinearModels" ":package_license" = "MIT" @@ -4137,6 +4255,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "MLJLinearModels" ":package_license" = "MIT" @@ -4172,6 +4291,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "MLJLinearModels" ":package_license" = "MIT" @@ -4207,6 +4327,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "MLJLinearModels" ":package_license" = "MIT" @@ -4242,6 +4363,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "MLJLinearModels" 
":package_license" = "MIT" @@ -4277,6 +4399,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "MLJLinearModels" ":package_license" = "MIT" @@ -4312,6 +4435,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "MLJLinearModels" ":package_license" = "MIT" @@ -4347,6 +4471,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "ParallelKMeans" ":package_license" = "MIT" @@ -4382,6 +4507,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "NaiveBayes" ":package_license" = "unknown" @@ -4417,6 +4543,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "NaiveBayes" ":package_license" = "unknown" @@ -4452,6 +4579,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "MLJBase" ":package_license" = "unknown" @@ -4487,6 +4615,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "MLJBase" ":package_license" = "unknown" @@ -4497,7 +4626,7 @@ ":supports_weights" = "`missing`" ":supports_class_weights" = "`missing`" ":supports_online" = "`false`" -":docstring" = "```\nresampler = Resampler(\n model=ConstantRegressor(),\n resampling=CV(),\n measure=nothing,\n weights=nothing,\n class_weights=nothing\n operation=predict,\n repeats = 1,\n acceleration=default_resource(),\n check_measure=true,\n per_observation=true,\n logger=nothing,\n compact=false,\n)\n```\n\n*Private method.* Use at own risk.\n\nResampling model wrapper, used internally by the `fit` method of `TunedModel` instances and `IteratedModel` instances. See [`evaluate!`](@ref) for meaning of the options. 
Not intended for use by general user, who will ordinarily use [`evaluate!`](@ref) directly.\n\nGiven a machine `mach = machine(resampler, args...)` one obtains a performance evaluation of the specified `model`, performed according to the prescribed `resampling` strategy and other parameters, using data `args...`, by calling `fit!(mach)` followed by `evaluate(mach)`.\n\nOn subsequent calls to `fit!(mach)` new train/test pairs of row indices are only regenerated if `resampling`, `repeats` or `cache` fields of `resampler` have changed. The evolution of an RNG field of `resampler` does *not* constitute a change (`==` for `MLJType` objects is not sensitive to such changes; see [`is_same_except`](@ref)).\n\nIf there is single train/test pair, then warm-restart behavior of the wrapped model `resampler.model` will extend to warm-restart behaviour of the wrapper `resampler`, with respect to mutations of the wrapped model.\n\nThe sample `weights` are passed to the specified performance measures that support weights for evaluation. These weights are not to be confused with any weights bound to a `Resampler` instance in a machine, used for training the wrapped `model` when supported.\n\nThe sample `class_weights` are passed to the specified performance measures that support per-class weights for evaluation. These weights are not to be confused with any weights bound to a `Resampler` instance in a machine, used for training the wrapped `model` when supported.\n" +":docstring" = "```\nresampler = Resampler(\n model=ConstantRegressor(),\n resampling=CV(),\n measure=nothing,\n weights=nothing,\n class_weights=nothing\n operation=predict,\n repeats = 1,\n acceleration=default_resource(),\n check_measure=true,\n per_observation=true,\n logger=default_logger(),\n compact=false,\n)\n```\n\n*Private method.* Use at own risk.\n\nResampling model wrapper, used internally by the `fit` method of `TunedModel` instances and `IteratedModel` instances. See [`evaluate!`](@ref) for meaning of the options. Not intended for use by general user, who will ordinarily use [`evaluate!`](@ref) directly.\n\nGiven a machine `mach = machine(resampler, args...)` one obtains a performance evaluation of the specified `model`, performed according to the prescribed `resampling` strategy and other parameters, using data `args...`, by calling `fit!(mach)` followed by `evaluate(mach)`.\n\nOn subsequent calls to `fit!(mach)` new train/test pairs of row indices are only regenerated if `resampling`, `repeats` or `cache` fields of `resampler` have changed. The evolution of an RNG field of `resampler` does *not* constitute a change (`==` for `MLJType` objects is not sensitive to such changes; see [`is_same_except`](@ref)).\n\nIf there is single train/test pair, then warm-restart behavior of the wrapped model `resampler.model` will extend to warm-restart behaviour of the wrapper `resampler`, with respect to mutations of the wrapped model.\n\nThe sample `weights` are passed to the specified performance measures that support weights for evaluation. These weights are not to be confused with any weights bound to a `Resampler` instance in a machine, used for training the wrapped `model` when supported.\n\nThe sample `class_weights` are passed to the specified performance measures that support per-class weights for evaluation. 
These weights are not to be confused with any weights bound to a `Resampler` instance in a machine, used for training the wrapped `model` when supported.\n" ":name" = "Resampler" ":human_name" = "resampler" ":is_supervised" = "`false`" @@ -4522,6 +4651,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJBase" ":package_license" = "MIT" @@ -4557,6 +4687,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJBase" ":package_license" = "MIT" @@ -4592,6 +4723,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "MultivariateStats" ":package_license" = "MIT" @@ -4627,6 +4759,7 @@ ":predict_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "MultivariateStats" ":package_license" = "MIT" @@ -4662,6 +4795,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "MultivariateStats" ":package_license" = "MIT" @@ -4697,6 +4831,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "MultivariateStats" ":package_license" = "MIT" @@ -4732,6 +4867,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "MultivariateStats" ":package_license" = "MIT" @@ -4767,6 +4903,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "MultivariateStats" ":package_license" = "MIT" @@ -4802,6 +4939,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "MultivariateStats" ":package_license" = "MIT" @@ 
 ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`"
 ":transform_scitype" = "`ScientificTypesBase.Unknown`"
 ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`"
+":target_in_fit" = "`true`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "MultivariateStats"
 ":package_license" = "MIT"
@@ -4872,6 +5011,7 @@
 ":predict_scitype" = "`ScientificTypesBase.Unknown`"
 ":transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`"
 ":inverse_transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`"
+":target_in_fit" = "`false`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "MultivariateStats"
 ":package_license" = "MIT"
@@ -4907,6 +5047,7 @@
 ":predict_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`"
 ":transform_scitype" = "`ScientificTypesBase.Unknown`"
 ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`"
+":target_in_fit" = "`true`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "MultivariateStats"
 ":package_license" = "MIT"
@@ -4942,6 +5083,7 @@
 ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`"
 ":transform_scitype" = "`ScientificTypesBase.Unknown`"
 ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`"
+":target_in_fit" = "`true`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "MultivariateStats"
 ":package_license" = "MIT"
@@ -4977,6 +5119,7 @@
 ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`"
 ":transform_scitype" = "`ScientificTypesBase.Unknown`"
 ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`"
+":target_in_fit" = "`true`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "MultivariateStats"
 ":package_license" = "MIT"
@@ -5012,6 +5155,7 @@
 ":predict_scitype" = "`ScientificTypesBase.Unknown`"
 ":transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`"
 ":inverse_transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`"
+":target_in_fit" = "`false`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "MultivariateStats"
 ":package_license" = "MIT"
@@ -5047,6 +5191,7 @@
 ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`"
 ":transform_scitype" = "`ScientificTypesBase.Unknown`"
 ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`"
+":target_in_fit" = "`true`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "DecisionTree"
 ":package_license" = "MIT"
@@ -5082,6 +5227,7 @@
 ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`"
 ":transform_scitype" = "`ScientificTypesBase.Unknown`"
 ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`"
+":target_in_fit" = "`true`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "DecisionTree"
 ":package_license" = "MIT"
@@ -5117,6 +5263,7 @@
 ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`"
 ":transform_scitype" = "`ScientificTypesBase.Unknown`"
 ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`"
+":target_in_fit" = "`true`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "DecisionTree"
 ":package_license" = "MIT"
@@ -5152,6 +5299,7 @@
 ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`"
 ":transform_scitype" = "`ScientificTypesBase.Unknown`"
 ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`"
+":target_in_fit" = "`true`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "DecisionTree"
 ":package_license" = "MIT"
@@ -5187,6 +5335,7 @@
 ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`"
 ":transform_scitype" = "`ScientificTypesBase.Unknown`"
 ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`"
+":target_in_fit" = "`true`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "DecisionTree"
 ":package_license" = "MIT"
@@ -5222,6 +5371,7 @@
 ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`"
 ":transform_scitype" = "`ScientificTypesBase.Unknown`"
 ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`"
+":target_in_fit" = "`true`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "MLJBalancing"
 ":package_license" = "unknown"
@@ -5257,6 +5407,7 @@
 ":predict_scitype" = "`ScientificTypesBase.Unknown`"
 ":transform_scitype" = "`ScientificTypesBase.Unknown`"
 ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`"
+":target_in_fit" = "`true`"
 ":is_pure_julia" = "`false`"
 ":package_name" = "MLJBalancing"
 ":package_license" = "MIT"
@@ -5292,6 +5443,7 @@
 ":predict_scitype" = "`ScientificTypesBase.Unknown`"
 ":transform_scitype" = "`Tuple{Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}, AbstractMatrix{ScientificTypesBase.Continuous}}, AbstractVector}`"
 ":inverse_transform_scitype" = "`Tuple{Union{ScientificTypesBase.Table{<:AbstractVector{<:Union{ScientificTypesBase.Infinite, ScientificTypesBase.Finite}}}, AbstractMatrix{ScientificTypesBase.Infinite}}, AbstractVector}`"
+":target_in_fit" = "`false`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "Imbalance"
 ":package_license" = "unknown"
@@ -5327,6 +5479,7 @@
 ":predict_scitype" = "`ScientificTypesBase.Unknown`"
 ":transform_scitype" = "`Tuple{ScientificTypesBase.Table{<:AbstractVector{<:Union{ScientificTypesBase.Infinite, ScientificTypesBase.Finite}}}, AbstractVector}`"
 ":inverse_transform_scitype" = "`Tuple{ScientificTypesBase.Table{<:AbstractVector{<:Union{ScientificTypesBase.Infinite, ScientificTypesBase.Finite}}}, AbstractVector}`"
+":target_in_fit" = "`false`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "Imbalance"
 ":package_license" = "unknown"
@@ -5362,6 +5515,7 @@
 ":predict_scitype" = "`ScientificTypesBase.Unknown`"
 ":transform_scitype" = "`Tuple{Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}, AbstractMatrix{ScientificTypesBase.Continuous}}, AbstractVector}`"
 ":inverse_transform_scitype" = "`Tuple{Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}, AbstractMatrix{ScientificTypesBase.Continuous}}, AbstractVector}`"
+":target_in_fit" = "`false`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "Imbalance"
 ":package_license" = "unknown"
@@ -5397,6 +5551,7 @@
 ":predict_scitype" = "`ScientificTypesBase.Unknown`"
 ":transform_scitype" = "`Tuple{Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}, AbstractMatrix{ScientificTypesBase.Continuous}}, AbstractVector}`"
 ":inverse_transform_scitype" = "`Tuple{Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}, AbstractMatrix{ScientificTypesBase.Continuous}}, AbstractVector}`"
+":target_in_fit" = "`false`"
 ":is_pure_julia" = "`true`"
 ":package_name" = "Imbalance"
 ":package_license" = "unknown"
@@ -5432,6 +5587,7 @@
 ":predict_scitype" = "`ScientificTypesBase.Unknown`"
":transform_scitype" = "`Tuple{Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}, AbstractMatrix{ScientificTypesBase.Continuous}}, AbstractVector}`" ":inverse_transform_scitype" = "`Tuple{Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}, AbstractMatrix{ScientificTypesBase.Continuous}}, AbstractVector}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "Imbalance" ":package_license" = "unknown" @@ -5467,6 +5623,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Finite}}, AbstractMatrix{<:ScientificTypesBase.Finite}}, AbstractVector}`" ":inverse_transform_scitype" = "`Tuple{Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Finite}}, AbstractMatrix{<:ScientificTypesBase.Finite}}, AbstractVector}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "Imbalance" ":package_license" = "unknown" @@ -5502,6 +5659,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}, AbstractMatrix{ScientificTypesBase.Continuous}}, AbstractVector}`" ":inverse_transform_scitype" = "`Tuple{Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}, AbstractMatrix{ScientificTypesBase.Continuous}}, AbstractVector}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "Imbalance" ":package_license" = "unknown" @@ -5537,6 +5695,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}, AbstractMatrix{ScientificTypesBase.Continuous}}, AbstractVector}`" ":inverse_transform_scitype" = "`Tuple{Union{ScientificTypesBase.Table{<:AbstractVector{<:Union{ScientificTypesBase.Infinite, ScientificTypesBase.Finite}}}, AbstractMatrix{ScientificTypesBase.Infinite}}, AbstractVector}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "Imbalance" ":package_license" = "unknown" @@ -5572,6 +5731,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}, AbstractMatrix{ScientificTypesBase.Continuous}}, AbstractVector}`" ":inverse_transform_scitype" = "`Tuple{Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}, AbstractMatrix{ScientificTypesBase.Continuous}}, AbstractVector}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "Imbalance" ":package_license" = "unknown" @@ -5607,6 +5767,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}, AbstractMatrix{ScientificTypesBase.Continuous}}, AbstractVector}`" ":inverse_transform_scitype" = "`Tuple{Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}, AbstractMatrix{ScientificTypesBase.Continuous}}, AbstractVector}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "Imbalance" ":package_license" = "unknown" @@ -5642,6 +5803,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{ScientificTypesBase.Table{<:AbstractVector{<:Union{ScientificTypesBase.Infinite, 
ScientificTypesBase.Finite}}}, AbstractVector}`" ":inverse_transform_scitype" = "`Tuple{ScientificTypesBase.Table{<:AbstractVector{<:Union{ScientificTypesBase.Infinite, ScientificTypesBase.Finite}}}, AbstractVector}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "Imbalance" ":package_license" = "unknown" @@ -5677,6 +5839,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJTuning" ":package_license" = "MIT" @@ -5712,6 +5875,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Table`" ":inverse_transform_scitype" = "`ScientificTypesBase.Table`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "FeatureSelection" ":package_license" = "MIT" @@ -5747,17 +5911,18 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "FeatureSelection" ":package_license" = "MIT" ":load_path" = "FeatureSelection.RecursiveFeatureElimination" ":package_uuid" = "33837fe5-dbff-4c9e-8c2f-c5612fe2b8b6" ":package_url" = "https://github.com/JuliaAI/FeatureSelection.jl" -":is_wrapper" = "`true`" +":is_wrapper" = "`false`" ":supports_weights" = "`false`" ":supports_class_weights" = "`false`" ":supports_online" = "`false`" -":docstring" = "```\nRecursiveFeatureElimination(model, n_features, step)\n```\n\nThis model implements a recursive feature elimination algorithm for feature selection. It recursively removes features, training a base model on the remaining features and evaluating their importance until the desired number of features is selected.\n\nConstruct an instance with default hyper-parameters using the syntax `rfe_model = RecursiveFeatureElimination(model=...)`. Provide keyword arguments to override hyper-parameter defaults.\n\n# Training data\n\nIn MLJ or MLJBase, bind an instance `rfe_model` to data with\n\n```\nmach = machine(rfe_model, X, y)\n```\n\nOR, if the base model supports weights, as\n\n```\nmach = machine(rfe_model, X, y, w)\n```\n\nHere:\n\n * `X` is any table of input features (eg, a `DataFrame`) whose columns are of the scitype as that required by the base model; check column scitypes with `schema(X)` and column scitypes required by base model with `input_scitype(basemodel)`.\n * `y` is the target, which can be any table of responses whose element scitype is `Continuous` or `Finite` depending on the `target_scitype` required by the base model; check the scitype with `scitype(y)`.\n * `w` is the observation weights which can either be `nothing`(default) or an `AbstractVector` whoose element scitype is `Count` or `Continuous`. This is different from `weights` kernel which is an hyperparameter to the model, see below.\n\nTrain the machine using `fit!(mach, rows=...)`.\n\n# Hyper-parameters\n\n * model: A base model with a `fit` method that provides information on feature feature importance (i.e `reports_feature_importances(model) == true`)\n * n_features::Real = 0: The number of features to select. If `0`, half of the features are selected. If a positive integer, the parameter is the absolute number of features to select. 
If a real number between 0 and 1, it is the fraction of features to select.\n * step::Real=1: If the value of step is at least 1, it signifies the quantity of features to eliminate in each iteration. Conversely, if step falls strictly within the range of 0.0 to 1.0, it denotes the proportion (rounded down) of features to remove during each iteration.\n\n# Operations\n\n * `transform(mach, X)`: transform the input table `X` into a new table containing only\n\ncolumns corresponding to features gotten from the RFE algorithm.\n\n * `predict(mach, X)`: transform the input table `X` into a new table same as in\n * `transform(mach, X)` above and predict using the fitted base model on the transformed table.\n\n# Fitted parameters\n\nThe fields of `fitted_params(mach)` are:\n\n * `features_left`: names of features remaining after recursive feature elimination.\n * `model_fitresult`: fitted parameters of the base model.\n\n# Report\n\nThe fields of `report(mach)` are:\n\n * `ranking`: The feature ranking of each features in the training dataset.\n * `model_report`: report for the fitted base model.\n * `features`: names of features seen during the training process.\n\n# Examples\n\n```\nusing FeatureSelection, MLJ, StableRNGs\n\nRandomForestRegressor = @load RandomForestRegressor pkg=DecisionTree\n\n# Creates a dataset where the target only depends on the first 5 columns of the input table.\nA = rand(rng, 50, 10);\ny = 10 .* sin.(\n pi .* A[:, 1] .* A[:, 2]\n ) + 20 .* (A[:, 3] .- 0.5).^ 2 .+ 10 .* A[:, 4] .+ 5 * A[:, 5]);\nX = MLJ.table(A);\n\n# fit a rfe model\nrf = RandomForestRegressor()\nselector = RecursiveFeatureElimination(model = rf)\nmach = machine(selector, X, y)\nfit!(mach)\n\n# view the feature importances\nfeature_importances(mach)\n\n# predict using the base model\nXnew = MLJ.table(rand(rng, 50, 10));\npredict(mach, Xnew)\n\n```\n" +":docstring" = "```\nRecursiveFeatureElimination(model, n_features, step)\n```\n\nThis model implements a recursive feature elimination algorithm for feature selection. It recursively removes features, training a base model on the remaining features and evaluating their importance until the desired number of features is selected.\n\nConstruct an instance with default hyper-parameters using the syntax `rfe_model = RecursiveFeatureElimination(model=...)`. Provide keyword arguments to override hyper-parameter defaults.\n\n# Training data\n\nIn MLJ or MLJBase, bind an instance `rfe_model` to data with\n\n```\nmach = machine(rfe_model, X, y)\n```\n\nOR, if the base model supports weights, as\n\n```\nmach = machine(rfe_model, X, y, w)\n```\n\nHere:\n\n * `X` is any table of input features (eg, a `DataFrame`) whose columns are of the same scitype as that required by the base model; check column scitypes with `schema(X)` and the column scitypes required by the base model with `input_scitype(basemodel)`.\n * `y` is the target, which can be any table of responses whose element scitype is `Continuous` or `Finite` depending on the `target_scitype` required by the base model; check the scitype with `scitype(y)`.\n * `w` is the observation weights, which can either be `nothing` (default) or an `AbstractVector` whose element scitype is `Count` or `Continuous`. 
This is different from the `weights` hyper-parameter of the model; see below.\n\nTrain the machine using `fit!(mach, rows=...)`.\n\n# Hyper-parameters\n\n * model: A base model with a `fit` method that provides information on feature importance (i.e. `reports_feature_importances(model) == true`)\n * n_features::Real = 0: The number of features to select. If `0`, half of the features are selected. If a positive integer, the parameter is the absolute number of features to select. If a real number between 0 and 1, it is the fraction of features to select.\n * step::Real=1: If the value of step is at least 1, it signifies the quantity of features to eliminate in each iteration. Conversely, if step falls strictly within the range of 0.0 to 1.0, it denotes the proportion (rounded down) of features to remove during each iteration.\n\n# Operations\n\n * `transform(mach, X)`: transform the input table `X` into a new table containing only the columns corresponding to features selected by the RFE algorithm.\n * `predict(mach, X)`: transform the input table `X` into a new table, as in `transform(mach, X)` above, and predict using the fitted base model on the transformed table.\n\n# Fitted parameters\n\nThe fields of `fitted_params(mach)` are:\n\n * `features_left`: names of features remaining after recursive feature elimination.\n * `model_fitresult`: fitted parameters of the base model.\n\n# Report\n\nThe fields of `report(mach)` are:\n\n * `scores`: dictionary of scores for each feature in the training dataset. The model deems highly scored variables more significant.\n * `model_report`: report for the fitted base model.\n\n# Examples\n\n```\nusing FeatureSelection, MLJ, StableRNGs\n\nRandomForestRegressor = @load RandomForestRegressor pkg=DecisionTree\n\n# Create a dataset where the target only depends on the first 5 columns of the input table.\nrng = StableRNG(123);\nA = rand(rng, 50, 10);\ny = 10 .* sin.(\n pi .* A[:, 1] .* A[:, 2]\n ) .+ 20 .* (A[:, 3] .- 0.5).^2 .+ 10 .* A[:, 4] .+ 5 .* A[:, 5];\nX = MLJ.table(A);\n\n# fit an RFE model\nrf = RandomForestRegressor()\nselector = RecursiveFeatureElimination(model = rf)\nmach = machine(selector, X, y)\nfit!(mach)\n\n# view the feature importances\nfeature_importances(mach)\n\n# predict using the base model\nXnew = MLJ.table(rand(rng, 50, 10));\npredict(mach, Xnew)\n\n```\n" ":name" = "RecursiveFeatureElimination" ":human_name" = "deterministic recursive feature elimination" ":is_supervised" = "`true`" @@ -5782,6 +5947,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`Tuple{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "Clustering" ":package_license" = "MIT" @@ -5817,6 +5983,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`Tuple{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "Clustering" ":package_license" = "MIT" @@ -5852,6 +6019,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" +":target_in_fit" = "`false`" 
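[Editor's note] The `:target_in_fit` trait added throughout this registry update records whether a model's `fit` consumes the target `y`. A minimal sketch of how the new entry would surface to users, assuming the metadata proxy returned by `MLJModels.info` exposes registry keys as properties, as it does for existing traits such as `is_pure_julia`:

```julia
using MLJModels

# Registry lookup for the supervised wrapper documented above; per this
# patch its entry now carries `target_in_fit = true`:
meta = info("RecursiveFeatureElimination", pkg="FeatureSelection")
@show meta.target_in_fit   # expected: true

# Pure transformers are registered with the flag off; the model/package
# pairing below is an illustrative assumption:
@show info("PCA", pkg="MultivariateStats").target_in_fit   # expected: false
```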
":is_pure_julia" = "`true`" ":package_name" = "Clustering" ":package_license" = "MIT" @@ -5887,6 +6055,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "Clustering" ":package_license" = "MIT" @@ -5922,6 +6091,7 @@ ":predict_scitype" = "`AbstractVector{<:ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "EvoLinear" ":package_license" = "MIT" @@ -5957,6 +6127,7 @@ ":predict_scitype" = "`AbstractVector{<:ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "EvoLinear" ":package_license" = "MIT" @@ -5992,6 +6163,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`AbstractMatrix{ScientificTypesBase.Continuous}`" ":inverse_transform_scitype" = "`Union{AbstractVector{<:AbstractVector{ScientificTypesBase.Textual}}, AbstractVector{<:ScientificTypesBase.Multiset{<:Tuple{Vararg{ScientificTypesBase.Textual, var\"_s1\"}} where var\"_s1\"}}, AbstractVector{<:ScientificTypesBase.Multiset{ScientificTypesBase.Textual}}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "MLJText" ":package_license" = "MIT" @@ -6027,6 +6199,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`AbstractMatrix{ScientificTypesBase.Continuous}`" ":inverse_transform_scitype" = "`Union{AbstractVector{<:AbstractVector{ScientificTypesBase.Textual}}, AbstractVector{<:ScientificTypesBase.Multiset{<:Tuple{Vararg{ScientificTypesBase.Textual, var\"_s1\"}} where var\"_s1\"}}, AbstractVector{<:ScientificTypesBase.Multiset{ScientificTypesBase.Textual}}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "MLJText" ":package_license" = "MIT" @@ -6062,6 +6235,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`AbstractMatrix{ScientificTypesBase.Continuous}`" ":inverse_transform_scitype" = "`Union{AbstractVector{<:AbstractVector{ScientificTypesBase.Textual}}, AbstractVector{<:ScientificTypesBase.Multiset{<:Tuple{Vararg{ScientificTypesBase.Textual, var\"_s1\"}} where var\"_s1\"}}, AbstractVector{<:ScientificTypesBase.Multiset{ScientificTypesBase.Textual}}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "MLJText" ":package_license" = "MIT" @@ -6097,6 +6271,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "LightGBM" ":package_license" = "MIT Expat" @@ -6132,6 +6307,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "LightGBM" ":package_license" = "MIT Expat" 
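[Editor's note] Because every registry entry now carries the flag, `:target_in_fit` can also drive registry queries. A sketch under the assumption that `MLJModels.models` accepts a predicate over metadata proxies, as it does for other traits:

```julia
using MLJModels

# All registered models whose `fit` sees the target -- supervised models
# plus target-aware wrappers such as Resampler and TunedModel:
target_aware = models(m -> m.target_in_fit)
foreach(println, first(target_aware, 5))
```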
@@ -6167,6 +6343,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Count}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "XGBoost" ":package_license" = "unknown" @@ -6184,9 +6361,9 @@ ":prediction_type" = ":deterministic" ":abstract_type" = "`MLJModelInterface.Deterministic`" ":implemented_methods" = [":clean!"] -":hyperparameters" = "`(:test, :num_round, :booster, :disable_default_eval_metric, :eta, :num_parallel_tree, :gamma, :max_depth, :min_child_weight, :max_delta_step, :subsample, :colsample_bytree, :colsample_bylevel, :colsample_bynode, :lambda, :alpha, :tree_method, :sketch_eps, :scale_pos_weight, :updater, :refresh_leaf, :process_type, :grow_policy, :max_leaves, :max_bin, :predictor, :sample_type, :normalize_type, :rate_drop, :one_drop, :skip_drop, :feature_selector, :top_k, :tweedie_variance_power, :objective, :base_score, :watchlist, :nthread, :importance_type, :seed, :validate_parameters, :eval_metric)`" -":hyperparameter_types" = "`(\"Int64\", \"Int64\", \"String\", \"Union{Bool, Int64}\", \"Float64\", \"Int64\", \"Float64\", \"Int64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"String\", \"Float64\", \"Float64\", \"Union{Nothing, String}\", \"Union{Bool, Int64}\", \"String\", \"String\", \"Int64\", \"Int64\", \"String\", \"String\", \"String\", \"Float64\", \"Union{Bool, Int64}\", \"Float64\", \"String\", \"Int64\", \"Float64\", \"Any\", \"Float64\", \"Any\", \"Int64\", \"String\", \"Union{Nothing, Int64}\", \"Bool\", \"Vector{String}\")`" -":hyperparameter_ranges" = "`(nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing)`" +":hyperparameters" = "`(:test, :num_round, :booster, :disable_default_eval_metric, :eta, :num_parallel_tree, :gamma, :max_depth, :min_child_weight, :max_delta_step, :subsample, :colsample_bytree, :colsample_bylevel, :colsample_bynode, :lambda, :alpha, :tree_method, :sketch_eps, :scale_pos_weight, :updater, :refresh_leaf, :process_type, :grow_policy, :max_leaves, :max_bin, :predictor, :sample_type, :normalize_type, :rate_drop, :one_drop, :skip_drop, :feature_selector, :top_k, :tweedie_variance_power, :objective, :base_score, :early_stopping_rounds, :watchlist, :nthread, :importance_type, :seed, :validate_parameters, :eval_metric)`" +":hyperparameter_types" = "`(\"Int64\", \"Int64\", \"String\", \"Union{Bool, Int64}\", \"Float64\", \"Int64\", \"Float64\", \"Int64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"String\", \"Float64\", \"Float64\", \"Union{Nothing, String}\", \"Union{Bool, Int64}\", \"String\", \"String\", \"Int64\", \"Int64\", \"String\", \"String\", \"String\", \"Float64\", \"Union{Bool, Int64}\", \"Float64\", \"String\", \"Int64\", \"Float64\", \"Any\", \"Float64\", \"Int64\", \"Any\", \"Int64\", \"String\", \"Union{Nothing, Int64}\", \"Bool\", \"Vector{String}\")`" +":hyperparameter_ranges" = "`(nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, 
nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing)`" ":iteration_parameter" = "`nothing`" ":supports_training_losses" = "`false`" ":reports_feature_importances" = "`true`" @@ -6202,6 +6379,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "XGBoost" ":package_license" = "unknown" @@ -6219,9 +6397,9 @@ ":prediction_type" = ":deterministic" ":abstract_type" = "`MLJModelInterface.Deterministic`" ":implemented_methods" = [":clean!"] -":hyperparameters" = "`(:test, :num_round, :booster, :disable_default_eval_metric, :eta, :num_parallel_tree, :gamma, :max_depth, :min_child_weight, :max_delta_step, :subsample, :colsample_bytree, :colsample_bylevel, :colsample_bynode, :lambda, :alpha, :tree_method, :sketch_eps, :scale_pos_weight, :updater, :refresh_leaf, :process_type, :grow_policy, :max_leaves, :max_bin, :predictor, :sample_type, :normalize_type, :rate_drop, :one_drop, :skip_drop, :feature_selector, :top_k, :tweedie_variance_power, :objective, :base_score, :watchlist, :nthread, :importance_type, :seed, :validate_parameters, :eval_metric)`" -":hyperparameter_types" = "`(\"Int64\", \"Int64\", \"String\", \"Union{Bool, Int64}\", \"Float64\", \"Int64\", \"Float64\", \"Int64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"String\", \"Float64\", \"Float64\", \"Union{Nothing, String}\", \"Union{Bool, Int64}\", \"String\", \"String\", \"Int64\", \"Int64\", \"String\", \"String\", \"String\", \"Float64\", \"Union{Bool, Int64}\", \"Float64\", \"String\", \"Int64\", \"Float64\", \"Any\", \"Float64\", \"Any\", \"Int64\", \"String\", \"Union{Nothing, Int64}\", \"Bool\", \"Vector{String}\")`" -":hyperparameter_ranges" = "`(nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing)`" +":hyperparameters" = "`(:test, :num_round, :booster, :disable_default_eval_metric, :eta, :num_parallel_tree, :gamma, :max_depth, :min_child_weight, :max_delta_step, :subsample, :colsample_bytree, :colsample_bylevel, :colsample_bynode, :lambda, :alpha, :tree_method, :sketch_eps, :scale_pos_weight, :updater, :refresh_leaf, :process_type, :grow_policy, :max_leaves, :max_bin, :predictor, :sample_type, :normalize_type, :rate_drop, :one_drop, :skip_drop, :feature_selector, :top_k, :tweedie_variance_power, :objective, :base_score, :early_stopping_rounds, :watchlist, :nthread, :importance_type, :seed, :validate_parameters, :eval_metric)`" +":hyperparameter_types" = "`(\"Int64\", \"Int64\", \"String\", \"Union{Bool, Int64}\", \"Float64\", \"Int64\", \"Float64\", \"Int64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"String\", \"Float64\", \"Float64\", \"Union{Nothing, String}\", \"Union{Bool, Int64}\", \"String\", \"String\", \"Int64\", \"Int64\", \"String\", \"String\", \"String\", \"Float64\", 
\"Union{Bool, Int64}\", \"Float64\", \"String\", \"Int64\", \"Float64\", \"Any\", \"Float64\", \"Int64\", \"Any\", \"Int64\", \"String\", \"Union{Nothing, Int64}\", \"Bool\", \"Vector{String}\")`" +":hyperparameter_ranges" = "`(nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing)`" ":iteration_parameter" = "`nothing`" ":supports_training_losses" = "`false`" ":reports_feature_importances" = "`true`" @@ -6237,6 +6415,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "XGBoost" ":package_license" = "unknown" @@ -6254,9 +6433,9 @@ ":prediction_type" = ":probabilistic" ":abstract_type" = "`MLJModelInterface.Probabilistic`" ":implemented_methods" = [":clean!", ":fit", ":predict"] -":hyperparameters" = "`(:test, :num_round, :booster, :disable_default_eval_metric, :eta, :num_parallel_tree, :gamma, :max_depth, :min_child_weight, :max_delta_step, :subsample, :colsample_bytree, :colsample_bylevel, :colsample_bynode, :lambda, :alpha, :tree_method, :sketch_eps, :scale_pos_weight, :updater, :refresh_leaf, :process_type, :grow_policy, :max_leaves, :max_bin, :predictor, :sample_type, :normalize_type, :rate_drop, :one_drop, :skip_drop, :feature_selector, :top_k, :tweedie_variance_power, :objective, :base_score, :watchlist, :nthread, :importance_type, :seed, :validate_parameters, :eval_metric)`" -":hyperparameter_types" = "`(\"Int64\", \"Int64\", \"String\", \"Union{Bool, Int64}\", \"Float64\", \"Int64\", \"Float64\", \"Int64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"String\", \"Float64\", \"Float64\", \"Union{Nothing, String}\", \"Union{Bool, Int64}\", \"String\", \"String\", \"Int64\", \"Int64\", \"String\", \"String\", \"String\", \"Float64\", \"Union{Bool, Int64}\", \"Float64\", \"String\", \"Int64\", \"Float64\", \"Any\", \"Float64\", \"Any\", \"Int64\", \"String\", \"Union{Nothing, Int64}\", \"Bool\", \"Vector{String}\")`" -":hyperparameter_ranges" = "`(nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing)`" +":hyperparameters" = "`(:test, :num_round, :booster, :disable_default_eval_metric, :eta, :num_parallel_tree, :gamma, :max_depth, :min_child_weight, :max_delta_step, :subsample, :colsample_bytree, :colsample_bylevel, :colsample_bynode, :lambda, :alpha, :tree_method, :sketch_eps, :scale_pos_weight, :updater, :refresh_leaf, :process_type, :grow_policy, :max_leaves, :max_bin, :predictor, :sample_type, :normalize_type, :rate_drop, :one_drop, :skip_drop, :feature_selector, :top_k, :tweedie_variance_power, :objective, :base_score, :early_stopping_rounds, :watchlist, :nthread, :importance_type, :seed, :validate_parameters, 
:eval_metric)`" +":hyperparameter_types" = "`(\"Int64\", \"Int64\", \"String\", \"Union{Bool, Int64}\", \"Float64\", \"Int64\", \"Float64\", \"Int64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"Float64\", \"String\", \"Float64\", \"Float64\", \"Union{Nothing, String}\", \"Union{Bool, Int64}\", \"String\", \"String\", \"Int64\", \"Int64\", \"String\", \"String\", \"String\", \"Float64\", \"Union{Bool, Int64}\", \"Float64\", \"String\", \"Int64\", \"Float64\", \"Any\", \"Float64\", \"Int64\", \"Any\", \"Int64\", \"String\", \"Union{Nothing, Int64}\", \"Bool\", \"Vector{String}\")`" +":hyperparameter_ranges" = "`(nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing)`" ":iteration_parameter" = "`nothing`" ":supports_training_losses" = "`false`" ":reports_feature_importances" = "`true`" @@ -6272,6 +6451,7 @@ ":predict_scitype" = "`Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}, AbstractMatrix{<:ScientificTypesBase.Continuous}}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "SymbolicRegression" ":package_license" = "Apache-2.0" @@ -6282,16 +6462,16 @@ ":supports_weights" = "`true`" ":supports_class_weights" = "`false`" ":supports_online" = "`false`" -":docstring" = "```\nMultitargetSRRegressor\n```\n\nA model type for constructing a Multi-Target Symbolic Regression via Evolutionary Search, based on [SymbolicRegression.jl](https://github.com/MilesCranmer/SymbolicRegression.jl), and implementing the MLJ model interface.\n\nFrom MLJ, the type can be imported using\n\n```\nMultitargetSRRegressor = @load MultitargetSRRegressor pkg=SymbolicRegression\n```\n\nDo `model = MultitargetSRRegressor()` to construct an instance with default hyper-parameters. Provide keyword arguments to override hyper-parameter defaults, as in `MultitargetSRRegressor(binary_operators=...)`.\n\nMulti-target Symbolic Regression regressor (`MultitargetSRRegressor`) conducts several searches for expressions that predict each target variable from a set of input variables. All data is assumed to be `Continuous`. The search is performed using an evolutionary algorithm. This algorithm is described in the paper https://arxiv.org/abs/2305.01582.\n\n# Training data\n\nIn MLJ or MLJBase, bind an instance `model` to data with\n\n```\nmach = machine(model, X, y)\n```\n\nOR\n\n```\nmach = machine(model, X, y, w)\n```\n\nHere:\n\n * `X` is any table of input features (eg, a `DataFrame`) whose columns are of scitype\n\n`Continuous`; check column scitypes with `schema(X)`. Variable names in discovered expressions will be taken from the column names of `X`, if available. Units in columns of `X` (use `DynamicQuantities` for units) will trigger dimensional analysis to be used.\n\n * `y` is the target, which can be any table of target variables whose element scitype is `Continuous`; check the scitype with `schema(y)`. 
Units in columns of `y` (use `DynamicQuantities` for units) will trigger dimensional analysis to be used.\n * `w` is the observation weights which can either be `nothing` (default) or an `AbstractVector` whoose element scitype is `Count` or `Continuous`. The same weights are used for all targets.\n\nTrain the machine using `fit!(mach)`, inspect the discovered expressions with `report(mach)`, and predict on new data with `predict(mach, Xnew)`. Note that unlike other regressors, symbolic regression stores a list of lists of trained models. The models chosen from each of these lists is defined by the function `selection_method` keyword argument, which by default balances accuracy and complexity. You can override this at prediction time by passing a named tuple with keys `data` and `idx`.\n\n# Hyper-parameters\n\n * `binary_operators`: Vector of binary operators (functions) to use. Each operator should be defined for two input scalars, and one output scalar. All operators need to be defined over the entire real line (excluding infinity - these are stopped before they are input), or return `NaN` where not defined. For speed, define it so it takes two reals of the same type as input, and outputs the same type. For the SymbolicUtils simplification backend, you will need to define a generic method of the operator so it takes arbitrary types.\n * `unary_operators`: Same, but for unary operators (one input scalar, gives an output scalar).\n * `constraints`: Array of pairs specifying size constraints for each operator. The constraints for a binary operator should be a 2-tuple (e.g., `(-1, -1)`) and the constraints for a unary operator should be an `Int`. A size constraint is a limit to the size of the subtree in each argument of an operator. e.g., `[(^)=>(-1, 3)]` means that the `^` operator can have arbitrary size (`-1`) in its left argument, but a maximum size of `3` in its right argument. Default is no constraints.\n * `batching`: Whether to evolve based on small mini-batches of data, rather than the entire dataset.\n * `batch_size`: What batch size to use if using batching.\n * `elementwise_loss`: What elementwise loss function to use. Can be one of the following losses, or any other loss of type `SupervisedLoss`. You can also pass a function that takes a scalar target (left argument), and scalar predicted (right argument), and returns a scalar. This will be averaged over the predicted data. If weights are supplied, your function should take a third argument for the weight scalar. Included losses: Regression: - `LPDistLoss{P}()`, - `L1DistLoss()`, - `L2DistLoss()` (mean square), - `LogitDistLoss()`, - `HuberLoss(d)`, - `L1EpsilonInsLoss(ϵ)`, - `L2EpsilonInsLoss(ϵ)`, - `PeriodicLoss(c)`, - `QuantileLoss(τ)`, Classification: - `ZeroOneLoss()`, - `PerceptronLoss()`, - `L1HingeLoss()`, - `SmoothedL1HingeLoss(γ)`, - `ModifiedHuberLoss()`, - `L2MarginLoss()`, - `ExpLoss()`, - `SigmoidLoss()`, - `DWDMarginLoss(q)`.\n * `loss_function`: Alternatively, you may redefine the loss used as any function of `tree::Node{T}`, `dataset::Dataset{T}`, and `options::Options`, so long as you output a non-negative scalar of type `T`. This is useful if you want to use a loss that takes into account derivatives, or correlations across the dataset. This also means you could use a custom evaluation for a particular expression. 
If you are using `batching=true`, then your function should accept a fourth argument `idx`, which is either `nothing` (indicating that the full dataset should be used), or a vector of indices to use for the batch. For example,\n\n ```\n function my_loss(tree, dataset::Dataset{T,L}, options)::L where {T,L}\n prediction, flag = eval_tree_array(tree, dataset.X, options)\n if !flag\n return L(Inf)\n end\n return sum((prediction .- dataset.y) .^ 2) / dataset.n\n end\n ```\n * `populations`: How many populations of equations to use.\n * `population_size`: How many equations in each population.\n * `ncycles_per_iteration`: How many generations to consider per iteration.\n * `tournament_selection_n`: Number of expressions considered in each tournament.\n * `tournament_selection_p`: The fittest expression in a tournament is to be selected with probability `p`, the next fittest with probability `p*(1-p)`, and so forth.\n * `topn`: Number of equations to return to the host process, and to consider for the hall of fame.\n * `complexity_of_operators`: What complexity should be assigned to each operator, and the occurrence of a constant or variable. By default, this is 1 for all operators. Can be a real number as well, in which case the complexity of an expression will be rounded to the nearest integer. Input this in the form of, e.g., [(^) => 3, sin => 2].\n * `complexity_of_constants`: What complexity should be assigned to use of a constant. By default, this is 1.\n * `complexity_of_variables`: What complexity should be assigned to each variable. By default, this is 1.\n * `alpha`: The probability of accepting an equation mutation during regularized evolution is given by exp(-delta_loss/(alpha * T)), where T goes from 1 to 0. Thus, alpha=infinite is the same as no annealing.\n * `maxsize`: Maximum size of equations during the search.\n * `maxdepth`: Maximum depth of equations during the search, by default this is set equal to the maxsize.\n * `parsimony`: A multiplicative factor for how much complexity is punished.\n * `dimensional_constraint_penalty`: An additive factor if the dimensional constraint is violated.\n * `use_frequency`: Whether to use a parsimony that adapts to the relative proportion of equations at each complexity; this will ensure that there are a balanced number of equations considered for every complexity.\n * `use_frequency_in_tournament`: Whether to use the adaptive parsimony described above inside the score, rather than just at the mutation accept/reject stage.\n * `adaptive_parsimony_scaling`: How much to scale the adaptive parsimony term in the loss. Increase this if the search is spending too much time optimizing the most complex equations.\n * `turbo`: Whether to use `LoopVectorization.@turbo` to evaluate expressions. This can be significantly faster, but is only compatible with certain operators. *Experimental!*\n * `migration`: Whether to migrate equations between processes.\n * `hof_migration`: Whether to migrate equations from the hall of fame to processes.\n * `fraction_replaced`: What fraction of each population to replace with migrated equations at the end of each cycle.\n * `fraction_replaced_hof`: What fraction to replace with hall of fame equations at the end of each cycle.\n * `should_simplify`: Whether to simplify equations. 
If you pass a custom objective, this will be set to `false`.\n * `should_optimize_constants`: Whether to use an optimization algorithm to periodically optimize constants in equations.\n * `optimizer_nrestarts`: How many different random starting positions to consider for optimization of constants.\n * `optimizer_algorithm`: Select algorithm to use for optimizing constants. Default is \"BFGS\", but \"NelderMead\" is also supported.\n * `optimizer_options`: General options for the constant optimization. For details we refer to the documentation on `Optim.Options` from the `Optim.jl` package. Options can be provided here as `NamedTuple`, e.g. `(iterations=16,)`, as a `Dict`, e.g. Dict(:x_tol => 1.0e-32,), or as an `Optim.Options` instance.\n * `output_file`: What file to store equations to, as a backup.\n * `perturbation_factor`: When mutating a constant, either multiply or divide by (1+perturbation_factor)^(rand()+1).\n * `probability_negate_constant`: Probability of negating a constant in the equation when mutating it.\n * `mutation_weights`: Relative probabilities of the mutations. The struct `MutationWeights` should be passed to these options. See its documentation on `MutationWeights` for the different weights.\n * `crossover_probability`: Probability of performing crossover.\n * `annealing`: Whether to use simulated annealing.\n * `warmup_maxsize_by`: Whether to slowly increase the max size from 5 up to `maxsize`. If nonzero, specifies the fraction through the search at which the maxsize should be reached.\n * `verbosity`: Whether to print debugging statements or not.\n * `print_precision`: How many digits to print when printing equations. By default, this is 5.\n * `save_to_file`: Whether to save equations to a file during the search.\n * `bin_constraints`: See `constraints`. This is the same, but specified for binary operators only (for example, if you have an operator that is both a binary and unary operator).\n * `una_constraints`: Likewise, for unary operators.\n * `seed`: What random seed to use. `nothing` uses no seed.\n * `progress`: Whether to use a progress bar output (`verbosity` will have no effect).\n * `early_stop_condition`: Float - whether to stop early if the mean loss gets below this value. Function - a function taking (loss, complexity) as arguments and returning true or false.\n * `timeout_in_seconds`: Float64 - the time in seconds after which to exit (as an alternative to the number of iterations).\n * `max_evals`: Int (or Nothing) - the maximum number of evaluations of expressions to perform.\n * `skip_mutation_failures`: Whether to simply skip over mutations that fail or are rejected, rather than to replace the mutated expression with the original expression and proceed normally.\n * `enable_autodiff`: Whether to enable automatic differentiation functionality. This is turned off by default. If turned on, this will be turned off if one of the operators does not have well-defined gradients.\n * `nested_constraints`: Specifies how many times a combination of operators can be nested. For example, `[sin => [cos => 0], cos => [cos => 2]]` specifies that `cos` may never appear within a `sin`, but `sin` can be nested with itself an unlimited number of times. The second term specifies that `cos` can be nested up to 2 times within a `cos`, so that `cos(cos(cos(x)))` is allowed (as well as any combination of `+` or `-` within it), but `cos(cos(cos(cos(x))))` is not allowed. When an operator is not specified, it is assumed that it can be nested an unlimited number of times. 
This requires that there is no operator which is used both in the unary operators and the binary operators (e.g., `-` could be both subtract, and negation). For binary operators, both arguments are treated the same way, and the max of each argument is constrained.\n * `deterministic`: Use a global counter for the birth time, rather than calls to `time()`. This gives perfect resolution, and is therefore deterministic. However, it is not thread safe, and must be used in serial mode.\n * `define_helper_functions`: Whether to define helper functions for constructing and evaluating trees.\n * `niterations::Int=10`: The number of iterations to perform the search. More iterations will improve the results.\n * `parallelism=:multithreading`: What parallelism mode to use. The options are `:multithreading`, `:multiprocessing`, and `:serial`. By default, multithreading will be used. Multithreading uses less memory, but multiprocessing can handle multi-node compute. If using `:multithreading` mode, the number of threads available to julia are used. If using `:multiprocessing`, `numprocs` processes will be created dynamically if `procs` is unset. If you have already allocated processes, pass them to the `procs` argument and they will be used. You may also pass a string instead of a symbol, like `\"multithreading\"`.\n * `numprocs::Union{Int, Nothing}=nothing`: The number of processes to use, if you want `equation_search` to set this up automatically. By default this will be `4`, but can be any number (you should pick a number <= the number of cores available).\n * `procs::Union{Vector{Int}, Nothing}=nothing`: If you have set up a distributed run manually with `procs = addprocs()` and `@everywhere`, pass the `procs` to this keyword argument.\n * `addprocs_function::Union{Function, Nothing}=nothing`: If using multiprocessing (`parallelism=:multithreading`), and are not passing `procs` manually, then they will be allocated dynamically using `addprocs`. However, you may also pass a custom function to use instead of `addprocs`. This function should take a single positional argument, which is the number of processes to use, as well as the `lazy` keyword argument. For example, if set up on a slurm cluster, you could pass `addprocs_function = addprocs_slurm`, which will set up slurm processes.\n * `heap_size_hint_in_bytes::Union{Int,Nothing}=nothing`: On Julia 1.9+, you may set the `--heap-size-hint` flag on Julia processes, recommending garbage collection once a process is close to the recommended size. This is important for long-running distributed jobs where each process has an independent memory, and can help avoid out-of-memory errors. By default, this is set to `Sys.free_memory() / numprocs`.\n * `runtests::Bool=true`: Whether to run (quick) tests before starting the search, to see if there will be any problems during the equation search related to the host environment.\n * `loss_type::Type=Nothing`: If you would like to use a different type for the loss than for the data you passed, specify the type here. Note that if you pass complex data `::Complex{L}`, then the loss type will automatically be set to `L`.\n * `selection_method::Function`: Function to selection expression from the Pareto frontier for use in `predict`. See `SymbolicRegression.MLJInterfaceModule.choose_best` for an example. This function should return a single integer specifying the index of the expression to use. 
By default, this maximizes the score (a pound-for-pound rating) of expressions reaching the threshold of 1.5x the minimum loss. To override this at prediction time, you can pass a named tuple with keys `data` and `idx` to `predict`. See the Operations section for details.\n * `dimensions_type::AbstractDimensions`: The type of dimensions to use when storing the units of the data. By default this is `DynamicQuantities.SymbolicDimensions`.\n\n# Operations\n\n * `predict(mach, Xnew)`: Return predictions of the target given features `Xnew`, which should have same scitype as `X` above. The expression used for prediction is defined by the `selection_method` function, which can be seen by viewing `report(mach).best_idx`.\n * `predict(mach, (data=Xnew, idx=i))`: Return predictions of the target given features `Xnew`, which should have same scitype as `X` above. By passing a named tuple with keys `data` and `idx`, you are able to specify the equation you wish to evaluate in `idx`.\n\n# Fitted parameters\n\nThe fields of `fitted_params(mach)` are:\n\n * `best_idx::Vector{Int}`: The index of the best expression in each Pareto frontier, as determined by the `selection_method` function. Override in `predict` by passing a named tuple with keys `data` and `idx`.\n * `equations::Vector{Vector{Node{T}}}`: The expressions discovered by the search, represented in a dominating Pareto frontier (i.e., the best expressions found for each complexity). The outer vector is indexed by target variable, and the inner vector is ordered by increasing complexity. `T` is equal to the element type of the passed data.\n * `equation_strings::Vector{Vector{String}}`: The expressions discovered by the search, represented as strings for easy inspection.\n\n# Report\n\nThe fields of `report(mach)` are:\n\n * `best_idx::Vector{Int}`: The index of the best expression in each Pareto frontier, as determined by the `selection_method` function. Override in `predict` by passing a named tuple with keys `data` and `idx`.\n * `equations::Vector{Vector{Node{T}}}`: The expressions discovered by the search, represented in a dominating Pareto frontier (i.e., the best expressions found for each complexity). The outer vector is indexed by target variable, and the inner vector is ordered by increasing complexity.\n * `equation_strings::Vector{Vector{String}}`: The expressions discovered by the search, represented as strings for easy inspection.\n * `complexities::Vector{Vector{Int}}`: The complexity of each expression in each Pareto frontier.\n * `losses::Vector{Vector{L}}`: The loss of each expression in each Pareto frontier, according to the loss function specified in the model. The type `L` is the loss type, which is usually the same as the element type of data passed (i.e., `T`), but can differ if complex data types are passed.\n * `scores::Vector{Vector{L}}`: A metric which considers both the complexity and loss of an expression, equal to the change in the log-loss divided by the change in complexity, relative to the previous expression along the Pareto frontier. A larger score aims to indicate an expression is more likely to be the true expression generating the data, but this is very problem-dependent and generally several other factors should be considered.\n\n# Examples\n\n```julia\nusing MLJ\nMultitargetSRRegressor = @load MultitargetSRRegressor pkg=SymbolicRegression\nX = (a=rand(100), b=rand(100), c=rand(100))\nY = (y1=(@. cos(X.c) * 2.1 - 0.9), y2=(@. 
X.a * X.b + X.c))\nmodel = MultitargetSRRegressor(binary_operators=[+, -, *], unary_operators=[exp], niterations=100)\nmach = machine(model, X, Y)\nfit!(mach)\ny_hat = predict(mach, X)\n# View the equations used:\nr = report(mach)\nfor (output_index, (eq, i)) in enumerate(zip(r.equation_strings, r.best_idx))\n println(\"Equation used for \", output_index, \": \", eq[i])\nend\n```\n\nSee also [`SRRegressor`](@ref).\n" +":docstring" = "```\nMultitargetSRRegressor\n```\n\nA model type for constructing a Multi-Target Symbolic Regression via Evolutionary Search, based on [SymbolicRegression.jl](https://github.com/MilesCranmer/SymbolicRegression.jl), and implementing the MLJ model interface.\n\nFrom MLJ, the type can be imported using\n\n```\nMultitargetSRRegressor = @load MultitargetSRRegressor pkg=SymbolicRegression\n```\n\nDo `model = MultitargetSRRegressor()` to construct an instance with default hyper-parameters. Provide keyword arguments to override hyper-parameter defaults, as in `MultitargetSRRegressor(binary_operators=...)`.\n\nMulti-target Symbolic Regression regressor (`MultitargetSRRegressor`) conducts several searches for expressions that predict each target variable from a set of input variables. All data is assumed to be `Continuous`. The search is performed using an evolutionary algorithm. This algorithm is described in the paper https://arxiv.org/abs/2305.01582.\n\n# Training data\n\nIn MLJ or MLJBase, bind an instance `model` to data with\n\n```\nmach = machine(model, X, y)\n```\n\nOR\n\n```\nmach = machine(model, X, y, w)\n```\n\nHere:\n\n * `X` is any table of input features (eg, a `DataFrame`) whose columns are of scitype `Continuous`; check column scitypes with `schema(X)`. Variable names in discovered expressions will be taken from the column names of `X`, if available. Units in columns of `X` (use `DynamicQuantities` for units) will trigger dimensional analysis to be used.\n * `y` is the target, which can be any table of target variables whose element scitype is `Continuous`; check the scitype with `schema(y)`. Units in columns of `y` (use `DynamicQuantities` for units) will trigger dimensional analysis to be used.\n * `w` is the observation weights, which can either be `nothing` (default) or an `AbstractVector` whose element scitype is `Count` or `Continuous`. The same weights are used for all targets.\n\nTrain the machine using `fit!(mach)`, inspect the discovered expressions with `report(mach)`, and predict on new data with `predict(mach, Xnew)`. Note that unlike other regressors, symbolic regression stores a list of lists of trained models. The model chosen from each of these lists is determined by the `selection_method` keyword argument, which by default balances accuracy and complexity. You can override this at prediction time by passing a named tuple with keys `data` and `idx`.\n\n# Hyper-parameters\n\n * `binary_operators`: Vector of binary operators (functions) to use. Each operator should be defined for two input scalars, and one output scalar. All operators need to be defined over the entire real line (excluding infinity - these are stopped before they are input), or return `NaN` where not defined. For speed, define it so it takes two reals of the same type as input, and outputs the same type. 
For the SymbolicUtils simplification backend, you will need to define a generic method of the operator so it takes arbitrary types.\n * `unary_operators`: Same, but for unary operators (one input scalar, gives an output scalar).\n * `constraints`: Array of pairs specifying size constraints for each operator. The constraints for a binary operator should be a 2-tuple (e.g., `(-1, -1)`) and the constraints for a unary operator should be an `Int`. A size constraint is a limit to the size of the subtree in each argument of an operator. e.g., `[(^)=>(-1, 3)]` means that the `^` operator can have arbitrary size (`-1`) in its left argument, but a maximum size of `3` in its right argument. Default is no constraints.\n * `batching`: Whether to evolve based on small mini-batches of data, rather than the entire dataset.\n * `batch_size`: What batch size to use if using batching.\n * `elementwise_loss`: What elementwise loss function to use. Can be one of the following losses, or any other loss of type `SupervisedLoss`. You can also pass a function that takes a scalar target (left argument), and scalar predicted (right argument), and returns a scalar. This will be averaged over the predicted data. If weights are supplied, your function should take a third argument for the weight scalar. Included losses: Regression: - `LPDistLoss{P}()`, - `L1DistLoss()`, - `L2DistLoss()` (mean square), - `LogitDistLoss()`, - `HuberLoss(d)`, - `L1EpsilonInsLoss(ϵ)`, - `L2EpsilonInsLoss(ϵ)`, - `PeriodicLoss(c)`, - `QuantileLoss(τ)`, Classification: - `ZeroOneLoss()`, - `PerceptronLoss()`, - `L1HingeLoss()`, - `SmoothedL1HingeLoss(γ)`, - `ModifiedHuberLoss()`, - `L2MarginLoss()`, - `ExpLoss()`, - `SigmoidLoss()`, - `DWDMarginLoss(q)`.\n * `loss_function`: Alternatively, you may redefine the loss used as any function of `tree::AbstractExpressionNode{T}`, `dataset::Dataset{T}`, and `options::Options`, so long as you output a non-negative scalar of type `T`. This is useful if you want to use a loss that takes into account derivatives, or correlations across the dataset. This also means you could use a custom evaluation for a particular expression. If you are using `batching=true`, then your function should accept a fourth argument `idx`, which is either `nothing` (indicating that the full dataset should be used), or a vector of indices to use for the batch. For example,\n\n ```\n function my_loss(tree, dataset::Dataset{T,L}, options)::L where {T,L}\n prediction, flag = eval_tree_array(tree, dataset.X, options)\n if !flag\n return L(Inf)\n end\n return sum((prediction .- dataset.y) .^ 2) / dataset.n\n end\n ```\n * `node_type::Type{N}=Node`: The type of node to use for the search. For example, `Node` or `GraphNode`.\n * `populations`: How many populations of equations to use.\n * `population_size`: How many equations in each population.\n * `ncycles_per_iteration`: How many generations to consider per iteration.\n * `tournament_selection_n`: Number of expressions considered in each tournament.\n * `tournament_selection_p`: The fittest expression in a tournament is to be selected with probability `p`, the next fittest with probability `p*(1-p)`, and so forth.\n * `topn`: Number of equations to return to the host process, and to consider for the hall of fame.\n * `complexity_of_operators`: What complexity should be assigned to each operator, and the occurrence of a constant or variable. By default, this is 1 for all operators. 
Can be a real number as well, in which case the complexity of an expression will be rounded to the nearest integer. Input this in the form of, e.g., [(^) => 3, sin => 2].\n * `complexity_of_constants`: What complexity should be assigned to use of a constant. By default, this is 1.\n * `complexity_of_variables`: What complexity should be assigned to use of a variable, which can also be a vector indicating different per-variable complexity. By default, this is 1.\n * `alpha`: The probability of accepting an equation mutation during regularized evolution is given by exp(-delta_loss/(alpha * T)), where T goes from 1 to 0. Thus, alpha=infinite is the same as no annealing.\n * `maxsize`: Maximum size of equations during the search.\n * `maxdepth`: Maximum depth of equations during the search, by default this is set equal to the maxsize.\n * `parsimony`: A multiplicative factor for how much complexity is punished.\n * `dimensional_constraint_penalty`: An additive factor if the dimensional constraint is violated.\n * `dimensionless_constants_only`: Whether to only allow dimensionless constants.\n * `use_frequency`: Whether to use a parsimony that adapts to the relative proportion of equations at each complexity; this will ensure that there are a balanced number of equations considered for every complexity.\n * `use_frequency_in_tournament`: Whether to use the adaptive parsimony described above inside the score, rather than just at the mutation accept/reject stage.\n * `adaptive_parsimony_scaling`: How much to scale the adaptive parsimony term in the loss. Increase this if the search is spending too much time optimizing the most complex equations.\n * `turbo`: Whether to use `LoopVectorization.@turbo` to evaluate expressions. This can be significantly faster, but is only compatible with certain operators. *Experimental!*\n * `bumper`: Whether to use Bumper.jl for faster evaluation. *Experimental!*\n * `migration`: Whether to migrate equations between processes.\n * `hof_migration`: Whether to migrate equations from the hall of fame to processes.\n * `fraction_replaced`: What fraction of each population to replace with migrated equations at the end of each cycle.\n * `fraction_replaced_hof`: What fraction to replace with hall of fame equations at the end of each cycle.\n * `should_simplify`: Whether to simplify equations. If you pass a custom objective, this will be set to `false`.\n * `should_optimize_constants`: Whether to use an optimization algorithm to periodically optimize constants in equations.\n * `optimizer_algorithm`: Select algorithm to use for optimizing constants. Default is `Optim.BFGS(linesearch=LineSearches.BackTracking())`.\n * `optimizer_nrestarts`: How many different random starting positions to consider for optimization of constants.\n * `optimizer_probability`: Probability of performing optimization of constants at the end of a given iteration.\n * `optimizer_iterations`: How many optimization iterations to perform. This gets passed to `Optim.Options` as `iterations`. The default is 8.\n * `optimizer_f_calls_limit`: How many function calls to allow during optimization. This gets passed to `Optim.Options` as `f_calls_limit`. The default is `0` which means no limit.\n * `optimizer_options`: General options for the constant optimization. For details we refer to the documentation on `Optim.Options` from the `Optim.jl` package. Options can be provided here as `NamedTuple`, e.g. `(iterations=16,)`, as a `Dict`, e.g. 
Dict(:x_tol => 1.0e-32,), or as an `Optim.Options` instance.\n * `output_file`: What file to store equations to, as a backup.\n * `perturbation_factor`: When mutating a constant, either multiply or divide by (1+perturbation_factor)^(rand()+1).\n * `probability_negate_constant`: Probability of negating a constant in the equation when mutating it.\n * `mutation_weights`: Relative probabilities of the mutations. The struct `MutationWeights` should be passed to these options. See its documentation on `MutationWeights` for the different weights.\n * `crossover_probability`: Probability of performing crossover.\n * `annealing`: Whether to use simulated annealing.\n * `warmup_maxsize_by`: Whether to slowly increase the max size from 5 up to `maxsize`. If nonzero, specifies the fraction through the search at which the maxsize should be reached.\n * `verbosity`: Whether to print debugging statements or not.\n * `print_precision`: How many digits to print when printing equations. By default, this is 5.\n * `save_to_file`: Whether to save equations to a file during the search.\n * `bin_constraints`: See `constraints`. This is the same, but specified for binary operators only (for example, if you have an operator that is both a binary and unary operator).\n * `una_constraints`: Likewise, for unary operators.\n * `seed`: What random seed to use. `nothing` uses no seed.\n * `progress`: Whether to use a progress bar output (`verbosity` will have no effect).\n * `early_stop_condition`: Float - whether to stop early if the mean loss gets below this value. Function - a function taking (loss, complexity) as arguments and returning true or false.\n * `timeout_in_seconds`: Float64 - the time in seconds after which to exit (as an alternative to the number of iterations).\n * `max_evals`: Int (or Nothing) - the maximum number of evaluations of expressions to perform.\n * `skip_mutation_failures`: Whether to simply skip over mutations that fail or are rejected, rather than to replace the mutated expression with the original expression and proceed normally.\n * `nested_constraints`: Specifies how many times a combination of operators can be nested. For example, `[sin => [cos => 0], cos => [cos => 2]]` specifies that `cos` may never appear within a `sin`, but `sin` can be nested with itself an unlimited number of times. The second term specifies that `cos` can be nested up to 2 times within a `cos`, so that `cos(cos(cos(x)))` is allowed (as well as any combination of `+` or `-` within it), but `cos(cos(cos(cos(x))))` is not allowed. When an operator is not specified, it is assumed that it can be nested an unlimited number of times. This requires that there is no operator which is used both in the unary operators and the binary operators (e.g., `-` could be both subtract, and negation). For binary operators, both arguments are treated the same way, and the max of each argument is constrained.\n * `deterministic`: Use a global counter for the birth time, rather than calls to `time()`. This gives perfect resolution, and is therefore deterministic. However, it is not thread safe, and must be used in serial mode.\n * `define_helper_functions`: Whether to define helper functions for constructing and evaluating trees.\n * `niterations::Int=10`: The number of iterations to perform the search. More iterations will improve the results.\n * `parallelism=:multithreading`: What parallelism mode to use. The options are `:multithreading`, `:multiprocessing`, and `:serial`. By default, multithreading will be used. 
Multithreading uses less memory, but multiprocessing can handle multi-node compute. If using `:multithreading` mode, all threads available to Julia are used. If using `:multiprocessing`, `numprocs` processes will be created dynamically if `procs` is unset. If you have already allocated processes, pass them to the `procs` argument and they will be used. You may also pass a string instead of a symbol, like `\"multithreading\"`.\n * `numprocs::Union{Int, Nothing}=nothing`: The number of processes to use, if you want `equation_search` to set this up automatically. By default this will be `4`, but can be any number (you should pick a number <= the number of cores available).\n * `procs::Union{Vector{Int}, Nothing}=nothing`: If you have set up a distributed run manually with `procs = addprocs()` and `@everywhere`, pass the `procs` to this keyword argument.\n * `addprocs_function::Union{Function, Nothing}=nothing`: If using multiprocessing (`parallelism=:multiprocessing`), and you are not passing `procs` manually, then processes will be allocated dynamically using `addprocs`. However, you may also pass a custom function to use instead of `addprocs`. This function should take a single positional argument, which is the number of processes to use, as well as the `lazy` keyword argument. For example, if set up on a slurm cluster, you could pass `addprocs_function = addprocs_slurm`, which will set up slurm processes.\n * `heap_size_hint_in_bytes::Union{Int,Nothing}=nothing`: On Julia 1.9+, you may set the `--heap-size-hint` flag on Julia processes, recommending garbage collection once a process is close to the recommended size. This is important for long-running distributed jobs where each process has an independent memory, and can help avoid out-of-memory errors. By default, this is set to `Sys.free_memory() / numprocs`.\n * `runtests::Bool=true`: Whether to run (quick) tests before starting the search, to see if there will be any problems during the equation search related to the host environment.\n * `loss_type::Type=Nothing`: If you would like to use a different type for the loss than for the data you passed, specify the type here. Note that if you pass complex data `::Complex{L}`, then the loss type will automatically be set to `L`.\n * `selection_method::Function`: Function to select an expression from the Pareto frontier for use in `predict`. See `SymbolicRegression.MLJInterfaceModule.choose_best` for an example. This function should return a single integer specifying the index of the expression to use. By default, this maximizes the score (a pound-for-pound rating) of expressions reaching the threshold of 1.5x the minimum loss. To override this at prediction time, you can pass a named tuple with keys `data` and `idx` to `predict`. See the Operations section for details.\n * `dimensions_type::AbstractDimensions`: The type of dimensions to use when storing the units of the data. By default this is `DynamicQuantities.SymbolicDimensions`.\n\n# Operations\n\n * `predict(mach, Xnew)`: Return predictions of the target given features `Xnew`, which should have the same scitype as `X` above. The expression used for prediction is defined by the `selection_method` function, which can be seen by viewing `report(mach).best_idx`.\n * `predict(mach, (data=Xnew, idx=i))`: Return predictions of the target given features `Xnew`, which should have the same scitype as `X` above. 
By passing a named tuple with keys `data` and `idx`, you are able to specify the equation you wish to evaluate in `idx`.\n\n# Fitted parameters\n\nThe fields of `fitted_params(mach)` are:\n\n * `best_idx::Vector{Int}`: The index of the best expression in each Pareto frontier, as determined by the `selection_method` function. Override in `predict` by passing a named tuple with keys `data` and `idx`.\n * `equations::Vector{Vector{Node{T}}}`: The expressions discovered by the search, represented in a dominating Pareto frontier (i.e., the best expressions found for each complexity). The outer vector is indexed by target variable, and the inner vector is ordered by increasing complexity. `T` is equal to the element type of the passed data.\n * `equation_strings::Vector{Vector{String}}`: The expressions discovered by the search, represented as strings for easy inspection.\n\n# Report\n\nThe fields of `report(mach)` are:\n\n * `best_idx::Vector{Int}`: The index of the best expression in each Pareto frontier, as determined by the `selection_method` function. Override in `predict` by passing a named tuple with keys `data` and `idx`.\n * `equations::Vector{Vector{Node{T}}}`: The expressions discovered by the search, represented in a dominating Pareto frontier (i.e., the best expressions found for each complexity). The outer vector is indexed by target variable, and the inner vector is ordered by increasing complexity.\n * `equation_strings::Vector{Vector{String}}`: The expressions discovered by the search, represented as strings for easy inspection.\n * `complexities::Vector{Vector{Int}}`: The complexity of each expression in each Pareto frontier.\n * `losses::Vector{Vector{L}}`: The loss of each expression in each Pareto frontier, according to the loss function specified in the model. The type `L` is the loss type, which is usually the same as the element type of data passed (i.e., `T`), but can differ if complex data types are passed.\n * `scores::Vector{Vector{L}}`: A metric which considers both the complexity and loss of an expression, equal to the change in the log-loss divided by the change in complexity, relative to the previous expression along the Pareto frontier. A larger score aims to indicate an expression is more likely to be the true expression generating the data, but this is very problem-dependent and generally several other factors should be considered.\n\n# Examples\n\n```julia\nusing MLJ\nMultitargetSRRegressor = @load MultitargetSRRegressor pkg=SymbolicRegression\nX = (a=rand(100), b=rand(100), c=rand(100))\nY = (y1=(@. cos(X.c) * 2.1 - 0.9), y2=(@. 
X.a * X.b + X.c))\nmodel = MultitargetSRRegressor(binary_operators=[+, -, *], unary_operators=[exp], niterations=100)\nmach = machine(model, X, Y)\nfit!(mach)\ny_hat = predict(mach, X)\n# View the equations used:\nr = report(mach)\nfor (output_index, (eq, i)) in enumerate(zip(r.equation_strings, r.best_idx))\n println(\"Equation used for \", output_index, \": \", eq[i])\nend\n```\n\nSee also [`SRRegressor`](@ref).\n" ":name" = "MultitargetSRRegressor" ":human_name" = "Multi-Target Symbolic Regression via Evolutionary Search" ":is_supervised" = "`true`" ":prediction_type" = ":deterministic" ":abstract_type" = "`MLJModelInterface.Deterministic`" ":implemented_methods" = [] -":hyperparameters" = "`(:binary_operators, :unary_operators, :constraints, :elementwise_loss, :loss_function, :tournament_selection_n, :tournament_selection_p, :topn, :complexity_of_operators, :complexity_of_constants, :complexity_of_variables, :parsimony, :dimensional_constraint_penalty, :alpha, :maxsize, :maxdepth, :turbo, :migration, :hof_migration, :should_simplify, :should_optimize_constants, :output_file, :populations, :perturbation_factor, :annealing, :batching, :batch_size, :mutation_weights, :crossover_probability, :warmup_maxsize_by, :use_frequency, :use_frequency_in_tournament, :adaptive_parsimony_scaling, :population_size, :ncycles_per_iteration, :fraction_replaced, :fraction_replaced_hof, :verbosity, :print_precision, :save_to_file, :probability_negate_constant, :seed, :bin_constraints, :una_constraints, :progress, :terminal_width, :optimizer_algorithm, :optimizer_nrestarts, :optimizer_probability, :optimizer_iterations, :optimizer_options, :val_recorder, :recorder_file, :early_stop_condition, :timeout_in_seconds, :max_evals, :skip_mutation_failures, :enable_autodiff, :nested_constraints, :deterministic, :define_helper_functions, :fast_cycle, :npopulations, :npop, :niterations, :parallelism, :numprocs, :procs, :addprocs_function, :heap_size_hint_in_bytes, :runtests, :loss_type, :selection_method, :dimensions_type)`" -":hyperparameter_types" = "`(\"Any\", \"Any\", \"Any\", \"Union{Nothing, Function, LossFunctions.Traits.SupervisedLoss}\", \"Union{Nothing, Function}\", \"Integer\", \"Real\", \"Integer\", \"Any\", \"Union{Nothing, Real}\", \"Union{Nothing, Real}\", \"Real\", \"Union{Nothing, Real}\", \"Real\", \"Integer\", \"Union{Nothing, Integer}\", \"Bool\", \"Bool\", \"Bool\", \"Union{Nothing, Bool}\", \"Bool\", \"Union{Nothing, AbstractString}\", \"Integer\", \"Real\", \"Bool\", \"Bool\", \"Integer\", \"Union{SymbolicRegression.CoreModule.OptionsStructModule.MutationWeights, NamedTuple, AbstractVector}\", \"Real\", \"Real\", \"Bool\", \"Bool\", \"Real\", \"Integer\", \"Integer\", \"Real\", \"Real\", \"Union{Nothing, Integer}\", \"Integer\", \"Bool\", \"Real\", \"Any\", \"Any\", \"Any\", \"Union{Nothing, Bool}\", \"Union{Nothing, Integer}\", \"AbstractString\", \"Integer\", \"Real\", \"Union{Nothing, Integer}\", \"Union{Nothing, Dict, NamedTuple, Optim.Options}\", \"Val\", \"AbstractString\", \"Union{Nothing, Function, Real}\", \"Union{Nothing, Real}\", \"Union{Nothing, Integer}\", \"Bool\", \"Bool\", \"Any\", \"Bool\", \"Bool\", \"Bool\", \"Union{Nothing, Integer}\", \"Union{Nothing, Integer}\", \"Int64\", \"Symbol\", \"Union{Nothing, Int64}\", \"Union{Nothing, Vector{Int64}}\", \"Union{Nothing, Function}\", \"Union{Nothing, Integer}\", \"Bool\", \"Any\", \"Function\", \"Type{D} where D<:DynamicQuantities.AbstractDimensions\")`" -":hyperparameter_ranges" = "`(nothing, nothing, nothing, nothing, nothing, 
nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing)`" +":hyperparameters" = "`(:binary_operators, :unary_operators, :constraints, :elementwise_loss, :loss_function, :tournament_selection_n, :tournament_selection_p, :topn, :complexity_of_operators, :complexity_of_constants, :complexity_of_variables, :parsimony, :dimensional_constraint_penalty, :dimensionless_constants_only, :alpha, :maxsize, :maxdepth, :turbo, :bumper, :migration, :hof_migration, :should_simplify, :should_optimize_constants, :output_file, :node_type, :populations, :perturbation_factor, :annealing, :batching, :batch_size, :mutation_weights, :crossover_probability, :warmup_maxsize_by, :use_frequency, :use_frequency_in_tournament, :adaptive_parsimony_scaling, :population_size, :ncycles_per_iteration, :fraction_replaced, :fraction_replaced_hof, :verbosity, :print_precision, :save_to_file, :probability_negate_constant, :seed, :bin_constraints, :una_constraints, :progress, :terminal_width, :optimizer_algorithm, :optimizer_nrestarts, :optimizer_probability, :optimizer_iterations, :optimizer_f_calls_limit, :optimizer_options, :use_recorder, :recorder_file, :early_stop_condition, :timeout_in_seconds, :max_evals, :skip_mutation_failures, :nested_constraints, :deterministic, :define_helper_functions, :fast_cycle, :npopulations, :npop, :niterations, :parallelism, :numprocs, :procs, :addprocs_function, :heap_size_hint_in_bytes, :runtests, :loss_type, :selection_method, :dimensions_type)`" +":hyperparameter_types" = "`(\"Any\", \"Any\", \"Any\", \"Union{Nothing, Function, LossFunctions.Traits.SupervisedLoss}\", \"Union{Nothing, Function}\", \"Integer\", \"Real\", \"Integer\", \"Any\", \"Union{Nothing, Real}\", \"Union{Nothing, Real, AbstractVector}\", \"Real\", \"Union{Nothing, Real}\", \"Bool\", \"Real\", \"Integer\", \"Union{Nothing, Integer}\", \"Bool\", \"Bool\", \"Bool\", \"Bool\", \"Union{Nothing, Bool}\", \"Bool\", \"Union{Nothing, AbstractString}\", \"Type\", \"Integer\", \"Real\", \"Bool\", \"Bool\", \"Integer\", \"Union{SymbolicRegression.CoreModule.MutationWeightsModule.MutationWeights, NamedTuple, AbstractVector}\", \"Real\", \"Real\", \"Bool\", \"Bool\", \"Real\", \"Integer\", \"Integer\", \"Real\", \"Real\", \"Union{Nothing, Integer}\", \"Integer\", \"Bool\", \"Real\", \"Any\", \"Any\", \"Any\", \"Union{Nothing, Bool}\", \"Union{Nothing, Integer}\", \"Union{AbstractString, Optim.AbstractOptimizer}\", \"Integer\", \"Real\", \"Union{Nothing, Integer}\", \"Union{Nothing, Integer}\", \"Union{Nothing, Dict, NamedTuple, Optim.Options}\", \"Bool\", \"AbstractString\", \"Union{Nothing, Function, Real}\", \"Union{Nothing, Real}\", \"Union{Nothing, Integer}\", \"Bool\", \"Any\", \"Bool\", \"Bool\", \"Bool\", \"Union{Nothing, Integer}\", \"Union{Nothing, Integer}\", \"Int64\", \"Symbol\", \"Union{Nothing, Int64}\", \"Union{Nothing, Vector{Int64}}\", \"Union{Nothing, Function}\", \"Union{Nothing, Integer}\", \"Bool\", \"Any\", \"Function\", \"Type{D} where 
D<:DynamicQuantities.AbstractDimensions\")`" +":hyperparameter_ranges" = "`(nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing)`" ":iteration_parameter" = "`nothing`" ":supports_training_losses" = "`false`" ":reports_feature_importances" = "`false`" @@ -6307,6 +6487,7 @@ ":predict_scitype" = "`AbstractVector{<:ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "SymbolicRegression" ":package_license" = "Apache-2.0" @@ -6317,16 +6498,16 @@ ":supports_weights" = "`true`" ":supports_class_weights" = "`false`" ":supports_online" = "`false`" -":docstring" = "```\nSRRegressor\n```\n\nA model type for constructing a Symbolic Regression via Evolutionary Search, based on [SymbolicRegression.jl](https://github.com/MilesCranmer/SymbolicRegression.jl), and implementing the MLJ model interface.\n\nFrom MLJ, the type can be imported using\n\n```\nSRRegressor = @load SRRegressor pkg=SymbolicRegression\n```\n\nDo `model = SRRegressor()` to construct an instance with default hyper-parameters. Provide keyword arguments to override hyper-parameter defaults, as in `SRRegressor(binary_operators=...)`.\n\nSingle-target Symbolic Regression regressor (`SRRegressor`) searches for symbolic expressions that predict a single target variable from a set of input variables. All data is assumed to be `Continuous`. The search is performed using an evolutionary algorithm. This algorithm is described in the paper https://arxiv.org/abs/2305.01582.\n\n# Training data\n\nIn MLJ or MLJBase, bind an instance `model` to data with\n\n```\nmach = machine(model, X, y)\n```\n\nOR\n\n```\nmach = machine(model, X, y, w)\n```\n\nHere:\n\n * `X` is any table of input features (eg, a `DataFrame`) whose columns are of scitype `Continuous`; check column scitypes with `schema(X)`. Variable names in discovered expressions will be taken from the column names of `X`, if available. Units in columns of `X` (use `DynamicQuantities` for units) will trigger dimensional analysis to be used.\n * `y` is the target, which can be any `AbstractVector` whose element scitype is `Continuous`; check the scitype with `scitype(y)`. Units in `y` (use `DynamicQuantities` for units) will trigger dimensional analysis to be used.\n * `w` is the observation weights which can either be `nothing` (default) or an `AbstractVector` whoose element scitype is `Count` or `Continuous`.\n\nTrain the machine using `fit!(mach)`, inspect the discovered expressions with `report(mach)`, and predict on new data with `predict(mach, Xnew)`. Note that unlike other regressors, symbolic regression stores a list of trained models. The model chosen from this list is defined by the function `selection_method` keyword argument, which by default balances accuracy and complexity. 
You can override this at prediction time by passing a named tuple with keys `data` and `idx`.\n\n# Hyper-parameters\n\n * `binary_operators`: Vector of binary operators (functions) to use. Each operator should be defined for two input scalars, and one output scalar. All operators need to be defined over the entire real line (excluding infinity - these are stopped before they are input), or return `NaN` where not defined. For speed, define it so it takes two reals of the same type as input, and outputs the same type. For the SymbolicUtils simplification backend, you will need to define a generic method of the operator so it takes arbitrary types.\n * `unary_operators`: Same, but for unary operators (one input scalar, gives an output scalar).\n * `constraints`: Array of pairs specifying size constraints for each operator. The constraints for a binary operator should be a 2-tuple (e.g., `(-1, -1)`) and the constraints for a unary operator should be an `Int`. A size constraint is a limit to the size of the subtree in each argument of an operator. e.g., `[(^)=>(-1, 3)]` means that the `^` operator can have arbitrary size (`-1`) in its left argument, but a maximum size of `3` in its right argument. Default is no constraints.\n * `batching`: Whether to evolve based on small mini-batches of data, rather than the entire dataset.\n * `batch_size`: What batch size to use if using batching.\n * `elementwise_loss`: What elementwise loss function to use. Can be one of the following losses, or any other loss of type `SupervisedLoss`. You can also pass a function that takes a scalar target (left argument), and scalar predicted (right argument), and returns a scalar. This will be averaged over the predicted data. If weights are supplied, your function should take a third argument for the weight scalar. Included losses: Regression: - `LPDistLoss{P}()`, - `L1DistLoss()`, - `L2DistLoss()` (mean square), - `LogitDistLoss()`, - `HuberLoss(d)`, - `L1EpsilonInsLoss(ϵ)`, - `L2EpsilonInsLoss(ϵ)`, - `PeriodicLoss(c)`, - `QuantileLoss(τ)`, Classification: - `ZeroOneLoss()`, - `PerceptronLoss()`, - `L1HingeLoss()`, - `SmoothedL1HingeLoss(γ)`, - `ModifiedHuberLoss()`, - `L2MarginLoss()`, - `ExpLoss()`, - `SigmoidLoss()`, - `DWDMarginLoss(q)`.\n * `loss_function`: Alternatively, you may redefine the loss used as any function of `tree::Node{T}`, `dataset::Dataset{T}`, and `options::Options`, so long as you output a non-negative scalar of type `T`. This is useful if you want to use a loss that takes into account derivatives, or correlations across the dataset. This also means you could use a custom evaluation for a particular expression. If you are using `batching=true`, then your function should accept a fourth argument `idx`, which is either `nothing` (indicating that the full dataset should be used), or a vector of indices to use for the batch. 
For example,\n\n ```\n function my_loss(tree, dataset::Dataset{T,L}, options)::L where {T,L}\n prediction, flag = eval_tree_array(tree, dataset.X, options)\n if !flag\n return L(Inf)\n end\n return sum((prediction .- dataset.y) .^ 2) / dataset.n\n end\n ```\n * `populations`: How many populations of equations to use.\n * `population_size`: How many equations in each population.\n * `ncycles_per_iteration`: How many generations to consider per iteration.\n * `tournament_selection_n`: Number of expressions considered in each tournament.\n * `tournament_selection_p`: The fittest expression in a tournament is to be selected with probability `p`, the next fittest with probability `p*(1-p)`, and so forth.\n * `topn`: Number of equations to return to the host process, and to consider for the hall of fame.\n * `complexity_of_operators`: What complexity should be assigned to each operator, and the occurrence of a constant or variable. By default, this is 1 for all operators. Can be a real number as well, in which case the complexity of an expression will be rounded to the nearest integer. Input this in the form of, e.g., [(^) => 3, sin => 2].\n * `complexity_of_constants`: What complexity should be assigned to use of a constant. By default, this is 1.\n * `complexity_of_variables`: What complexity should be assigned to each variable. By default, this is 1.\n * `alpha`: The probability of accepting an equation mutation during regularized evolution is given by exp(-delta_loss/(alpha * T)), where T goes from 1 to 0. Thus, alpha=infinite is the same as no annealing.\n * `maxsize`: Maximum size of equations during the search.\n * `maxdepth`: Maximum depth of equations during the search, by default this is set equal to the maxsize.\n * `parsimony`: A multiplicative factor for how much complexity is punished.\n * `dimensional_constraint_penalty`: An additive factor if the dimensional constraint is violated.\n * `use_frequency`: Whether to use a parsimony that adapts to the relative proportion of equations at each complexity; this will ensure that there are a balanced number of equations considered for every complexity.\n * `use_frequency_in_tournament`: Whether to use the adaptive parsimony described above inside the score, rather than just at the mutation accept/reject stage.\n * `adaptive_parsimony_scaling`: How much to scale the adaptive parsimony term in the loss. Increase this if the search is spending too much time optimizing the most complex equations.\n * `turbo`: Whether to use `LoopVectorization.@turbo` to evaluate expressions. This can be significantly faster, but is only compatible with certain operators. *Experimental!*\n * `migration`: Whether to migrate equations between processes.\n * `hof_migration`: Whether to migrate equations from the hall of fame to processes.\n * `fraction_replaced`: What fraction of each population to replace with migrated equations at the end of each cycle.\n * `fraction_replaced_hof`: What fraction to replace with hall of fame equations at the end of each cycle.\n * `should_simplify`: Whether to simplify equations. If you pass a custom objective, this will be set to `false`.\n * `should_optimize_constants`: Whether to use an optimization algorithm to periodically optimize constants in equations.\n * `optimizer_nrestarts`: How many different random starting positions to consider for optimization of constants.\n * `optimizer_algorithm`: Select algorithm to use for optimizing constants. 
Default is \"BFGS\", but \"NelderMead\" is also supported.\n * `optimizer_options`: General options for the constant optimization. For details we refer to the documentation on `Optim.Options` from the `Optim.jl` package. Options can be provided here as `NamedTuple`, e.g. `(iterations=16,)`, as a `Dict`, e.g. Dict(:x_tol => 1.0e-32,), or as an `Optim.Options` instance.\n * `output_file`: What file to store equations to, as a backup.\n * `perturbation_factor`: When mutating a constant, either multiply or divide by (1+perturbation_factor)^(rand()+1).\n * `probability_negate_constant`: Probability of negating a constant in the equation when mutating it.\n * `mutation_weights`: Relative probabilities of the mutations. The struct `MutationWeights` should be passed to these options. See its documentation on `MutationWeights` for the different weights.\n * `crossover_probability`: Probability of performing crossover.\n * `annealing`: Whether to use simulated annealing.\n * `warmup_maxsize_by`: Whether to slowly increase the max size from 5 up to `maxsize`. If nonzero, specifies the fraction through the search at which the maxsize should be reached.\n * `verbosity`: Whether to print debugging statements or not.\n * `print_precision`: How many digits to print when printing equations. By default, this is 5.\n * `save_to_file`: Whether to save equations to a file during the search.\n * `bin_constraints`: See `constraints`. This is the same, but specified for binary operators only (for example, if you have an operator that is both a binary and unary operator).\n * `una_constraints`: Likewise, for unary operators.\n * `seed`: What random seed to use. `nothing` uses no seed.\n * `progress`: Whether to use a progress bar output (`verbosity` will have no effect).\n * `early_stop_condition`: Float - whether to stop early if the mean loss gets below this value. Function - a function taking (loss, complexity) as arguments and returning true or false.\n * `timeout_in_seconds`: Float64 - the time in seconds after which to exit (as an alternative to the number of iterations).\n * `max_evals`: Int (or Nothing) - the maximum number of evaluations of expressions to perform.\n * `skip_mutation_failures`: Whether to simply skip over mutations that fail or are rejected, rather than to replace the mutated expression with the original expression and proceed normally.\n * `enable_autodiff`: Whether to enable automatic differentiation functionality. This is turned off by default. If turned on, this will be turned off if one of the operators does not have well-defined gradients.\n * `nested_constraints`: Specifies how many times a combination of operators can be nested. For example, `[sin => [cos => 0], cos => [cos => 2]]` specifies that `cos` may never appear within a `sin`, but `sin` can be nested with itself an unlimited number of times. The second term specifies that `cos` can be nested up to 2 times within a `cos`, so that `cos(cos(cos(x)))` is allowed (as well as any combination of `+` or `-` within it), but `cos(cos(cos(cos(x))))` is not allowed. When an operator is not specified, it is assumed that it can be nested an unlimited number of times. This requires that there is no operator which is used both in the unary operators and the binary operators (e.g., `-` could be both subtract, and negation). For binary operators, both arguments are treated the same way, and the max of each argument is constrained.\n * `deterministic`: Use a global counter for the birth time, rather than calls to `time()`. 
This gives perfect resolution, and is therefore deterministic. However, it is not thread safe, and must be used in serial mode.\n * `define_helper_functions`: Whether to define helper functions for constructing and evaluating trees.\n * `niterations::Int=10`: The number of iterations to perform the search. More iterations will improve the results.\n * `parallelism=:multithreading`: What parallelism mode to use. The options are `:multithreading`, `:multiprocessing`, and `:serial`. By default, multithreading will be used. Multithreading uses less memory, but multiprocessing can handle multi-node compute. If using `:multithreading` mode, the number of threads available to julia are used. If using `:multiprocessing`, `numprocs` processes will be created dynamically if `procs` is unset. If you have already allocated processes, pass them to the `procs` argument and they will be used. You may also pass a string instead of a symbol, like `\"multithreading\"`.\n * `numprocs::Union{Int, Nothing}=nothing`: The number of processes to use, if you want `equation_search` to set this up automatically. By default this will be `4`, but can be any number (you should pick a number <= the number of cores available).\n * `procs::Union{Vector{Int}, Nothing}=nothing`: If you have set up a distributed run manually with `procs = addprocs()` and `@everywhere`, pass the `procs` to this keyword argument.\n * `addprocs_function::Union{Function, Nothing}=nothing`: If using multiprocessing (`parallelism=:multithreading`), and are not passing `procs` manually, then they will be allocated dynamically using `addprocs`. However, you may also pass a custom function to use instead of `addprocs`. This function should take a single positional argument, which is the number of processes to use, as well as the `lazy` keyword argument. For example, if set up on a slurm cluster, you could pass `addprocs_function = addprocs_slurm`, which will set up slurm processes.\n * `heap_size_hint_in_bytes::Union{Int,Nothing}=nothing`: On Julia 1.9+, you may set the `--heap-size-hint` flag on Julia processes, recommending garbage collection once a process is close to the recommended size. This is important for long-running distributed jobs where each process has an independent memory, and can help avoid out-of-memory errors. By default, this is set to `Sys.free_memory() / numprocs`.\n * `runtests::Bool=true`: Whether to run (quick) tests before starting the search, to see if there will be any problems during the equation search related to the host environment.\n * `loss_type::Type=Nothing`: If you would like to use a different type for the loss than for the data you passed, specify the type here. Note that if you pass complex data `::Complex{L}`, then the loss type will automatically be set to `L`.\n * `selection_method::Function`: Function to selection expression from the Pareto frontier for use in `predict`. See `SymbolicRegression.MLJInterfaceModule.choose_best` for an example. This function should return a single integer specifying the index of the expression to use. By default, this maximizes the score (a pound-for-pound rating) of expressions reaching the threshold of 1.5x the minimum loss. To override this at prediction time, you can pass a named tuple with keys `data` and `idx` to `predict`. See the Operations section for details.\n * `dimensions_type::AbstractDimensions`: The type of dimensions to use when storing the units of the data. 
By default this is `DynamicQuantities.SymbolicDimensions`.\n\n# Operations\n\n * `predict(mach, Xnew)`: Return predictions of the target given features `Xnew`, which should have same scitype as `X` above. The expression used for prediction is defined by the `selection_method` function, which can be seen by viewing `report(mach).best_idx`.\n * `predict(mach, (data=Xnew, idx=i))`: Return predictions of the target given features `Xnew`, which should have same scitype as `X` above. By passing a named tuple with keys `data` and `idx`, you are able to specify the equation you wish to evaluate in `idx`.\n\n# Fitted parameters\n\nThe fields of `fitted_params(mach)` are:\n\n * `best_idx::Int`: The index of the best expression in the Pareto frontier, as determined by the `selection_method` function. Override in `predict` by passing a named tuple with keys `data` and `idx`.\n * `equations::Vector{Node{T}}`: The expressions discovered by the search, represented in a dominating Pareto frontier (i.e., the best expressions found for each complexity). `T` is equal to the element type of the passed data.\n * `equation_strings::Vector{String}`: The expressions discovered by the search, represented as strings for easy inspection.\n\n# Report\n\nThe fields of `report(mach)` are:\n\n * `best_idx::Int`: The index of the best expression in the Pareto frontier, as determined by the `selection_method` function. Override in `predict` by passing a named tuple with keys `data` and `idx`.\n * `equations::Vector{Node{T}}`: The expressions discovered by the search, represented in a dominating Pareto frontier (i.e., the best expressions found for each complexity).\n * `equation_strings::Vector{String}`: The expressions discovered by the search, represented as strings for easy inspection.\n * `complexities::Vector{Int}`: The complexity of each expression in the Pareto frontier.\n * `losses::Vector{L}`: The loss of each expression in the Pareto frontier, according to the loss function specified in the model. The type `L` is the loss type, which is usually the same as the element type of data passed (i.e., `T`), but can differ if complex data types are passed.\n * `scores::Vector{L}`: A metric which considers both the complexity and loss of an expression, equal to the change in the log-loss divided by the change in complexity, relative to the previous expression along the Pareto frontier. A larger score aims to indicate an expression is more likely to be the true expression generating the data, but this is very problem-dependent and generally several other factors should be considered.\n\n# Examples\n\n```julia\nusing MLJ\nSRRegressor = @load SRRegressor pkg=SymbolicRegression\nX, y = @load_boston\nmodel = SRRegressor(binary_operators=[+, -, *], unary_operators=[exp], niterations=100)\nmach = machine(model, X, y)\nfit!(mach)\ny_hat = predict(mach, X)\n# View the equation used:\nr = report(mach)\nprintln(\"Equation used:\", r.equation_strings[r.best_idx])\n```\n\nWith units and variable names:\n\n```julia\nusing MLJ\nusing DynamicQuantities\nSRegressor = @load SRRegressor pkg=SymbolicRegression\n\nX = (; x1=rand(32) .* us\"km/h\", x2=rand(32) .* us\"km\")\ny = @. 
X.x2 / X.x1 + 0.5us\"h\"\nmodel = SRRegressor(binary_operators=[+, -, *, /])\nmach = machine(model, X, y)\nfit!(mach)\ny_hat = predict(mach, X)\n# View the equation used:\nr = report(mach)\nprintln(\"Equation used:\", r.equation_strings[r.best_idx])\n```\n\nSee also [`MultitargetSRRegressor`](@ref).\n" +":docstring" = "```\nSRRegressor\n```\n\nA model type for constructing a Symbolic Regression via Evolutionary Search, based on [SymbolicRegression.jl](https://github.com/MilesCranmer/SymbolicRegression.jl), and implementing the MLJ model interface.\n\nFrom MLJ, the type can be imported using\n\n```\nSRRegressor = @load SRRegressor pkg=SymbolicRegression\n```\n\nDo `model = SRRegressor()` to construct an instance with default hyper-parameters. Provide keyword arguments to override hyper-parameter defaults, as in `SRRegressor(binary_operators=...)`.\n\nSingle-target Symbolic Regression regressor (`SRRegressor`) searches for symbolic expressions that predict a single target variable from a set of input variables. All data is assumed to be `Continuous`. The search is performed using an evolutionary algorithm. This algorithm is described in the paper https://arxiv.org/abs/2305.01582.\n\n# Training data\n\nIn MLJ or MLJBase, bind an instance `model` to data with\n\n```\nmach = machine(model, X, y)\n```\n\nOR\n\n```\nmach = machine(model, X, y, w)\n```\n\nHere:\n\n * `X` is any table of input features (eg, a `DataFrame`) whose columns are of scitype `Continuous`; check column scitypes with `schema(X)`. Variable names in discovered expressions will be taken from the column names of `X`, if available. Units in columns of `X` (use `DynamicQuantities` for units) will trigger dimensional analysis to be used.\n * `y` is the target, which can be any `AbstractVector` whose element scitype is `Continuous`; check the scitype with `scitype(y)`. Units in `y` (use `DynamicQuantities` for units) will trigger dimensional analysis to be used.\n * `w` is the observation weights which can either be `nothing` (default) or an `AbstractVector` whose element scitype is `Count` or `Continuous`.\n\nTrain the machine using `fit!(mach)`, inspect the discovered expressions with `report(mach)`, and predict on new data with `predict(mach, Xnew)`. Note that unlike other regressors, symbolic regression stores a list of trained models. The model chosen from this list is defined by the `selection_method` keyword argument, which by default balances accuracy and complexity. You can override this at prediction time by passing a named tuple with keys `data` and `idx`.\n\n# Hyper-parameters\n\n * `binary_operators`: Vector of binary operators (functions) to use. Each operator should be defined for two input scalars, and one output scalar. All operators need to be defined over the entire real line (excluding infinity - these are stopped before they are input), or return `NaN` where not defined. For speed, define it so it takes two reals of the same type as input, and outputs the same type. For the SymbolicUtils simplification backend, you will need to define a generic method of the operator so it takes arbitrary types.\n * `unary_operators`: Same, but for unary operators (one input scalar, gives an output scalar).\n * `constraints`: Array of pairs specifying size constraints for each operator. The constraints for a binary operator should be a 2-tuple (e.g., `(-1, -1)`) and the constraints for a unary operator should be an `Int`. A size constraint is a limit to the size of the subtree in each argument of an operator. 
e.g., `[(^)=>(-1, 3)]` means that the `^` operator can have arbitrary size (`-1`) in its left argument, but a maximum size of `3` in its right argument. Default is no constraints.\n * `batching`: Whether to evolve based on small mini-batches of data, rather than the entire dataset.\n * `batch_size`: What batch size to use if using batching.\n * `elementwise_loss`: What elementwise loss function to use. Can be one of the following losses, or any other loss of type `SupervisedLoss`. You can also pass a function that takes a scalar target (left argument), and scalar predicted (right argument), and returns a scalar. This will be averaged over the predicted data. If weights are supplied, your function should take a third argument for the weight scalar. Included losses: Regression: - `LPDistLoss{P}()`, - `L1DistLoss()`, - `L2DistLoss()` (mean square), - `LogitDistLoss()`, - `HuberLoss(d)`, - `L1EpsilonInsLoss(ϵ)`, - `L2EpsilonInsLoss(ϵ)`, - `PeriodicLoss(c)`, - `QuantileLoss(τ)`, Classification: - `ZeroOneLoss()`, - `PerceptronLoss()`, - `L1HingeLoss()`, - `SmoothedL1HingeLoss(γ)`, - `ModifiedHuberLoss()`, - `L2MarginLoss()`, - `ExpLoss()`, - `SigmoidLoss()`, - `DWDMarginLoss(q)`.\n * `loss_function`: Alternatively, you may redefine the loss used as any function of `tree::AbstractExpressionNode{T}`, `dataset::Dataset{T}`, and `options::Options`, so long as you output a non-negative scalar of type `T`. This is useful if you want to use a loss that takes into account derivatives, or correlations across the dataset. This also means you could use a custom evaluation for a particular expression. If you are using `batching=true`, then your function should accept a fourth argument `idx`, which is either `nothing` (indicating that the full dataset should be used), or a vector of indices to use for the batch. For example,\n\n ```\n function my_loss(tree, dataset::Dataset{T,L}, options)::L where {T,L}\n prediction, flag = eval_tree_array(tree, dataset.X, options)\n if !flag\n return L(Inf)\n end\n return sum((prediction .- dataset.y) .^ 2) / dataset.n\n end\n ```\n * `node_type::Type{N}=Node`: The type of node to use for the search. For example, `Node` or `GraphNode`.\n * `populations`: How many populations of equations to use.\n * `population_size`: How many equations in each population.\n * `ncycles_per_iteration`: How many generations to consider per iteration.\n * `tournament_selection_n`: Number of expressions considered in each tournament.\n * `tournament_selection_p`: The fittest expression in a tournament is to be selected with probability `p`, the next fittest with probability `p*(1-p)`, and so forth.\n * `topn`: Number of equations to return to the host process, and to consider for the hall of fame.\n * `complexity_of_operators`: What complexity should be assigned to each operator, and the occurrence of a constant or variable. By default, this is 1 for all operators. Can be a real number as well, in which case the complexity of an expression will be rounded to the nearest integer. Input this in the form of, e.g., [(^) => 3, sin => 2].\n * `complexity_of_constants`: What complexity should be assigned to use of a constant. By default, this is 1.\n * `complexity_of_variables`: What complexity should be assigned to use of a variable, which can also be a vector indicating different per-variable complexity. By default, this is 1.\n * `alpha`: The probability of accepting an equation mutation during regularized evolution is given by exp(-delta_loss/(alpha * T)), where T goes from 1 to 0. 
Thus, alpha=infinite is the same as no annealing.\n * `maxsize`: Maximum size of equations during the search.\n * `maxdepth`: Maximum depth of equations during the search, by default this is set equal to the maxsize.\n * `parsimony`: A multiplicative factor for how much complexity is punished.\n * `dimensional_constraint_penalty`: An additive factor if the dimensional constraint is violated.\n * `dimensionless_constants_only`: Whether to only allow dimensionless constants.\n * `use_frequency`: Whether to use a parsimony that adapts to the relative proportion of equations at each complexity; this will ensure that there are a balanced number of equations considered for every complexity.\n * `use_frequency_in_tournament`: Whether to use the adaptive parsimony described above inside the score, rather than just at the mutation accept/reject stage.\n * `adaptive_parsimony_scaling`: How much to scale the adaptive parsimony term in the loss. Increase this if the search is spending too much time optimizing the most complex equations.\n * `turbo`: Whether to use `LoopVectorization.@turbo` to evaluate expressions. This can be significantly faster, but is only compatible with certain operators. *Experimental!*\n * `bumper`: Whether to use Bumper.jl for faster evaluation. *Experimental!*\n * `migration`: Whether to migrate equations between processes.\n * `hof_migration`: Whether to migrate equations from the hall of fame to processes.\n * `fraction_replaced`: What fraction of each population to replace with migrated equations at the end of each cycle.\n * `fraction_replaced_hof`: What fraction to replace with hall of fame equations at the end of each cycle.\n * `should_simplify`: Whether to simplify equations. If you pass a custom objective, this will be set to `false`.\n * `should_optimize_constants`: Whether to use an optimization algorithm to periodically optimize constants in equations.\n * `optimizer_algorithm`: Select algorithm to use for optimizing constants. Default is `Optim.BFGS(linesearch=LineSearches.BackTracking())`.\n * `optimizer_nrestarts`: How many different random starting positions to consider for optimization of constants.\n * `optimizer_probability`: Probability of performing optimization of constants at the end of a given iteration.\n * `optimizer_iterations`: How many optimization iterations to perform. This gets passed to `Optim.Options` as `iterations`. The default is 8.\n * `optimizer_f_calls_limit`: How many function calls to allow during optimization. This gets passed to `Optim.Options` as `f_calls_limit`. The default is `0` which means no limit.\n * `optimizer_options`: General options for the constant optimization. For details we refer to the documentation on `Optim.Options` from the `Optim.jl` package. Options can be provided here as `NamedTuple`, e.g. `(iterations=16,)`, as a `Dict`, e.g. Dict(:x_tol => 1.0e-32,), or as an `Optim.Options` instance.\n * `output_file`: What file to store equations to, as a backup.\n * `perturbation_factor`: When mutating a constant, either multiply or divide by (1+perturbation_factor)^(rand()+1).\n * `probability_negate_constant`: Probability of negating a constant in the equation when mutating it.\n * `mutation_weights`: Relative probabilities of the mutations. The struct `MutationWeights` should be passed to these options. 
See its documentation on `MutationWeights` for the different weights.\n * `crossover_probability`: Probability of performing crossover.\n * `annealing`: Whether to use simulated annealing.\n * `warmup_maxsize_by`: Whether to slowly increase the max size from 5 up to `maxsize`. If nonzero, specifies the fraction through the search at which the maxsize should be reached.\n * `verbosity`: Whether to print debugging statements or not.\n * `print_precision`: How many digits to print when printing equations. By default, this is 5.\n * `save_to_file`: Whether to save equations to a file during the search.\n * `bin_constraints`: See `constraints`. This is the same, but specified for binary operators only (for example, if you have an operator that is both a binary and unary operator).\n * `una_constraints`: Likewise, for unary operators.\n * `seed`: What random seed to use. `nothing` uses no seed.\n * `progress`: Whether to use a progress bar output (`verbosity` will have no effect).\n * `early_stop_condition`: Float - whether to stop early if the mean loss gets below this value. Function - a function taking (loss, complexity) as arguments and returning true or false.\n * `timeout_in_seconds`: Float64 - the time in seconds after which to exit (as an alternative to the number of iterations).\n * `max_evals`: Int (or Nothing) - the maximum number of evaluations of expressions to perform.\n * `skip_mutation_failures`: Whether to simply skip over mutations that fail or are rejected, rather than to replace the mutated expression with the original expression and proceed normally.\n * `nested_constraints`: Specifies how many times a combination of operators can be nested. For example, `[sin => [cos => 0], cos => [cos => 2]]` specifies that `cos` may never appear within a `sin`, but `sin` can be nested with itself an unlimited number of times. The second term specifies that `cos` can be nested up to 2 times within a `cos`, so that `cos(cos(cos(x)))` is allowed (as well as any combination of `+` or `-` within it), but `cos(cos(cos(cos(x))))` is not allowed. When an operator is not specified, it is assumed that it can be nested an unlimited number of times. This requires that there is no operator which is used both in the unary operators and the binary operators (e.g., `-` could be both subtract, and negation). For binary operators, both arguments are treated the same way, and the max of each argument is constrained.\n * `deterministic`: Use a global counter for the birth time, rather than calls to `time()`. This gives perfect resolution, and is therefore deterministic. However, it is not thread safe, and must be used in serial mode.\n * `define_helper_functions`: Whether to define helper functions for constructing and evaluating trees.\n * `niterations::Int=10`: The number of iterations to perform the search. More iterations will improve the results.\n * `parallelism=:multithreading`: What parallelism mode to use. The options are `:multithreading`, `:multiprocessing`, and `:serial`. By default, multithreading will be used. Multithreading uses less memory, but multiprocessing can handle multi-node compute. If using `:multithreading` mode, all threads available to Julia are used. If using `:multiprocessing`, `numprocs` processes will be created dynamically if `procs` is unset. If you have already allocated processes, pass them to the `procs` argument and they will be used. 
You may also pass a string instead of a symbol, like `\"multithreading\"`.\n * `numprocs::Union{Int, Nothing}=nothing`: The number of processes to use, if you want `equation_search` to set this up automatically. By default this will be `4`, but can be any number (you should pick a number <= the number of cores available).\n * `procs::Union{Vector{Int}, Nothing}=nothing`: If you have set up a distributed run manually with `procs = addprocs()` and `@everywhere`, pass the `procs` to this keyword argument.\n * `addprocs_function::Union{Function, Nothing}=nothing`: If using multiprocessing (`parallelism=:multiprocessing`), and you are not passing `procs` manually, then processes will be allocated dynamically using `addprocs`. However, you may also pass a custom function to use instead of `addprocs`. This function should take a single positional argument, which is the number of processes to use, as well as the `lazy` keyword argument. For example, if set up on a slurm cluster, you could pass `addprocs_function = addprocs_slurm`, which will set up slurm processes.\n * `heap_size_hint_in_bytes::Union{Int,Nothing}=nothing`: On Julia 1.9+, you may set the `--heap-size-hint` flag on Julia processes, recommending garbage collection once a process is close to the recommended size. This is important for long-running distributed jobs where each process has an independent memory, and can help avoid out-of-memory errors. By default, this is set to `Sys.free_memory() / numprocs`.\n * `runtests::Bool=true`: Whether to run (quick) tests before starting the search, to see if there will be any problems during the equation search related to the host environment.\n * `loss_type::Type=Nothing`: If you would like to use a different type for the loss than for the data you passed, specify the type here. Note that if you pass complex data `::Complex{L}`, then the loss type will automatically be set to `L`.\n * `selection_method::Function`: Function to select an expression from the Pareto frontier for use in `predict`. See `SymbolicRegression.MLJInterfaceModule.choose_best` for an example. This function should return a single integer specifying the index of the expression to use. By default, this maximizes the score (a pound-for-pound rating) of expressions reaching the threshold of 1.5x the minimum loss. To override this at prediction time, you can pass a named tuple with keys `data` and `idx` to `predict`. See the Operations section for details.\n * `dimensions_type::AbstractDimensions`: The type of dimensions to use when storing the units of the data. By default this is `DynamicQuantities.SymbolicDimensions`.\n\n# Operations\n\n * `predict(mach, Xnew)`: Return predictions of the target given features `Xnew`, which should have the same scitype as `X` above. The expression used for prediction is defined by the `selection_method` function, which can be seen by viewing `report(mach).best_idx`.\n * `predict(mach, (data=Xnew, idx=i))`: Return predictions of the target given features `Xnew`, which should have the same scitype as `X` above. By passing a named tuple with keys `data` and `idx`, you are able to specify the equation you wish to evaluate in `idx`.\n\n# Fitted parameters\n\nThe fields of `fitted_params(mach)` are:\n\n * `best_idx::Int`: The index of the best expression in the Pareto frontier, as determined by the `selection_method` function. 
Override in `predict` by passing a named tuple with keys `data` and `idx`.\n * `equations::Vector{Node{T}}`: The expressions discovered by the search, represented in a dominating Pareto frontier (i.e., the best expressions found for each complexity). `T` is equal to the element type of the passed data.\n * `equation_strings::Vector{String}`: The expressions discovered by the search, represented as strings for easy inspection.\n\n# Report\n\nThe fields of `report(mach)` are:\n\n * `best_idx::Int`: The index of the best expression in the Pareto frontier, as determined by the `selection_method` function. Override in `predict` by passing a named tuple with keys `data` and `idx`.\n * `equations::Vector{Node{T}}`: The expressions discovered by the search, represented in a dominating Pareto frontier (i.e., the best expressions found for each complexity).\n * `equation_strings::Vector{String}`: The expressions discovered by the search, represented as strings for easy inspection.\n * `complexities::Vector{Int}`: The complexity of each expression in the Pareto frontier.\n * `losses::Vector{L}`: The loss of each expression in the Pareto frontier, according to the loss function specified in the model. The type `L` is the loss type, which is usually the same as the element type of data passed (i.e., `T`), but can differ if complex data types are passed.\n * `scores::Vector{L}`: A metric which considers both the complexity and loss of an expression, equal to the change in the log-loss divided by the change in complexity, relative to the previous expression along the Pareto frontier. A larger score aims to indicate an expression is more likely to be the true expression generating the data, but this is very problem-dependent and generally several other factors should be considered.\n\n# Examples\n\n```julia\nusing MLJ\nSRRegressor = @load SRRegressor pkg=SymbolicRegression\nX, y = @load_boston\nmodel = SRRegressor(binary_operators=[+, -, *], unary_operators=[exp], niterations=100)\nmach = machine(model, X, y)\nfit!(mach)\ny_hat = predict(mach, X)\n# View the equation used:\nr = report(mach)\nprintln(\"Equation used:\", r.equation_strings[r.best_idx])\n```\n\nWith units and variable names:\n\n```julia\nusing MLJ\nusing DynamicQuantities\nSRRegressor = @load SRRegressor pkg=SymbolicRegression\n\nX = (; x1=rand(32) .* us\"km/h\", x2=rand(32) .* us\"km\")\ny = @. 
X.x2 / X.x1 + 0.5us\"h\"\nmodel = SRRegressor(binary_operators=[+, -, *, /])\nmach = machine(model, X, y)\nfit!(mach)\ny_hat = predict(mach, X)\n# View the equation used:\nr = report(mach)\nprintln(\"Equation used:\", r.equation_strings[r.best_idx])\n```\n\nSee also [`MultitargetSRRegressor`](@ref).\n" ":name" = "SRRegressor" ":human_name" = "Symbolic Regression via Evolutionary Search" ":is_supervised" = "`true`" ":prediction_type" = ":deterministic" ":abstract_type" = "`MLJModelInterface.Deterministic`" ":implemented_methods" = [] -":hyperparameters" = "`(:binary_operators, :unary_operators, :constraints, :elementwise_loss, :loss_function, :tournament_selection_n, :tournament_selection_p, :topn, :complexity_of_operators, :complexity_of_constants, :complexity_of_variables, :parsimony, :dimensional_constraint_penalty, :alpha, :maxsize, :maxdepth, :turbo, :migration, :hof_migration, :should_simplify, :should_optimize_constants, :output_file, :populations, :perturbation_factor, :annealing, :batching, :batch_size, :mutation_weights, :crossover_probability, :warmup_maxsize_by, :use_frequency, :use_frequency_in_tournament, :adaptive_parsimony_scaling, :population_size, :ncycles_per_iteration, :fraction_replaced, :fraction_replaced_hof, :verbosity, :print_precision, :save_to_file, :probability_negate_constant, :seed, :bin_constraints, :una_constraints, :progress, :terminal_width, :optimizer_algorithm, :optimizer_nrestarts, :optimizer_probability, :optimizer_iterations, :optimizer_options, :val_recorder, :recorder_file, :early_stop_condition, :timeout_in_seconds, :max_evals, :skip_mutation_failures, :enable_autodiff, :nested_constraints, :deterministic, :define_helper_functions, :fast_cycle, :npopulations, :npop, :niterations, :parallelism, :numprocs, :procs, :addprocs_function, :heap_size_hint_in_bytes, :runtests, :loss_type, :selection_method, :dimensions_type)`" -":hyperparameter_types" = "`(\"Any\", \"Any\", \"Any\", \"Union{Nothing, Function, LossFunctions.Traits.SupervisedLoss}\", \"Union{Nothing, Function}\", \"Integer\", \"Real\", \"Integer\", \"Any\", \"Union{Nothing, Real}\", \"Union{Nothing, Real}\", \"Real\", \"Union{Nothing, Real}\", \"Real\", \"Integer\", \"Union{Nothing, Integer}\", \"Bool\", \"Bool\", \"Bool\", \"Union{Nothing, Bool}\", \"Bool\", \"Union{Nothing, AbstractString}\", \"Integer\", \"Real\", \"Bool\", \"Bool\", \"Integer\", \"Union{SymbolicRegression.CoreModule.OptionsStructModule.MutationWeights, NamedTuple, AbstractVector}\", \"Real\", \"Real\", \"Bool\", \"Bool\", \"Real\", \"Integer\", \"Integer\", \"Real\", \"Real\", \"Union{Nothing, Integer}\", \"Integer\", \"Bool\", \"Real\", \"Any\", \"Any\", \"Any\", \"Union{Nothing, Bool}\", \"Union{Nothing, Integer}\", \"AbstractString\", \"Integer\", \"Real\", \"Union{Nothing, Integer}\", \"Union{Nothing, Dict, NamedTuple, Optim.Options}\", \"Val\", \"AbstractString\", \"Union{Nothing, Function, Real}\", \"Union{Nothing, Real}\", \"Union{Nothing, Integer}\", \"Bool\", \"Bool\", \"Any\", \"Bool\", \"Bool\", \"Bool\", \"Union{Nothing, Integer}\", \"Union{Nothing, Integer}\", \"Int64\", \"Symbol\", \"Union{Nothing, Int64}\", \"Union{Nothing, Vector{Int64}}\", \"Union{Nothing, Function}\", \"Union{Nothing, Integer}\", \"Bool\", \"Any\", \"Function\", \"Type{D} where D<:DynamicQuantities.AbstractDimensions\")`" -":hyperparameter_ranges" = "`(nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, 
nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing)`" +":hyperparameters" = "`(:binary_operators, :unary_operators, :constraints, :elementwise_loss, :loss_function, :tournament_selection_n, :tournament_selection_p, :topn, :complexity_of_operators, :complexity_of_constants, :complexity_of_variables, :parsimony, :dimensional_constraint_penalty, :dimensionless_constants_only, :alpha, :maxsize, :maxdepth, :turbo, :bumper, :migration, :hof_migration, :should_simplify, :should_optimize_constants, :output_file, :node_type, :populations, :perturbation_factor, :annealing, :batching, :batch_size, :mutation_weights, :crossover_probability, :warmup_maxsize_by, :use_frequency, :use_frequency_in_tournament, :adaptive_parsimony_scaling, :population_size, :ncycles_per_iteration, :fraction_replaced, :fraction_replaced_hof, :verbosity, :print_precision, :save_to_file, :probability_negate_constant, :seed, :bin_constraints, :una_constraints, :progress, :terminal_width, :optimizer_algorithm, :optimizer_nrestarts, :optimizer_probability, :optimizer_iterations, :optimizer_f_calls_limit, :optimizer_options, :use_recorder, :recorder_file, :early_stop_condition, :timeout_in_seconds, :max_evals, :skip_mutation_failures, :nested_constraints, :deterministic, :define_helper_functions, :fast_cycle, :npopulations, :npop, :niterations, :parallelism, :numprocs, :procs, :addprocs_function, :heap_size_hint_in_bytes, :runtests, :loss_type, :selection_method, :dimensions_type)`" +":hyperparameter_types" = "`(\"Any\", \"Any\", \"Any\", \"Union{Nothing, Function, LossFunctions.Traits.SupervisedLoss}\", \"Union{Nothing, Function}\", \"Integer\", \"Real\", \"Integer\", \"Any\", \"Union{Nothing, Real}\", \"Union{Nothing, Real, AbstractVector}\", \"Real\", \"Union{Nothing, Real}\", \"Bool\", \"Real\", \"Integer\", \"Union{Nothing, Integer}\", \"Bool\", \"Bool\", \"Bool\", \"Bool\", \"Union{Nothing, Bool}\", \"Bool\", \"Union{Nothing, AbstractString}\", \"Type\", \"Integer\", \"Real\", \"Bool\", \"Bool\", \"Integer\", \"Union{SymbolicRegression.CoreModule.MutationWeightsModule.MutationWeights, NamedTuple, AbstractVector}\", \"Real\", \"Real\", \"Bool\", \"Bool\", \"Real\", \"Integer\", \"Integer\", \"Real\", \"Real\", \"Union{Nothing, Integer}\", \"Integer\", \"Bool\", \"Real\", \"Any\", \"Any\", \"Any\", \"Union{Nothing, Bool}\", \"Union{Nothing, Integer}\", \"Union{AbstractString, Optim.AbstractOptimizer}\", \"Integer\", \"Real\", \"Union{Nothing, Integer}\", \"Union{Nothing, Integer}\", \"Union{Nothing, Dict, NamedTuple, Optim.Options}\", \"Bool\", \"AbstractString\", \"Union{Nothing, Function, Real}\", \"Union{Nothing, Real}\", \"Union{Nothing, Integer}\", \"Bool\", \"Any\", \"Bool\", \"Bool\", \"Bool\", \"Union{Nothing, Integer}\", \"Union{Nothing, Integer}\", \"Int64\", \"Symbol\", \"Union{Nothing, Int64}\", \"Union{Nothing, Vector{Int64}}\", \"Union{Nothing, Function}\", \"Union{Nothing, Integer}\", \"Bool\", \"Any\", \"Function\", \"Type{D} where D<:DynamicQuantities.AbstractDimensions\")`" +":hyperparameter_ranges" = "`(nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, 
nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing)`" ":iteration_parameter" = "`nothing`" ":supports_training_losses" = "`false`" ":reports_feature_importances" = "`false`" @@ -6342,6 +6523,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "EvoTrees" ":package_license" = "Apache" @@ -6377,6 +6559,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "EvoTrees" ":package_license" = "Apache" @@ -6412,6 +6595,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "EvoTrees" ":package_license" = "Apache" @@ -6447,6 +6631,7 @@ ":predict_scitype" = "`AbstractVector{<:ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "EvoTrees" ":package_license" = "Apache" @@ -6482,6 +6667,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Count}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "EvoTrees" ":package_license" = "Apache" @@ -6517,6 +6703,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "MLJModels" ":package_license" = "MIT" @@ -6552,6 +6739,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Union{ScientificTypesBase.Table, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`Union{ScientificTypesBase.Table, AbstractVector{<:ScientificTypesBase.Continuous}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "MLJModels" ":package_license" = "MIT" @@ -6587,6 +6775,7 @@ ":predict_scitype" = "`AbstractVector{<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" 
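(Editorial aside on the change this hunk repeats for every model: the `:target_in_fit` entries record a new trait stating whether the target `y` is presented to the model's `fit` method. A minimal sketch of how a registry consumer might read it, assuming MLJModels 0.17.3 and that the trait is surfaced by `info` like the existing traits; the property name is assumed to mirror the TOML key above.)

```julia
using MLJModels

# Registry lookup; does not require loading the model-providing package:
meta = info("EvoTreeClassifier", pkg="EvoTrees")

meta.target_in_fit   # assumed property, mirroring the ":target_in_fit" key above
meta.is_pure_julia   # existing traits are accessed the same way
```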
+":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "MLJModels" ":package_license" = "MIT" @@ -6622,6 +6811,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":inverse_transform_scitype" = "`AbstractVector{<:ScientificTypesBase.ScientificTimeType}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "MLJModels" ":package_license" = "MIT" @@ -6657,6 +6847,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Table`" ":inverse_transform_scitype" = "`ScientificTypesBase.Table`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "MLJModels" ":package_license" = "MIT" @@ -6692,6 +6883,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Table`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "MLJModels" ":package_license" = "MIT" @@ -6727,6 +6919,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":inverse_transform_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "MLJModels" ":package_license" = "MIT" @@ -6762,6 +6955,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Table`" ":inverse_transform_scitype" = "`Tuple{ScientificTypesBase.Table}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "MLJModels" ":package_license" = "MIT" @@ -6797,6 +6991,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{ScientificTypesBase.Continuous}}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "MLJModels" ":package_license" = "MIT" @@ -6832,6 +7027,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`AbstractVector{<:ScientificTypesBase.OrderedFactor}`" ":inverse_transform_scitype" = "`AbstractVector{<:ScientificTypesBase.Continuous}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "MLJModels" ":package_license" = "MIT" @@ -6867,6 +7063,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJModels" ":package_license" = "unknown" @@ -6902,6 +7099,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Table`" ":inverse_transform_scitype" = "`ScientificTypesBase.Table`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "MLJModels" ":package_license" = "MIT" @@ -6937,6 +7135,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "MLJModels" ":package_license" = "MIT" @@ -6972,6 +7171,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = 
"`AbstractVector{ScientificTypesBase.Continuous}`" ":inverse_transform_scitype" = "`AbstractVector{<:ScientificTypesBase.Infinite}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "MLJModels" ":package_license" = "MIT" @@ -7007,6 +7207,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Union{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Count}, AbstractVector{<:ScientificTypesBase.Finite}}`" ":inverse_transform_scitype" = "`Union{AbstractVector{<:Union{Missing, ScientificTypesBase.Continuous}}, AbstractVector{<:Union{Missing, ScientificTypesBase.Count}}, AbstractVector{<:Union{Missing, ScientificTypesBase.Finite}}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "MLJModels" ":package_license" = "MIT" @@ -7042,6 +7243,7 @@ ":predict_scitype" = "`AbstractVector{<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "OneRule" ":package_license" = "MIT" @@ -7077,6 +7279,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "OutlierDetectionPython" ":package_license" = "MIT" @@ -7112,6 +7315,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "OutlierDetectionPython" ":package_license" = "MIT" @@ -7147,6 +7351,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "OutlierDetectionPython" ":package_license" = "MIT" @@ -7182,6 +7387,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "OutlierDetectionPython" ":package_license" = "MIT" @@ -7217,6 +7423,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "OutlierDetectionPython" ":package_license" = "MIT" @@ -7252,6 +7459,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "OutlierDetectionPython" 
":package_license" = "MIT" @@ -7287,6 +7495,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "OutlierDetectionPython" ":package_license" = "MIT" @@ -7322,6 +7531,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "OutlierDetectionPython" ":package_license" = "MIT" @@ -7357,6 +7567,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "OutlierDetectionPython" ":package_license" = "MIT" @@ -7392,6 +7603,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "OutlierDetectionPython" ":package_license" = "MIT" @@ -7427,6 +7639,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "OutlierDetectionPython" ":package_license" = "MIT" @@ -7462,6 +7675,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "OutlierDetectionPython" ":package_license" = "MIT" @@ -7497,6 +7711,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "OutlierDetectionPython" ":package_license" = "MIT" @@ -7532,6 +7747,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "OutlierDetectionPython" ":package_license" = "MIT" @@ -7567,6 +7783,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = 
"`false`" ":package_name" = "OutlierDetectionPython" ":package_license" = "MIT" @@ -7602,6 +7819,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "OutlierDetectionPython" ":package_license" = "MIT" @@ -7637,6 +7855,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "OutlierDetectionPython" ":package_license" = "MIT" @@ -7672,6 +7891,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "OutlierDetectionPython" ":package_license" = "MIT" @@ -7707,6 +7927,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "OutlierDetectionPython" ":package_license" = "MIT" @@ -7742,6 +7963,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "OutlierDetectionPython" ":package_license" = "MIT" @@ -7777,6 +7999,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "OutlierDetectionPython" ":package_license" = "MIT" @@ -7812,6 +8035,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "OutlierDetectionPython" ":package_license" = "MIT" @@ -7847,6 +8071,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`AbstractMatrix{ScientificTypesBase.Continuous}`" ":inverse_transform_scitype" = "`Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}, AbstractMatrix{ScientificTypesBase.Continuous}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "SelfOrganizingMaps" ":package_license" = "MIT" @@ -7882,6 +8107,7 @@ ":predict_scitype" = "`AbstractVector{<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = 
"`true`" ":is_pure_julia" = "`false`" ":package_name" = "LIBSVM" ":package_license" = "unknown" @@ -7917,6 +8143,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "LIBSVM" ":package_license" = "unknown" @@ -7952,6 +8179,7 @@ ":predict_scitype" = "`AbstractVector{<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "LIBSVM" ":package_license" = "unknown" @@ -7987,6 +8215,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "LIBSVM" ":package_license" = "unknown" @@ -8022,6 +8251,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "LIBSVM" ":package_license" = "unknown" @@ -8057,6 +8287,7 @@ ":predict_scitype" = "`AbstractVector{<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "LIBSVM" ":package_license" = "unknown" @@ -8092,6 +8323,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "LIBSVM" ":package_license" = "unknown" @@ -8127,6 +8359,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Tuple{AbstractVector{<:ScientificTypesBase.Continuous}, AbstractVector{<:ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`false`" ":package_name" = "LIBSVM" ":package_license" = "unknown" @@ -8162,6 +8395,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}, AbstractMatrix{ScientificTypesBase.Continuous}}`" ":inverse_transform_scitype" = "`Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}, AbstractMatrix{ScientificTypesBase.Continuous}}`" +":target_in_fit" = "`false`" ":is_pure_julia" = "`true`" ":package_name" = "TSVD" ":package_license" = "MIT" @@ -8197,6 +8431,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "GLM" ":package_license" = "MIT" @@ -8232,6 +8467,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{ScientificTypesBase.Count}}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = 
"`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "GLM" ":package_license" = "MIT" @@ -8267,6 +8503,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{ScientificTypesBase.Continuous}}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "GLM" ":package_license" = "MIT" @@ -8302,6 +8539,7 @@ ":predict_scitype" = "`Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}, AbstractMatrix{ScientificTypesBase.Continuous}}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "MLJFlux" ":package_license" = "MIT" @@ -8312,7 +8550,7 @@ ":supports_weights" = "`false`" ":supports_class_weights" = "`false`" ":supports_online" = "`false`" -":docstring" = "```\nMultitargetNeuralNetworkRegressor\n```\n\nA model type for constructing a multitarget neural network regressor, based on [MLJFlux.jl](https://github.com/alan-turing-institute/MLJFlux.jl), and implementing the MLJ model interface.\n\nFrom MLJ, the type can be imported using\n\n```\nMultitargetNeuralNetworkRegressor = @load MultitargetNeuralNetworkRegressor pkg=MLJFlux\n```\n\nDo `model = MultitargetNeuralNetworkRegressor()` to construct an instance with default hyper-parameters. Provide keyword arguments to override hyper-parameter defaults, as in `MultitargetNeuralNetworkRegressor(builder=...)`.\n\n`MultitargetNeuralNetworkRegressor` is for training a data-dependent Flux.jl neural network to predict a multi-valued `Continuous` target, represented as a table, given a table of `Continuous` features. Users provide a recipe for constructing the network, based on properties of the data that is encountered, by specifying an appropriate `builder`. See MLJFlux documentation for more on builders.\n\n# Training data\n\nIn MLJ or MLJBase, bind an instance `model` to data with\n\n```\nmach = machine(model, X, y)\n```\n\nHere:\n\n * `X` is either a `Matrix` or any table of input features (eg, a `DataFrame`) whose columns are of scitype `Continuous`; check column scitypes with `schema(X)`. If `X` is a `Matrix`, it is assumed to have columns corresponding to features and rows corresponding to observations.\n * `y` is the target, which can be any table or matrix of output targets whose element scitype is `Continuous`; check column scitypes with `schema(y)`. If `y` is a `Matrix`, it is assumed to have columns corresponding to variables and rows corresponding to observations.\n\n# Hyper-parameters\n\n * `builder=MLJFlux.Linear(σ=Flux.relu)`: An MLJFlux builder that constructs a neural network. Possible `builders` include: `Linear`, `Short`, and `MLP`. See MLJFlux documentation for more on builders, and the example below for using the `@builder` convenience macro.\n * `optimiser::Flux.Adam()`: A `Flux.Optimise` optimiser. The optimiser performs the updating of the weights of the network. For further reference, see [the Flux optimiser documentation](https://fluxml.ai/Flux.jl/stable/training/optimisers/). To choose a learning rate (the update rate of the optimizer), a good rule of thumb is to start out at `10e-3`, and tune using powers of 10 between `1` and `1e-7`.\n * `loss=Flux.mse`: The loss function which the network will optimize. 
Should be a function which can be called in the form `loss(yhat, y)`. Possible loss functions are listed in [the Flux loss function documentation](https://fluxml.ai/Flux.jl/stable/models/losses/). For a regression task, natural loss functions are:\n\n * `Flux.mse`\n * `Flux.mae`\n * `Flux.msle`\n * `Flux.huber_loss`\n\n Currently MLJ measures are not supported as loss functions here.\n * `epochs::Int=10`: The duration of training, in epochs. Typically, one epoch represents one pass through the complete the training dataset.\n * `batch_size::int=1`: the batch size to be used for training, representing the number of samples per update of the network weights. Typically, batch size is between 8 and\n\n 512. Increassing batch size may accelerate training if `acceleration=CUDALibs()` and a\n\n GPU is available.\n * `lambda::Float64=0`: The strength of the weight regularization penalty. Can be any value in the range `[0, ∞)`.\n * `alpha::Float64=0`: The L2/L1 mix of regularization, in the range `[0, 1]`. A value of 0 represents L2 regularization, and a value of 1 represents L1 regularization.\n * `rng::Union{AbstractRNG, Int64}`: The random number generator or seed used during training.\n * `optimizer_changes_trigger_retraining::Bool=false`: Defines what happens when re-fitting a machine if the associated optimiser has changed. If `true`, the associated machine will retrain from scratch on `fit!` call, otherwise it will not.\n * `acceleration::AbstractResource=CPU1()`: Defines on what hardware training is done. For Training on GPU, use `CUDALibs()`.\n\n# Operations\n\n * `predict(mach, Xnew)`: return predictions of the target given new features `Xnew` having the same scitype as `X` above. Predictions are deterministic.\n\n# Fitted parameters\n\nThe fields of `fitted_params(mach)` are:\n\n * `chain`: The trained \"chain\" (Flux.jl model), namely the series of layers, functions, and activations which make up the neural network.\n\n# Report\n\nThe fields of `report(mach)` are:\n\n * `training_losses`: A vector of training losses (penalised if `lambda != 0`) in historical order, of length `epochs + 1`. The first element is the pre-training loss.\n\n# Examples\n\nIn this example we apply a multi-target regression model to synthetic data:\n\n```julia\nusing MLJ\nimport MLJFlux\nusing Flux\n```\n\nFirst, we generate some synthetic data (needs MLJBase 0.20.16 or higher):\n\n```julia\nX, y = make_regression(100, 9; n_targets = 2) # both tables\nschema(y)\nschema(X)\n```\n\nSplitting off a test set:\n\n```julia\n(X, Xtest), (y, ytest) = partition((X, y), 0.7, multi=true);\n```\n\nNext, we can define a `builder`, making use of a convenience macro to do so. 
In the following `@builder` call, `n_in` is a proxy for the number input features and `n_out` the number of target variables (both known at `fit!` time), while `rng` is a proxy for a RNG (which will be passed from the `rng` field of `model` defined below).\n\n```julia\nbuilder = MLJFlux.@builder begin\n init=Flux.glorot_uniform(rng)\n Chain(\n Dense(n_in, 64, relu, init=init),\n Dense(64, 32, relu, init=init),\n Dense(32, n_out, init=init),\n )\nend\n```\n\nInstantiating the regression model:\n\n```julia\nMultitargetNeuralNetworkRegressor = @load MultitargetNeuralNetworkRegressor\nmodel = MultitargetNeuralNetworkRegressor(builder=builder, rng=123, epochs=20)\n```\n\nWe will arrange for standardization of the the target by wrapping our model in `TransformedTargetModel`, and standardization of the features by inserting the wrapped model in a pipeline:\n\n```julia\npipe = Standardizer |> TransformedTargetModel(model, target=Standardizer)\n```\n\nIf we fit with a high verbosity (>1), we will see the losses during training. We can also see the losses in the output of `report(mach)`\n\n```julia\nmach = machine(pipe, X, y)\nfit!(mach, verbosity=2)\n\n# first element initial loss, 2:end per epoch training losses\nreport(mach).transformed_target_model_deterministic.model.training_losses\n```\n\nFor experimenting with learning rate, see the [`NeuralNetworkRegressor`](@ref) example.\n\n```\npipe.transformed_target_model_deterministic.model.optimiser.eta = 0.0001\n```\n\nWith the learning rate fixed, we can now compute a CV estimate of the performance (using all data bound to `mach`) and compare this with performance on the test set:\n\n```julia\n# custom MLJ loss:\nmulti_loss(yhat, y) = l2(MLJ.matrix(yhat), MLJ.matrix(y)) |> mean\n\n# CV estimate, based on `(X, y)`:\nevaluate!(mach, resampling=CV(nfolds=5), measure=multi_loss)\n\n# loss for `(Xtest, test)`:\nfit!(mach) # trains on all data `(X, y)`\nyhat = predict(mach, Xtest)\nmulti_loss(yhat, ytest)\n```\n\nSee also [`NeuralNetworkRegressor`](@ref)\n" +":docstring" = "```\nMultitargetNeuralNetworkRegressor\n```\n\nA model type for constructing a multitarget neural network regressor, based on [MLJFlux.jl](https://github.com/alan-turing-institute/MLJFlux.jl), and implementing the MLJ model interface.\n\nFrom MLJ, the type can be imported using\n\n```\nMultitargetNeuralNetworkRegressor = @load MultitargetNeuralNetworkRegressor pkg=MLJFlux\n```\n\nDo `model = MultitargetNeuralNetworkRegressor()` to construct an instance with default hyper-parameters. Provide keyword arguments to override hyper-parameter defaults, as in `MultitargetNeuralNetworkRegressor(builder=...)`.\n\n`MultitargetNeuralNetworkRegressor` is for training a data-dependent Flux.jl neural network to predict a multi-valued `Continuous` target, represented as a table, given a table of `Continuous` features. Users provide a recipe for constructing the network, based on properties of the data that is encountered, by specifying an appropriate `builder`. See MLJFlux documentation for more on builders.\n\n# Training data\n\nIn MLJ or MLJBase, bind an instance `model` to data with\n\n```\nmach = machine(model, X, y)\n```\n\nHere:\n\n * `X` is either a `Matrix` or any table of input features (eg, a `DataFrame`) whose columns are of scitype `Continuous`; check column scitypes with `schema(X)`. 
If `X` is a `Matrix`, it is assumed to have columns corresponding to features and rows corresponding to observations.\n * `y` is the target, which can be any table or matrix of output targets whose element scitype is `Continuous`; check column scitypes with `schema(y)`. If `y` is a `Matrix`, it is assumed to have columns corresponding to variables and rows corresponding to observations.\n\n# Hyper-parameters\n\n * `builder=MLJFlux.Linear(σ=Flux.relu)`: An MLJFlux builder that constructs a neural network. Possible `builders` include: `Linear`, `Short`, and `MLP`. See MLJFlux documentation for more on builders, and the example below for using the `@builder` convenience macro.\n * `optimiser=Optimisers.Adam()`: An Optimisers.jl optimiser. The optimiser performs the updating of the weights of the network. To choose a learning rate (the update rate of the optimizer), a good rule of thumb is to start out at `10e-3`, and tune using powers of `10` between `1` and `1e-7`.\n * `loss=Flux.mse`: The loss function which the network will optimize. Should be a function which can be called in the form `loss(yhat, y)`. Possible loss functions are listed in [the Flux loss function documentation](https://fluxml.ai/Flux.jl/stable/models/losses/). For a regression task, natural loss functions are:\n\n * `Flux.mse`\n * `Flux.mae`\n * `Flux.msle`\n * `Flux.huber_loss`\n\n Currently MLJ measures are not supported as loss functions here.\n * `epochs::Int=10`: The duration of training, in epochs. Typically, one epoch represents one pass through the complete training dataset.\n * `batch_size::Int=1`: the batch size to be used for training, representing the number of samples per update of the network weights. Typically, batch size is between `8` and `512`. Increasing batch size may accelerate training if `acceleration=CUDALibs()` and a GPU is available.\n * `lambda::Float64=0`: The strength of the weight regularization penalty. Can be any value in the range `[0, ∞)`. Note the history reports unpenalized losses.\n * `alpha::Float64=0`: The L2/L1 mix of regularization, in the range `[0, 1]`. A value of 0 represents L2 regularization, and a value of 1 represents L1 regularization.\n * `rng::Union{AbstractRNG, Int64}`: The random number generator or seed used during training. The default is `Random.default_rng()`.\n * `optimizer_changes_trigger_retraining::Bool=false`: Defines what happens when re-fitting a machine if the associated optimiser has changed. If `true`, the associated machine will retrain from scratch on `fit!` call, otherwise it will not.\n * `acceleration::AbstractResource=CPU1()`: Defines on what hardware training is done. For training on GPU, use `CUDALibs()`.\n\n# Operations\n\n * `predict(mach, Xnew)`: return predictions of the target given new features `Xnew` having the same scitype as `X` above. Predictions are deterministic.\n\n# Fitted parameters\n\nThe fields of `fitted_params(mach)` are:\n\n * `chain`: The trained \"chain\" (Flux.jl model), namely the series of layers, functions, and activations which make up the neural network.\n\n# Report\n\nThe fields of `report(mach)` are:\n\n * `training_losses`: A vector of training losses (penalised if `lambda != 0`) in historical order, of length `epochs + 1`. 
The first element is the pre-training loss.\n\n# Examples\n\nIn this example we apply a multi-target regression model to synthetic data:\n\n```julia\nusing MLJ\nimport MLJFlux\nusing Flux\nimport Optimisers\n```\n\nFirst, we generate some synthetic data (needs MLJBase 0.20.16 or higher):\n\n```julia\nX, y = make_regression(100, 9; n_targets = 2) # both tables\nschema(y)\nschema(X)\n```\n\nSplitting off a test set:\n\n```julia\n(X, Xtest), (y, ytest) = partition((X, y), 0.7, multi=true);\n```\n\nNext, we can define a `builder`, making use of a convenience macro to do so. In the following `@builder` call, `n_in` is a proxy for the number of input features and `n_out` the number of target variables (both known at `fit!` time), while `rng` is a proxy for an RNG (which will be passed from the `rng` field of `model` defined below).\n\n```julia\nbuilder = MLJFlux.@builder begin\n init=Flux.glorot_uniform(rng)\n Chain(\n Dense(n_in, 64, relu, init=init),\n Dense(64, 32, relu, init=init),\n Dense(32, n_out, init=init),\n )\nend\n```\n\nInstantiating the regression model:\n\n```julia\nMultitargetNeuralNetworkRegressor = @load MultitargetNeuralNetworkRegressor\nmodel = MultitargetNeuralNetworkRegressor(builder=builder, rng=123, epochs=20)\n```\n\nWe will arrange for standardization of the target by wrapping our model in `TransformedTargetModel`, and standardization of the features by inserting the wrapped model in a pipeline:\n\n```julia\npipe = Standardizer |> TransformedTargetModel(model, target=Standardizer)\n```\n\nIf we fit with a high verbosity (>1), we will see the losses during training. We can also see the losses in the output of `report(mach)`:\n\n```julia\nmach = machine(pipe, X, y)\nfit!(mach, verbosity=2)\n\n# first element initial loss, 2:end per epoch training losses\nreport(mach).transformed_target_model_deterministic.model.training_losses\n```\n\nFor experimenting with learning rate, see the [`NeuralNetworkRegressor`](@ref) example.\n\n```julia\npipe.transformed_target_model_deterministic.model.optimiser = Optimisers.Adam(0.0001)\n```\n\nWith the learning rate fixed, we can now compute a CV estimate of the performance (using all data bound to `mach`) and compare this with performance on the test set:\n\n```julia\n# custom MLJ loss:\nmulti_loss(yhat, y) = l2(MLJ.matrix(yhat), MLJ.matrix(y))\n\n# CV estimate, based on `(X, y)`:\nevaluate!(mach, resampling=CV(nfolds=5), measure=multi_loss)\n\n# loss for `(Xtest, ytest)`:\nfit!(mach) # trains on all data `(X, y)`\nyhat = predict(mach, Xtest)\nmulti_loss(yhat, ytest)\n```\n\nSee also [`NeuralNetworkRegressor`](@ref)\n" ":name" = "MultitargetNeuralNetworkRegressor" ":human_name" = "multitarget neural network regressor" ":is_supervised" = "`true`" @@ -8337,6 +8575,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Finite}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "MLJFlux" ":package_license" = "MIT" @@ -8347,7 +8586,7 @@ ":supports_weights" = "`false`" ":supports_class_weights" = "`false`" ":supports_online" = "`false`" -":docstring" = "```\nNeuralNetworkClassifier\n```\n\nA model type for constructing a neural network classifier, based on [MLJFlux.jl](https://github.com/alan-turing-institute/MLJFlux.jl), and implementing the MLJ model interface.\n\nFrom MLJ, the type can be imported using\n\n```\nNeuralNetworkClassifier = @load 
NeuralNetworkClassifier pkg=MLJFlux\n```\n\nDo `model = NeuralNetworkClassifier()` to construct an instance with default hyper-parameters. Provide keyword arguments to override hyper-parameter defaults, as in `NeuralNetworkClassifier(builder=...)`.\n\n`NeuralNetworkClassifier` is for training a data-dependent Flux.jl neural network for making probabilistic predictions of a `Multiclass` or `OrderedFactor` target, given a table of `Continuous` features. Users provide a recipe for constructing the network, based on properties of the data that is encountered, by specifying an appropriate `builder`. See MLJFlux documentation for more on builders.\n\n# Training data\n\nIn MLJ or MLJBase, bind an instance `model` to data with\n\n```\nmach = machine(model, X, y)\n```\n\nHere:\n\n * `X` is either a `Matrix` or any table of input features (eg, a `DataFrame`) whose columns are of scitype `Continuous`; check column scitypes with `schema(X)`. If `X` is a `Matrix`, it is assumed to have columns corresponding to features and rows corresponding to observations.\n * `y` is the target, which can be any `AbstractVector` whose element scitype is `Multiclass` or `OrderedFactor`; check the scitype with `scitype(y)`\n\nTrain the machine with `fit!(mach, rows=...)`.\n\n# Hyper-parameters\n\n * `builder=MLJFlux.Short()`: An MLJFlux builder that constructs a neural network. Possible `builders` include: `MLJFlux.Linear`, `MLJFlux.Short`, and `MLJFlux.MLP`. See MLJFlux.jl documentation for examples of user-defined builders. See also `finaliser` below.\n * `optimiser::Flux.Adam()`: A `Flux.Optimise` optimiser. The optimiser performs the updating of the weights of the network. For further reference, see [the Flux optimiser documentation](https://fluxml.ai/Flux.jl/stable/training/optimisers/). To choose a learning rate (the update rate of the optimizer), a good rule of thumb is to start out at `10e-3`, and tune using powers of 10 between `1` and `1e-7`.\n * `loss=Flux.crossentropy`: The loss function which the network will optimize. Should be a function which can be called in the form `loss(yhat, y)`. Possible loss functions are listed in [the Flux loss function documentation](https://fluxml.ai/Flux.jl/stable/models/losses/). For a classification task, the most natural loss functions are:\n\n * `Flux.crossentropy`: Standard multiclass classification loss, also known as the log loss.\n * `Flux.logitcrossentopy`: Mathematically equal to crossentropy, but numerically more stable than finalising the outputs with `softmax` and then calculating crossentropy. You will need to specify `finaliser=identity` to remove MLJFlux's default softmax finaliser, and understand that the output of `predict` is then unnormalized (no longer probabilistic).\n * `Flux.tversky_loss`: Used with imbalanced data to give more weight to false negatives.\n * `Flux.focal_loss`: Used with highly imbalanced data. Weights harder examples more than easier examples.\n\n Currently MLJ measures are not supported values of `loss`.\n * `epochs::Int=10`: The duration of training, in epochs. Typically, one epoch represents one pass through the complete the training dataset.\n * `batch_size::int=1`: the batch size to be used for training, representing the number of samples per update of the network weights. Typically, batch size is between 8 and\n\n 512. Increassing batch size may accelerate training if `acceleration=CUDALibs()` and a\n\n GPU is available.\n * `lambda::Float64=0`: The strength of the weight regularization penalty. 
Can be any value in the range `[0, ∞)`.\n * `alpha::Float64=0`: The L2/L1 mix of regularization, in the range `[0, 1]`. A value of 0 represents L2 regularization, and a value of 1 represents L1 regularization.\n * `rng::Union{AbstractRNG, Int64}`: The random number generator or seed used during training.\n * `optimizer_changes_trigger_retraining::Bool=false`: Defines what happens when re-fitting a machine if the associated optimiser has changed. If `true`, the associated machine will retrain from scratch on `fit!` call, otherwise it will not.\n * `acceleration::AbstractResource=CPU1()`: Defines on what hardware training is done. For Training on GPU, use `CUDALibs()`.\n * `finaliser=Flux.softmax`: The final activation function of the neural network (applied after the network defined by `builder`). Defaults to `Flux.softmax`.\n\n# Operations\n\n * `predict(mach, Xnew)`: return predictions of the target given new features `Xnew`, which should have the same scitype as `X` above. Predictions are probabilistic but uncalibrated.\n * `predict_mode(mach, Xnew)`: Return the modes of the probabilistic predictions returned above.\n\n# Fitted parameters\n\nThe fields of `fitted_params(mach)` are:\n\n * `chain`: The trained \"chain\" (Flux.jl model), namely the series of layers, functions, and activations which make up the neural network. This includes the final layer specified by `finaliser` (eg, `softmax`).\n\n# Report\n\nThe fields of `report(mach)` are:\n\n * `training_losses`: A vector of training losses (penalised if `lambda != 0`) in historical order, of length `epochs + 1`. The first element is the pre-training loss.\n\n# Examples\n\nIn this example we build a classification model using the Iris dataset. This is a very basic example, using a default builder and no standardization. For a more advanced illustration, see [`NeuralNetworkRegressor`](@ref) or [`ImageClassifier`](@ref), and examples in the MLJFlux.jl documentation.\n\n```julia\nusing MLJ\nusing Flux\nimport RDatasets\n```\n\nFirst, we can load the data:\n\n```julia\niris = RDatasets.dataset(\"datasets\", \"iris\");\ny, X = unpack(iris, ==(:Species), rng=123); # a vector and a table\nNeuralNetworkClassifier = @load NeuralNetworkClassifier pkg=MLJFlux\nclf = NeuralNetworkClassifier()\n```\n\nNext, we can train the model:\n\n```julia\nmach = machine(clf, X, y)\nfit!(mach)\n```\n\nWe can train the model in an incremental fashion, altering the learning rate as we go, provided `optimizer_changes_trigger_retraining` is `false` (the default). 
Here, we also change the number of (total) iterations:\n\n```julia\nclf.optimiser.eta = clf.optimiser.eta * 2\nclf.epochs = clf.epochs + 5\n\nfit!(mach, verbosity=2) # trains 5 more epochs\n```\n\nWe can inspect the mean training loss using the `cross_entropy` function:\n\n```julia\ntraining_loss = cross_entropy(predict(mach, X), y) |> mean\n```\n\nAnd we can access the Flux chain (model) using `fitted_params`:\n\n```julia\nchain = fitted_params(mach).chain\n```\n\nFinally, we can see how the out-of-sample performance changes over time, using MLJ's `learning_curve` function:\n\n```julia\nr = range(clf, :epochs, lower=1, upper=200, scale=:log10)\ncurve = learning_curve(clf, X, y,\n range=r,\n resampling=Holdout(fraction_train=0.7),\n measure=cross_entropy)\nusing Plots\nplot(curve.parameter_values,\n curve.measurements,\n xlab=curve.parameter_name,\n xscale=curve.parameter_scale,\n ylab = \"Cross Entropy\")\n\n```\n\nSee also [`ImageClassifier`](@ref).\n" +":docstring" = "```\nNeuralNetworkClassifier\n```\n\nA model type for constructing a neural network classifier, based on [MLJFlux.jl](https://github.com/alan-turing-institute/MLJFlux.jl), and implementing the MLJ model interface.\n\nFrom MLJ, the type can be imported using\n\n```\nNeuralNetworkClassifier = @load NeuralNetworkClassifier pkg=MLJFlux\n```\n\nDo `model = NeuralNetworkClassifier()` to construct an instance with default hyper-parameters. Provide keyword arguments to override hyper-parameter defaults, as in `NeuralNetworkClassifier(builder=...)`.\n\n`NeuralNetworkClassifier` is for training a data-dependent Flux.jl neural network for making probabilistic predictions of a `Multiclass` or `OrderedFactor` target, given a table of `Continuous` features. Users provide a recipe for constructing the network, based on properties of the data that is encountered, by specifying an appropriate `builder`. See MLJFlux documentation for more on builders.\n\n# Training data\n\nIn MLJ or MLJBase, bind an instance `model` to data with\n\n```\nmach = machine(model, X, y)\n```\n\nHere:\n\n * `X` is either a `Matrix` or any table of input features (eg, a `DataFrame`) whose columns are of scitype `Continuous`; check column scitypes with `schema(X)`. If `X` is a `Matrix`, it is assumed to have columns corresponding to features and rows corresponding to observations.\n * `y` is the target, which can be any `AbstractVector` whose element scitype is `Multiclass` or `OrderedFactor`; check the scitype with `scitype(y)`.\n\nTrain the machine with `fit!(mach, rows=...)`.\n\n# Hyper-parameters\n\n * `builder=MLJFlux.Short()`: An MLJFlux builder that constructs a neural network. Possible `builders` include: `MLJFlux.Linear`, `MLJFlux.Short`, and `MLJFlux.MLP`. See MLJFlux.jl documentation for examples of user-defined builders. See also `finaliser` below.\n * `optimiser=Optimisers.Adam()`: An Optimisers.jl optimiser. The optimiser performs the updating of the weights of the network. To choose a learning rate (the update rate of the optimizer), a good rule of thumb is to start out at `10e-3`, and tune using powers of `10` between `1` and `1e-7`.\n * `loss=Flux.crossentropy`: The loss function which the network will optimize. Should be a function which can be called in the form `loss(yhat, y)`. Possible loss functions are listed in [the Flux loss function documentation](https://fluxml.ai/Flux.jl/stable/models/losses/). 
For a classification task, the most natural loss functions are:\n\n * `Flux.crossentropy`: Standard multiclass classification loss, also known as the log loss.\n * `Flux.logitcrossentropy`: Mathematically equal to crossentropy, but numerically more stable than finalising the outputs with `softmax` and then calculating crossentropy. You will need to specify `finaliser=identity` to remove MLJFlux's default softmax finaliser, and understand that the output of `predict` is then unnormalized (no longer probabilistic).\n * `Flux.tversky_loss`: Used with imbalanced data to give more weight to false negatives.\n * `Flux.focal_loss`: Used with highly imbalanced data. Weights harder examples more than easier examples.\n\n Currently, MLJ measures are not supported as values of `loss`.\n * `epochs::Int=10`: The duration of training, in epochs. Typically, one epoch represents one pass through the complete training dataset.\n * `batch_size::Int=1`: the batch size to be used for training, representing the number of samples per update of the network weights. Typically, batch size is between `8` and `512`. Increasing batch size may accelerate training if `acceleration=CUDALibs()` and a GPU is available.\n * `lambda::Float64=0`: The strength of the weight regularization penalty. Can be any value in the range `[0, ∞)`. Note the history reports unpenalized losses.\n * `alpha::Float64=0`: The L2/L1 mix of regularization, in the range `[0, 1]`. A value of 0 represents L2 regularization, and a value of 1 represents L1 regularization.\n * `rng::Union{AbstractRNG, Int64}`: The random number generator or seed used during training. The default is `Random.default_rng()`.\n * `optimizer_changes_trigger_retraining::Bool=false`: Defines what happens when re-fitting a machine if the associated optimiser has changed. If `true`, the associated machine will retrain from scratch on `fit!` call, otherwise it will not.\n * `acceleration::AbstractResource=CPU1()`: Defines on what hardware training is done. For training on GPU, use `CUDALibs()`.\n * `finaliser=Flux.softmax`: The final activation function of the neural network (applied after the network defined by `builder`). Defaults to `Flux.softmax`.\n\n# Operations\n\n * `predict(mach, Xnew)`: return predictions of the target given new features `Xnew`, which should have the same scitype as `X` above. Predictions are probabilistic but uncalibrated.\n * `predict_mode(mach, Xnew)`: Return the modes of the probabilistic predictions returned above.\n\n# Fitted parameters\n\nThe fields of `fitted_params(mach)` are:\n\n * `chain`: The trained \"chain\" (Flux.jl model), namely the series of layers, functions, and activations which make up the neural network. This includes the final layer specified by `finaliser` (eg, `softmax`).\n\n# Report\n\nThe fields of `report(mach)` are:\n\n * `training_losses`: A vector of training losses (penalised if `lambda != 0`) in historical order, of length `epochs + 1`. The first element is the pre-training loss.\n\n# Examples\n\nIn this example we build a classification model using the Iris dataset. This is a very basic example, using a default builder and no standardization. 
For a more advanced illustration, see [`NeuralNetworkRegressor`](@ref) or [`ImageClassifier`](@ref), and examples in the MLJFlux.jl documentation.\n\n```julia\nusing MLJ\nusing Flux\nimport RDatasets\nimport Optimisers\n```\n\nFirst, we can load the data:\n\n```julia\niris = RDatasets.dataset(\"datasets\", \"iris\");\ny, X = unpack(iris, ==(:Species), rng=123); # a vector and a table\nNeuralNetworkClassifier = @load NeuralNetworkClassifier pkg=MLJFlux\nclf = NeuralNetworkClassifier()\n```\n\nNext, we can train the model:\n\n```julia\nmach = machine(clf, X, y)\nfit!(mach)\n```\n\nWe can train the model in an incremental fashion, altering the learning rate as we go, provided `optimiser_changes_trigger_retraining` is `false` (the default). Here, we also change the number of (total) iterations:\n\n```julia\nclf.optimiser = Optimisers.Adam(clf.optimiser.eta * 2)\nclf.epochs = clf.epochs + 5\n\nfit!(mach, verbosity=2) # trains 5 more epochs\n```\n\nWe can inspect the mean training loss using the `cross_entropy` function:\n\n```julia\ntraining_loss = cross_entropy(predict(mach, X), y)\n```\n\nAnd we can access the Flux chain (model) using `fitted_params`:\n\n```julia\nchain = fitted_params(mach).chain\n```\n\nFinally, we can see how the out-of-sample performance changes over time, using MLJ's `learning_curve` function:\n\n```julia\nr = range(clf, :epochs, lower=1, upper=200, scale=:log10)\ncurve = learning_curve(clf, X, y,\n range=r,\n resampling=Holdout(fraction_train=0.7),\n measure=cross_entropy)\nusing Plots\nplot(curve.parameter_values,\n curve.measurements,\n xlab=curve.parameter_name,\n xscale=curve.parameter_scale,\n ylab = \"Cross Entropy\")\n\n```\n\nSee also [`ImageClassifier`](@ref), [`NeuralNetworkBinaryClassifier`](@ref).\n" ":name" = "NeuralNetworkClassifier" ":human_name" = "neural network classifier" ":is_supervised" = "`true`" @@ -8372,6 +8611,7 @@ ":predict_scitype" = "`AbstractVector{ScientificTypesBase.Density{_s25} where _s25<:ScientificTypesBase.Multiclass}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "MLJFlux" ":package_license" = "MIT" @@ -8382,7 +8622,7 @@ ":supports_weights" = "`false`" ":supports_class_weights" = "`false`" ":supports_online" = "`false`" -":docstring" = "```\nImageClassifier\n```\n\nA model type for constructing a image classifier, based on [MLJFlux.jl](https://github.com/alan-turing-institute/MLJFlux.jl), and implementing the MLJ model interface.\n\nFrom MLJ, the type can be imported using\n\n```\nImageClassifier = @load ImageClassifier pkg=MLJFlux\n```\n\nDo `model = ImageClassifier()` to construct an instance with default hyper-parameters. Provide keyword arguments to override hyper-parameter defaults, as in `ImageClassifier(builder=...)`.\n\n`ImageClassifier` classifies images using a neural network adapted to the type of images provided (color or gray scale). Predictions are probabilistic. Users provide a recipe for constructing the network, based on properties of the image encountered, by specifying an appropriate `builder`. 
See MLJFlux documentation for more on builders.\n\n# Training data\n\nIn MLJ or MLJBase, bind an instance `model` to data with\n\n```\nmach = machine(model, X, y)\n```\n\nHere:\n\n * `X` is any `AbstractVector` of images with `ColorImage` or `GrayImage` scitype; check the scitype with `scitype(X)` and refer to ScientificTypes.jl documentation on coercing typical image formats into an appropriate type.\n * `y` is the target, which can be any `AbstractVector` whose element scitype is `Multiclass`; check the scitype with `scitype(y)`.\n\nTrain the machine with `fit!(mach, rows=...)`.\n\n# Hyper-parameters\n\n * `builder`: An MLJFlux builder that constructs the neural network. The fallback builds a depth-16 VGG architecture adapted to the image size and number of target classes, with no batch normalization; see the Metalhead.jl documentation for details. See the example below for a user-specified builder. A convenience macro `@builder` is also available. See also `finaliser` below.\n * `optimiser::Flux.Adam()`: A `Flux.Optimise` optimiser. The optimiser performs the updating of the weights of the network. For further reference, see [the Flux optimiser documentation](https://fluxml.ai/Flux.jl/stable/training/optimisers/). To choose a learning rate (the update rate of the optimizer), a good rule of thumb is to start out at `10e-3`, and tune using powers of 10 between `1` and `1e-7`.\n * `loss=Flux.crossentropy`: The loss function which the network will optimize. Should be a function which can be called in the form `loss(yhat, y)`. Possible loss functions are listed in [the Flux loss function documentation](https://fluxml.ai/Flux.jl/stable/models/losses/). For a classification task, the most natural loss functions are:\n\n * `Flux.crossentropy`: Standard multiclass classification loss, also known as the log loss.\n * `Flux.logitcrossentopy`: Mathematically equal to crossentropy, but numerically more stable than finalising the outputs with `softmax` and then calculating crossentropy. You will need to specify `finaliser=identity` to remove MLJFlux's default softmax finaliser, and understand that the output of `predict` is then unnormalized (no longer probabilistic).\n * `Flux.tversky_loss`: Used with imbalanced data to give more weight to false negatives.\n * `Flux.focal_loss`: Used with highly imbalanced data. Weights harder examples more than easier examples.\n\n Currently MLJ measures are not supported values of `loss`.\n * `epochs::Int=10`: The duration of training, in epochs. Typically, one epoch represents one pass through the complete the training dataset.\n * `batch_size::int=1`: the batch size to be used for training, representing the number of samples per update of the network weights. Typically, batch size is between 8 and\n\n 512. Increassing batch size may accelerate training if `acceleration=CUDALibs()` and a\n\n GPU is available.\n * `lambda::Float64=0`: The strength of the weight regularization penalty. Can be any value in the range `[0, ∞)`.\n * `alpha::Float64=0`: The L2/L1 mix of regularization, in the range `[0, 1]`. A value of 0 represents L2 regularization, and a value of 1 represents L1 regularization.\n * `rng::Union{AbstractRNG, Int64}`: The random number generator or seed used during training.\n * `optimizer_changes_trigger_retraining::Bool=false`: Defines what happens when re-fitting a machine if the associated optimiser has changed. 
If `true`, the associated machine will retrain from scratch on `fit!` call, otherwise it will not.\n * `acceleration::AbstractResource=CPU1()`: Defines on what hardware training is done. For Training on GPU, use `CUDALibs()`.\n * `finaliser=Flux.softmax`: The final activation function of the neural network (applied after the network defined by `builder`). Defaults to `Flux.softmax`.\n\n# Operations\n\n * `predict(mach, Xnew)`: return predictions of the target given new features `Xnew`, which should have the same scitype as `X` above. Predictions are probabilistic but uncalibrated.\n * `predict_mode(mach, Xnew)`: Return the modes of the probabilistic predictions returned above.\n\n# Fitted parameters\n\nThe fields of `fitted_params(mach)` are:\n\n * `chain`: The trained \"chain\" (Flux.jl model), namely the series of layers, functions, and activations which make up the neural network. This includes the final layer specified by `finaliser` (eg, `softmax`).\n\n# Report\n\nThe fields of `report(mach)` are:\n\n * `training_losses`: A vector of training losses (penalised if `lambda != 0`) in historical order, of length `epochs + 1`. The first element is the pre-training loss.\n\n# Examples\n\nIn this example we use MLJFlux and a custom builder to classify the MNIST image dataset.\n\n```julia\nusing MLJ\nusing Flux\nimport MLJFlux\nimport MLJIteration # for `skip` control\n```\n\nFirst we want to download the MNIST dataset, and unpack into images and labels:\n\n```julia\nimport MLDatasets: MNIST\ndata = MNIST(split=:train)\nimages, labels = data.features, data.targets\n```\n\nIn MLJ, integers cannot be used for encoding categorical data, so we must coerce them into the `Multiclass` scitype:\n\n```julia\nlabels = coerce(labels, Multiclass);\n```\n\nAbove `images` is a single array but MLJFlux requires the images to be a vector of individual image arrays:\n\n```\nimages = coerce(images, GrayImage);\nimages[1]\n```\n\nWe start by defining a suitable `builder` object. This is a recipe for building the neural network. Our builder will work for images of any (constant) size, whether they be color or black and white (ie, single or multi-channel). The architecture always consists of six alternating convolution and max-pool layers, and a final dense layer; the filter size and the number of channels after each convolution layer is customizable.\n\n```julia\nimport MLJFlux\n\nstruct MyConvBuilder\n filter_size::Int\n channels1::Int\n channels2::Int\n channels3::Int\nend\n\nmake2d(x::AbstractArray) = reshape(x, :, size(x)[end])\n\nfunction MLJFlux.build(b::MyConvBuilder, rng, n_in, n_out, n_channels)\n k, c1, c2, c3 = b.filter_size, b.channels1, b.channels2, b.channels3\n mod(k, 2) == 1 || error(\"`filter_size` must be odd. \")\n p = div(k - 1, 2) # padding to preserve image size\n init = Flux.glorot_uniform(rng)\n front = Chain(\n Conv((k, k), n_channels => c1, pad=(p, p), relu, init=init),\n MaxPool((2, 2)),\n Conv((k, k), c1 => c2, pad=(p, p), relu, init=init),\n MaxPool((2, 2)),\n Conv((k, k), c2 => c3, pad=(p, p), relu, init=init),\n MaxPool((2 ,2)),\n make2d)\n d = Flux.outputsize(front, (n_in..., n_channels, 1)) |> first\n return Chain(front, Dense(d, n_out, init=init))\nend\n```\n\nIt is important to note that in our `build` function, there is no final `softmax`. This is applied by default in all MLJFlux classifiers (override this using the `finaliser` hyperparameter).\n\nNow that our builder is defined, we can instantiate the actual MLJFlux model. 
If you have a GPU, you can substitute in `acceleration=CUDALibs()` below to speed up training.\n\n```julia\nImageClassifier = @load ImageClassifier pkg=MLJFlux\nclf = ImageClassifier(builder=MyConvBuilder(3, 16, 32, 32),\n batch_size=50,\n epochs=10,\n rng=123)\n```\n\nYou can add Flux options such as `optimiser` and `loss` in the snippet above. Currently, `loss` must be a flux-compatible loss, and not an MLJ measure.\n\nNext, we can bind the model with the data in a machine, and train using the first 500 images:\n\n```julia\nmach = machine(clf, images, labels);\nfit!(mach, rows=1:500, verbosity=2);\nreport(mach)\nchain = fitted_params(mach)\nFlux.params(chain)[2]\n```\n\nWe can tack on 20 more epochs by modifying the `epochs` field, and iteratively fit some more:\n\n```julia\nclf.epochs = clf.epochs + 20\nfit!(mach, rows=1:500, verbosity=2);\n```\n\nWe can also make predictions and calculate an out-of-sample loss estimate, using any MLJ measure (loss/score):\n\n```julia\npredicted_labels = predict(mach, rows=501:1000);\ncross_entropy(predicted_labels, labels[501:1000]) |> mean\n```\n\nThe preceding `fit!`/`predict`/evaluate workflow can be alternatively executed as follows:\n\n```julia\nevaluate!(mach,\n resampling=Holdout(fraction_train=0.5),\n measure=cross_entropy,\n rows=1:1000,\n verbosity=0)\n```\n\nSee also [`NeuralNetworkClassifier`](@ref).\n" +":docstring" = "```\nImageClassifier\n```\n\nA model type for constructing an image classifier, based on [MLJFlux.jl](https://github.com/alan-turing-institute/MLJFlux.jl), and implementing the MLJ model interface.\n\nFrom MLJ, the type can be imported using\n\n```\nImageClassifier = @load ImageClassifier pkg=MLJFlux\n```\n\nDo `model = ImageClassifier()` to construct an instance with default hyper-parameters. Provide keyword arguments to override hyper-parameter defaults, as in `ImageClassifier(builder=...)`.\n\n`ImageClassifier` classifies images using a neural network adapted to the type of images provided (color or gray scale). Predictions are probabilistic. Users provide a recipe for constructing the network, based on properties of the image encountered, by specifying an appropriate `builder`. See MLJFlux documentation for more on builders.\n\n# Training data\n\nIn MLJ or MLJBase, bind an instance `model` to data with\n\n```\nmach = machine(model, X, y)\n```\n\nHere:\n\n * `X` is any `AbstractVector` of images with `ColorImage` or `GrayImage` scitype; check the scitype with `scitype(X)` and refer to ScientificTypes.jl documentation on coercing typical image formats into an appropriate type.\n * `y` is the target, which can be any `AbstractVector` whose element scitype is `Multiclass`; check the scitype with `scitype(y)`.\n\nTrain the machine with `fit!(mach, rows=...)`.\n\n# Hyper-parameters\n\n * `builder`: An MLJFlux builder that constructs the neural network. The fallback builds a depth-16 VGG architecture adapted to the image size and number of target classes, with no batch normalization; see the Metalhead.jl documentation for details. See the example below for a user-specified builder. A convenience macro `@builder` is also available. See also `finaliser` below.\n * `optimiser::Optimisers.Adam()`: An Optimisers.jl optimiser. The optimiser performs the updating of the weights of the network. To choose a learning rate (the update rate of the optimizer), a good rule of thumb is to start out at `10e-3`, and tune using powers of `10` between `1` and `1e-7`.\n * `loss=Flux.crossentropy`: The loss function which the network will optimize. 
Should be a function which can be called in the form `loss(yhat, y)`. Possible loss functions are listed in [the Flux loss function documentation](https://fluxml.ai/Flux.jl/stable/models/losses/). For a classification task, the most natural loss functions are:\n\n * `Flux.crossentropy`: Standard multiclass classification loss, also known as the log loss.\n * `Flux.logitcrossentropy`: Mathematically equal to crossentropy, but numerically more stable than finalising the outputs with `softmax` and then calculating crossentropy. You will need to specify `finaliser=identity` to remove MLJFlux's default softmax finaliser, and understand that the output of `predict` is then unnormalized (no longer probabilistic).\n * `Flux.tversky_loss`: Used with imbalanced data to give more weight to false negatives.\n * `Flux.focal_loss`: Used with highly imbalanced data. Weights harder examples more than easier examples.\n\n Currently MLJ measures are not supported values of `loss`.\n * `epochs::Int=10`: The duration of training, in epochs. Typically, one epoch represents one pass through the complete training dataset.\n * `batch_size::Int=1`: The batch size to be used for training, representing the number of samples per update of the network weights. Typically, batch size is between `8` and `512`. Increasing batch size may accelerate training if `acceleration=CUDALibs()` and a GPU is available.\n * `lambda::Float64=0`: The strength of the weight regularization penalty. Can be any value in the range `[0, ∞)`. Note the history reports unpenalized losses.\n * `alpha::Float64=0`: The L2/L1 mix of regularization, in the range `[0, 1]`. A value of 0 represents L2 regularization, and a value of 1 represents L1 regularization.\n * `rng::Union{AbstractRNG, Int64}`: The random number generator or seed used during training. The default is `Random.default_rng()`.\n * `optimiser_changes_trigger_retraining::Bool=false`: Defines what happens when re-fitting a machine if the associated optimiser has changed. If `true`, the associated machine will retrain from scratch on `fit!` call, otherwise it will not.\n * `acceleration::AbstractResource=CPU1()`: Defines on what hardware training is done. For training on a GPU, use `CUDALibs()`.\n * `finaliser=Flux.softmax`: The final activation function of the neural network (applied after the network defined by `builder`). Defaults to `Flux.softmax`.\n\n# Operations\n\n * `predict(mach, Xnew)`: Return predictions of the target given new features `Xnew`, which should have the same scitype as `X` above. Predictions are probabilistic but uncalibrated.\n * `predict_mode(mach, Xnew)`: Return the modes of the probabilistic predictions returned above.\n\n# Fitted parameters\n\nThe fields of `fitted_params(mach)` are:\n\n * `chain`: The trained \"chain\" (Flux.jl model), namely the series of layers, functions, and activations which make up the neural network. This includes the final layer specified by `finaliser` (eg, `softmax`).\n\n# Report\n\nThe fields of `report(mach)` are:\n\n * `training_losses`: A vector of training losses (penalised if `lambda != 0`) in historical order, of length `epochs + 1`. 
The first element is the pre-training loss.\n\n# Examples\n\nIn this example we use MLJFlux and a custom builder to classify the MNIST image dataset.\n\n```julia\nusing MLJ\nusing Flux\nimport MLJFlux\nimport Optimisers\nimport MLJIteration # for `skip` control\n```\n\nFirst, we download the MNIST dataset and unpack it into images and labels:\n\n```julia\nimport MLDatasets: MNIST\ndata = MNIST(split=:train)\nimages, labels = data.features, data.targets\n```\n\nIn MLJ, integers cannot be used for encoding categorical data, so we must coerce them into the `Multiclass` scitype:\n\n```julia\nlabels = coerce(labels, Multiclass);\n```\n\nAbove, `images` is a single array, but MLJFlux requires the images to be a vector of individual image arrays:\n\n```julia\nimages = coerce(images, GrayImage);\nimages[1]\n```\n\nWe start by defining a suitable `builder` object. This is a recipe for building the neural network. Our builder will work for images of any (constant) size, whether they be color or black and white (ie, single or multi-channel). The architecture always consists of six alternating convolution and max-pool layers, and a final dense layer; the filter size and the number of channels after each convolution layer are customizable.\n\n```julia\nimport MLJFlux\n\nstruct MyConvBuilder\n filter_size::Int\n channels1::Int\n channels2::Int\n channels3::Int\nend\n\nmake2d(x::AbstractArray) = reshape(x, :, size(x)[end])\n\nfunction MLJFlux.build(b::MyConvBuilder, rng, n_in, n_out, n_channels)\n k, c1, c2, c3 = b.filter_size, b.channels1, b.channels2, b.channels3\n mod(k, 2) == 1 || error(\"`filter_size` must be odd.\")\n p = div(k - 1, 2) # padding to preserve image size\n init = Flux.glorot_uniform(rng)\n front = Chain(\n Conv((k, k), n_channels => c1, pad=(p, p), relu, init=init),\n MaxPool((2, 2)),\n Conv((k, k), c1 => c2, pad=(p, p), relu, init=init),\n MaxPool((2, 2)),\n Conv((k, k), c2 => c3, pad=(p, p), relu, init=init),\n MaxPool((2, 2)),\n make2d)\n d = Flux.outputsize(front, (n_in..., n_channels, 1)) |> first\n return Chain(front, Dense(d, n_out, init=init))\nend\n```\n\nIt is important to note that in our `build` function, there is no final `softmax`. This is applied by default in all MLJFlux classifiers (override this using the `finaliser` hyperparameter).\n\nNow that our builder is defined, we can instantiate the actual MLJFlux model. If you have a GPU, you can substitute in `acceleration=CUDALibs()` below to speed up training.\n\n```julia\nImageClassifier = @load ImageClassifier pkg=MLJFlux\nclf = ImageClassifier(builder=MyConvBuilder(3, 16, 32, 32),\n batch_size=50,\n epochs=10,\n rng=123)\n```\n\nYou can add Flux options such as `optimiser` and `loss` in the snippet above.
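For instance (a sketch only; these particular hyper-parameter values are hypothetical):

```julia
clf = ImageClassifier(builder=MyConvBuilder(3, 16, 32, 32),
                      batch_size=50,
                      epochs=10,
                      rng=123,
                      optimiser=Optimisers.Adam(0.001),  # an Optimisers.jl rule
                      loss=Flux.crossentropy)            # a Flux loss function
```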
Currently, `loss` must be a Flux-compatible loss, and not an MLJ measure.\n\nNext, we can bind the model with the data in a machine, and train using the first 500 images:\n\n```julia\nmach = machine(clf, images, labels);\nfit!(mach, rows=1:500, verbosity=2);\nreport(mach)\nchain = fitted_params(mach).chain\nFlux.params(chain)[2]\n```\n\nWe can tack on 20 more epochs by modifying the `epochs` field, and iteratively fit some more:\n\n```julia\nclf.epochs = clf.epochs + 20\nfit!(mach, rows=1:500, verbosity=2);\n```\n\nWe can also make predictions and calculate an out-of-sample loss estimate, using any MLJ measure (loss/score):\n\n```julia\npredicted_labels = predict(mach, rows=501:1000);\ncross_entropy(predicted_labels, labels[501:1000])\n```\n\nThe preceding `fit!`/`predict`/evaluate workflow can be alternatively executed as follows:\n\n```julia\nevaluate!(mach,\n resampling=Holdout(fraction_train=0.5),\n measure=cross_entropy,\n rows=1:1000,\n verbosity=0)\n```\n\nSee also [`NeuralNetworkClassifier`](@ref).\n" ":name" = "ImageClassifier" ":human_name" = "image classifier" ":is_supervised" = "`true`" @@ -8399,6 +8639,42 @@ ":reporting_operations" = "`()`" ":constructor" = "`nothing`" +[MLJFlux.NeuralNetworkBinaryClassifier] +":input_scitype" = "`Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}, AbstractMatrix{ScientificTypesBase.Continuous}}`" +":output_scitype" = "`ScientificTypesBase.Unknown`" +":target_scitype" = "`AbstractVector{<:ScientificTypesBase.Binary}`" +":fit_data_scitype" = "`Tuple{Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}, AbstractMatrix{ScientificTypesBase.Continuous}}, AbstractVector{<:ScientificTypesBase.Binary}}`" +":predict_scitype" = "`ScientificTypesBase.Unknown`" +":transform_scitype" = "`ScientificTypesBase.Unknown`" +":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" +":is_pure_julia" = "`true`" +":package_name" = "MLJFlux" +":package_license" = "MIT" +":load_path" = "MLJFlux.NeuralNetworkBinaryClassifier" +":package_uuid" = "094fc8d1-fd35-5302-93ea-dabda2abf845" +":package_url" = "https://github.com/alan-turing-institute/MLJFlux.jl" +":is_wrapper" = "`false`" +":supports_weights" = "`false`" +":supports_class_weights" = "`false`" +":supports_online" = "`false`" +":docstring" = "```\nNeuralNetworkBinaryClassifier\n```\n\nA model type for constructing a neural network binary classifier, based on [MLJFlux.jl](https://github.com/alan-turing-institute/MLJFlux.jl), and implementing the MLJ model interface.\n\nFrom MLJ, the type can be imported using\n\n```\nNeuralNetworkBinaryClassifier = @load NeuralNetworkBinaryClassifier pkg=MLJFlux\n```\n\nDo `model = NeuralNetworkBinaryClassifier()` to construct an instance with default hyper-parameters. Provide keyword arguments to override hyper-parameter defaults, as in `NeuralNetworkBinaryClassifier(builder=...)`.\n\n`NeuralNetworkBinaryClassifier` is for training a data-dependent Flux.jl neural network for making probabilistic predictions of a binary (`Multiclass{2}` or `OrderedFactor{2}`) target, given a table of `Continuous` features. Users provide a recipe for constructing the network, based on properties of the data that is encountered, by specifying an appropriate `builder`. 
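For example (a sketch; the layer sizes are hypothetical, and `MLJFlux.MLP` is one of the ready-made builders listed under "Hyper-parameters" below):

```julia
import MLJFlux

# A multi-layer perceptron builder with two hidden layers (16 and 8 neurons):
builder = MLJFlux.MLP(hidden=(16, 8))
model = NeuralNetworkBinaryClassifier(builder=builder)
```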
See MLJFlux documentation for more on builders.\n\n# Training data\n\nIn MLJ or MLJBase, bind an instance `model` to data with\n\n```\nmach = machine(model, X, y)\n```\n\nHere:\n\n * `X` is either a `Matrix` or any table of input features (eg, a `DataFrame`) whose columns are of scitype `Continuous`; check column scitypes with `schema(X)`. If `X` is a `Matrix`, it is assumed to have columns corresponding to features and rows corresponding to observations.\n * `y` is the target, which can be any `AbstractVector` whose element scitype is `Multiclass{2}` or `OrderedFactor{2}`; check the scitype with `scitype(y)`\n\nTrain the machine with `fit!(mach, rows=...)`.\n\n# Hyper-parameters\n\n * `builder=MLJFlux.Short()`: An MLJFlux builder that constructs a neural network. Possible `builders` include: `MLJFlux.Linear`, `MLJFlux.Short`, and `MLJFlux.MLP`. See MLJFlux.jl documentation for examples of user-defined builders. See also `finaliser` below.\n * `optimiser::Optimisers.Adam()`: An Optimisers.jl optimiser. The optimiser performs the updating of the weights of the network. To choose a learning rate (the update rate of the optimizer), a good rule of thumb is to start out at `10e-3`, and tune using powers of `10` between `1` and `1e-7`.\n * `loss=Flux.binarycrossentropy`: The loss function which the network will optimize. Should be a function which can be called in the form `loss(yhat, y)`. Possible loss functions are listed in [the Flux loss function documentation](https://fluxml.ai/Flux.jl/stable/models/losses/). For a classification task, the most natural loss functions are:\n\n * `Flux.binarycrossentropy`: Standard binary classification loss, also known as the log loss.\n * `Flux.logitbinarycrossentropy`: Mathematically equal to binary crossentropy, but numerically more stable than finalising the outputs with `σ` and then calculating crossentropy. You will need to specify `finaliser=identity` to remove MLJFlux's default sigmoid finaliser, and understand that the output of `predict` is then unnormalized (no longer probabilistic).\n * `Flux.tversky_loss`: Used with imbalanced data to give more weight to false negatives.\n * `Flux.binary_focal_loss`: Used with highly imbalanced data. Weights harder examples more than easier examples.\n\n Currently MLJ measures are not supported values of `loss`.\n * `epochs::Int=10`: The duration of training, in epochs. Typically, one epoch represents one pass through the complete training dataset.\n * `batch_size::Int=1`: The batch size to be used for training, representing the number of samples per update of the network weights. Typically, batch size is between `8` and `512`. Increasing batch size may accelerate training if `acceleration=CUDALibs()` and a GPU is available.\n * `lambda::Float64=0`: The strength of the weight regularization penalty. Can be any value in the range `[0, ∞)`.\n * `alpha::Float64=0`: The L2/L1 mix of regularization, in the range `[0, 1]`. A value of 0 represents L2 regularization, and a value of 1 represents L1 regularization.\n * `rng::Union{AbstractRNG, Int64}`: The random number generator or seed used during training. The default is `Random.default_rng()`.\n * `optimiser_changes_trigger_retraining::Bool=false`: Defines what happens when re-fitting a machine if the associated optimiser has changed. 
If `true`, the associated machine will retrain from scratch on `fit!` call, otherwise it will not.\n * `acceleration::AbstractResource=CPU1()`: Defines on what hardware training is done. For training on a GPU, use `CUDALibs()`.\n * `finaliser=Flux.σ`: The final activation function of the neural network (applied after the network defined by `builder`). Defaults to `Flux.σ`.\n\n# Operations\n\n * `predict(mach, Xnew)`: Return predictions of the target given new features `Xnew`, which should have the same scitype as `X` above. Predictions are probabilistic but uncalibrated.\n * `predict_mode(mach, Xnew)`: Return the modes of the probabilistic predictions returned above.\n\n# Fitted parameters\n\nThe fields of `fitted_params(mach)` are:\n\n * `chain`: The trained \"chain\" (Flux.jl model), namely the series of layers, functions, and activations which make up the neural network. This includes the final layer specified by `finaliser` (eg, `σ`).\n\n# Report\n\nThe fields of `report(mach)` are:\n\n * `training_losses`: A vector of training losses (penalised if `lambda != 0`) in historical order, of length `epochs + 1`. The first element is the pre-training loss.\n\n# Examples\n\nIn this example we build a classification model using the mtcars dataset. This is a very basic example, using a default builder and no standardization. For a more advanced illustration, see [`NeuralNetworkRegressor`](@ref) or [`ImageClassifier`](@ref), and examples in the MLJFlux.jl documentation.\n\n```julia\nusing MLJ, Flux\nimport Optimisers\nimport RDatasets\n```\n\nFirst, we can load the data:\n\n```julia\nmtcars = RDatasets.dataset(\"datasets\", \"mtcars\");\ny, X = unpack(mtcars, ==(:VS), in([:MPG, :Cyl, :Disp, :HP, :WT, :QSec]));\n```\n\nNote that `y` is a vector and `X` a table.\n\n```julia\ny = categorical(y) # classifier takes categorical input\nX_f32 = Float32.(X) # to match floating point type of the neural network layers\nNeuralNetworkBinaryClassifier = @load NeuralNetworkBinaryClassifier pkg=MLJFlux\nbclf = NeuralNetworkBinaryClassifier()\n```\n\nNext, we can train the model:\n\n```julia\nmach = machine(bclf, X_f32, y)\nfit!(mach)\n```\n\nWe can train the model in an incremental fashion, altering the learning rate as we go, provided `optimiser_changes_trigger_retraining` is `false` (the default). 
Here, we also change the number of (total) iterations:\n\n```julia-repl\njulia> bclf.optimiser\nAdam(0.001, (0.9, 0.999), 1.0e-8)\n```\n\n```julia\nbclf.optimiser = Optimisers.Adam(eta = bclf.optimiser.eta * 2)\nbclf.epochs = bclf.epochs + 5\n\nfit!(mach, verbosity=2) # trains 5 more epochs\n```\n\nWe can inspect the mean training loss using the `cross_entropy` function:\n\n```julia\ntraining_loss = cross_entropy(predict(mach, X_f32), y)\n```\n\nAnd we can access the Flux chain (model) using `fitted_params`:\n\n```julia\nchain = fitted_params(mach).chain\n```\n\nFinally, we can see how the out-of-sample performance changes over time, using MLJ's `learning_curve` function:\n\n```julia\nr = range(bclf, :epochs, lower=1, upper=200, scale=:log10)\ncurve = learning_curve(\n bclf,\n X_f32,\n y,\n range=r,\n resampling=Holdout(fraction_train=0.7),\n measure=cross_entropy,\n)\nusing Plots\nplot(\n curve.parameter_values,\n curve.measurements,\n xlab=curve.parameter_name,\n xscale=curve.parameter_scale,\n ylab = \"Cross Entropy\",\n)\n\n```\n\nSee also [`ImageClassifier`](@ref).\n" +":name" = "NeuralNetworkBinaryClassifier" +":human_name" = "neural network binary classifier" +":is_supervised" = "`true`" +":prediction_type" = ":probabilistic" +":abstract_type" = "`MLJModelInterface.Probabilistic`" +":implemented_methods" = [":predict"] +":hyperparameters" = "`(:builder, :finaliser, :optimiser, :loss, :epochs, :batch_size, :lambda, :alpha, :rng, :optimiser_changes_trigger_retraining, :acceleration)`" +":hyperparameter_types" = "`(\"Any\", \"Any\", \"Any\", \"Any\", \"Int64\", \"Int64\", \"Float64\", \"Float64\", \"Union{Int64, Random.AbstractRNG}\", \"Bool\", \"ComputationalResources.AbstractResource\")`" +":hyperparameter_ranges" = "`(nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing, nothing)`" +":iteration_parameter" = ":epochs" +":supports_training_losses" = "`true`" +":reports_feature_importances" = "`false`" +":deep_properties" = "`(:optimiser, :builder)`" +":reporting_operations" = "`()`" +":constructor" = "`nothing`" + [MLJFlux.NeuralNetworkRegressor] ":input_scitype" = "`Union{ScientificTypesBase.Table{<:AbstractVector{<:ScientificTypesBase.Continuous}}, AbstractMatrix{ScientificTypesBase.Continuous}}`" ":output_scitype" = "`ScientificTypesBase.Unknown`" @@ -8407,6 +8683,7 @@ ":predict_scitype" = "`AbstractVector{<:ScientificTypesBase.Continuous}`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`true`" ":package_name" = "MLJFlux" ":package_license" = "MIT" @@ -8417,7 +8694,7 @@ ":supports_weights" = "`false`" ":supports_class_weights" = "`false`" ":supports_online" = "`false`" -":docstring" = "```\nNeuralNetworkRegressor\n```\n\nA model type for constructing a neural network regressor, based on [MLJFlux.jl](https://github.com/alan-turing-institute/MLJFlux.jl), and implementing the MLJ model interface.\n\nFrom MLJ, the type can be imported using\n\n```\nNeuralNetworkRegressor = @load NeuralNetworkRegressor pkg=MLJFlux\n```\n\nDo `model = NeuralNetworkRegressor()` to construct an instance with default hyper-parameters. Provide keyword arguments to override hyper-parameter defaults, as in `NeuralNetworkRegressor(builder=...)`.\n\n`NeuralNetworkRegressor` is for training a data-dependent Flux.jl neural network to predict a `Continuous` target, given a table of `Continuous` features. 
Users provide a recipe for constructing the network, based on properties of the data that is encountered, by specifying an appropriate `builder`. See MLJFlux documentation for more on builders.\n\n# Training data\n\nIn MLJ or MLJBase, bind an instance `model` to data with\n\n```\nmach = machine(model, X, y)\n```\n\nHere:\n\n * `X` is either a `Matrix` or any table of input features (eg, a `DataFrame`) whose columns are of scitype `Continuous`; check column scitypes with `schema(X)`. If `X` is a `Matrix`, it is assumed to have columns corresponding to features and rows corresponding to observations.\n * `y` is the target, which can be any `AbstractVector` whose element scitype is `Continuous`; check the scitype with `scitype(y)`\n\nTrain the machine with `fit!(mach, rows=...)`.\n\n# Hyper-parameters\n\n * `builder=MLJFlux.Linear(σ=Flux.relu)`: An MLJFlux builder that constructs a neural network. Possible `builders` include: `MLJFlux.Linear`, `MLJFlux.Short`, and `MLJFlux.MLP`. See MLJFlux documentation for more on builders, and the example below for using the `@builder` convenience macro.\n * `optimiser::Flux.Adam()`: A `Flux.Optimise` optimiser. The optimiser performs the updating of the weights of the network. For further reference, see [the Flux optimiser documentation](https://fluxml.ai/Flux.jl/stable/training/optimisers/). To choose a learning rate (the update rate of the optimizer), a good rule of thumb is to start out at `10e-3`, and tune using powers of 10 between `1` and `1e-7`.\n * `loss=Flux.mse`: The loss function which the network will optimize. Should be a function which can be called in the form `loss(yhat, y)`. Possible loss functions are listed in [the Flux loss function documentation](https://fluxml.ai/Flux.jl/stable/models/losses/). For a regression task, natural loss functions are:\n\n * `Flux.mse`\n * `Flux.mae`\n * `Flux.msle`\n * `Flux.huber_loss`\n\n Currently MLJ measures are not supported as loss functions here.\n * `epochs::Int=10`: The duration of training, in epochs. Typically, one epoch represents one pass through the complete the training dataset.\n * `batch_size::int=1`: the batch size to be used for training, representing the number of samples per update of the network weights. Typically, batch size is between 8 and\n\n 512. Increasing batch size may accelerate training if `acceleration=CUDALibs()` and a\n\n GPU is available.\n * `lambda::Float64=0`: The strength of the weight regularization penalty. Can be any value in the range `[0, ∞)`.\n * `alpha::Float64=0`: The L2/L1 mix of regularization, in the range `[0, 1]`. A value of 0 represents L2 regularization, and a value of 1 represents L1 regularization.\n * `rng::Union{AbstractRNG, Int64}`: The random number generator or seed used during training.\n * `optimizer_changes_trigger_retraining::Bool=false`: Defines what happens when re-fitting a machine if the associated optimiser has changed. If `true`, the associated machine will retrain from scratch on `fit!` call, otherwise it will not.\n * `acceleration::AbstractResource=CPU1()`: Defines on what hardware training is done. 
For Training on GPU, use `CUDALibs()`.\n\n# Operations\n\n * `predict(mach, Xnew)`: return predictions of the target given new features `Xnew`, which should have the same scitype as `X` above.\n\n# Fitted parameters\n\nThe fields of `fitted_params(mach)` are:\n\n * `chain`: The trained \"chain\" (Flux.jl model), namely the series of layers, functions, and activations which make up the neural network.\n\n# Report\n\nThe fields of `report(mach)` are:\n\n * `training_losses`: A vector of training losses (penalized if `lambda != 0`) in historical order, of length `epochs + 1`. The first element is the pre-training loss.\n\n# Examples\n\nIn this example we build a regression model for the Boston house price dataset.\n\n```julia\nusing MLJ\nimport MLJFlux\nusing Flux\n```\n\nFirst, we load in the data: The `:MEDV` column becomes the target vector `y`, and all remaining columns go into a table `X`, with the exception of `:CHAS`:\n\n```julia\ndata = OpenML.load(531); # Loads from https://www.openml.org/d/531\ny, X = unpack(data, ==(:MEDV), !=(:CHAS); rng=123);\n\nscitype(y)\nschema(X)\n```\n\nSince MLJFlux models do not handle ordered factors, we'll treat `:RAD` as `Continuous`:\n\n```julia\nX = coerce(X, :RAD=>Continuous)\n```\n\nSplitting off a test set:\n\n```julia\n(X, Xtest), (y, ytest) = partition((X, y), 0.7, multi=true);\n```\n\nNext, we can define a `builder`, making use of a convenience macro to do so. In the following `@builder` call, `n_in` is a proxy for the number input features (which will be known at `fit!` time) and `rng` is a proxy for a RNG (which will be passed from the `rng` field of `model` defined below). We also have the parameter `n_out` which is the number of output features. As we are doing single target regression, the value passed will always be `1`, but the builder we define will also work for [`MultitargetNeuralRegressor`](@ref).\n\n```julia\nbuilder = MLJFlux.@builder begin\n init=Flux.glorot_uniform(rng)\n Chain(\n Dense(n_in, 64, relu, init=init),\n Dense(64, 32, relu, init=init),\n Dense(32, n_out, init=init),\n )\nend\n```\n\nInstantiating a model:\n\n```julia\nNeuralNetworkRegressor = @load NeuralNetworkRegressor pkg=MLJFlux\nmodel = NeuralNetworkRegressor(\n builder=builder,\n rng=123,\n epochs=20\n)\n```\n\nWe arrange for standardization of the the target by wrapping our model in `TransformedTargetModel`, and standardization of the features by inserting the wrapped model in a pipeline:\n\n```julia\npipe = Standardizer |> TransformedTargetModel(model, target=Standardizer)\n```\n\nIf we fit with a high verbosity (>1), we will see the losses during training. 
We can also see the losses in the output of `report(mach)`.\n\n```julia\nmach = machine(pipe, X, y)\nfit!(mach, verbosity=2)\n\n# first element initial loss, 2:end per epoch training losses\nreport(mach).transformed_target_model_deterministic.model.training_losses\n```\n\n## Experimenting with learning rate\n\nWe can visually compare how the learning rate affects the predictions:\n\n```julia\nusing Plots\n\nrates = rates = [5e-5, 1e-4, 0.005, 0.001, 0.05]\nplt=plot()\n\nforeach(rates) do η\n pipe.transformed_target_model_deterministic.model.optimiser.eta = η\n fit!(mach, force=true, verbosity=0)\n losses =\n report(mach).transformed_target_model_deterministic.model.training_losses[3:end]\n plot!(1:length(losses), losses, label=η)\nend\n\nplt\n\npipe.transformed_target_model_deterministic.model.optimiser.eta = 0.0001\n```\n\nWith the learning rate fixed, we compute a CV estimate of the performance (using all data bound to `mach`) and compare this with performance on the test set:\n\n```julia\n# CV estimate, based on `(X, y)`:\nevaluate!(mach, resampling=CV(nfolds=5), measure=l2)\n\n# loss for `(Xtest, test)`:\nfit!(mach) # train on `(X, y)`\nyhat = predict(mach, Xtest)\nl2(yhat, ytest) |> mean\n```\n\nThese losses, for the pipeline model, refer to the target on the original, unstandardized, scale.\n\nFor implementing stopping criterion and other iteration controls, refer to examples linked from the MLJFlux documentation.\n\nSee also [`MultitargetNeuralNetworkRegressor`](@ref)\n" +":docstring" = "```\nNeuralNetworkRegressor\n```\n\nA model type for constructing a neural network regressor, based on [MLJFlux.jl](https://github.com/alan-turing-institute/MLJFlux.jl), and implementing the MLJ model interface.\n\nFrom MLJ, the type can be imported using\n\n```\nNeuralNetworkRegressor = @load NeuralNetworkRegressor pkg=MLJFlux\n```\n\nDo `model = NeuralNetworkRegressor()` to construct an instance with default hyper-parameters. Provide keyword arguments to override hyper-parameter defaults, as in `NeuralNetworkRegressor(builder=...)`.\n\n`NeuralNetworkRegressor` is for training a data-dependent Flux.jl neural network to predict a `Continuous` target, given a table of `Continuous` features. Users provide a recipe for constructing the network, based on properties of the data that is encountered, by specifying an appropriate `builder`. See MLJFlux documentation for more on builders.\n\n# Training data\n\nIn MLJ or MLJBase, bind an instance `model` to data with\n\n```\nmach = machine(model, X, y)\n```\n\nHere:\n\n * `X` is either a `Matrix` or any table of input features (eg, a `DataFrame`) whose columns are of scitype `Continuous`; check column scitypes with `schema(X)`. If `X` is a `Matrix`, it is assumed to have columns corresponding to features and rows corresponding to observations.\n * `y` is the target, which can be any `AbstractVector` whose element scitype is `Continuous`; check the scitype with `scitype(y)`\n\nTrain the machine with `fit!(mach, rows=...)`.\n\n# Hyper-parameters\n\n * `builder=MLJFlux.Linear(σ=Flux.relu)`: An MLJFlux builder that constructs a neural network. Possible `builders` include: `MLJFlux.Linear`, `MLJFlux.Short`, and `MLJFlux.MLP`. See MLJFlux documentation for more on builders, and the example below for using the `@builder` convenience macro.\n * `optimiser::Optimisers.Adam()`: An Optimisers.jl optimiser. The optimiser performs the updating of the weights of the network. 
To choose a learning rate (the update rate of the optimizer), a good rule of thumb is to start out at `10e-3`, and tune using powers of `10` between `1` and `1e-7`.\n * `loss=Flux.mse`: The loss function which the network will optimize. Should be a function which can be called in the form `loss(yhat, y)`. Possible loss functions are listed in [the Flux loss function documentation](https://fluxml.ai/Flux.jl/stable/models/losses/). For a regression task, natural loss functions are:\n\n * `Flux.mse`\n * `Flux.mae`\n * `Flux.msle`\n * `Flux.huber_loss`\n\n Currently MLJ measures are not supported as loss functions here.\n * `epochs::Int=10`: The duration of training, in epochs. Typically, one epoch represents one pass through the complete training dataset.\n * `batch_size::Int=1`: The batch size to be used for training, representing the number of samples per update of the network weights. Typically, batch size is between `8` and `512`. Increasing batch size may accelerate training if `acceleration=CUDALibs()` and a GPU is available.\n * `lambda::Float64=0`: The strength of the weight regularization penalty. Can be any value in the range `[0, ∞)`. Note the history reports unpenalized losses.\n * `alpha::Float64=0`: The L2/L1 mix of regularization, in the range `[0, 1]`. A value of 0 represents L2 regularization, and a value of 1 represents L1 regularization.\n * `rng::Union{AbstractRNG, Int64}`: The random number generator or seed used during training. The default is `Random.default_rng()`.\n * `optimiser_changes_trigger_retraining::Bool=false`: Defines what happens when re-fitting a machine if the associated optimiser has changed. If `true`, the associated machine will retrain from scratch on `fit!` call, otherwise it will not.\n * `acceleration::AbstractResource=CPU1()`: Defines on what hardware training is done. For training on a GPU, use `CUDALibs()`.\n\n# Operations\n\n * `predict(mach, Xnew)`: Return predictions of the target given new features `Xnew`, which should have the same scitype as `X` above.\n\n# Fitted parameters\n\nThe fields of `fitted_params(mach)` are:\n\n * `chain`: The trained \"chain\" (Flux.jl model), namely the series of layers, functions, and activations which make up the neural network.\n\n# Report\n\nThe fields of `report(mach)` are:\n\n * `training_losses`: A vector of training losses (penalized if `lambda != 0`) in historical order, of length `epochs + 1`. The first element is the pre-training loss.\n\n# Examples\n\nIn this example we build a regression model for the Boston house price dataset.\n\n```julia\nusing MLJ\nimport MLJFlux\nusing Flux\nimport Optimisers\n```\n\nFirst, we load in the data: The `:MEDV` column becomes the target vector `y`, and all remaining columns go into a table `X`, with the exception of `:CHAS`:\n\n```julia\ndata = OpenML.load(531); # Loads from https://www.openml.org/d/531\ny, X = unpack(data, ==(:MEDV), !=(:CHAS); rng=123);\n\nscitype(y)\nschema(X)\n```\n\nSince MLJFlux models do not handle ordered factors, we'll treat `:RAD` as `Continuous`:\n\n```julia\nX = coerce(X, :RAD=>Continuous)\n```\n\nSplitting off a test set:\n\n```julia\n(X, Xtest), (y, ytest) = partition((X, y), 0.7, multi=true);\n```\n\nNext, we can define a `builder`, making use of a convenience macro to do so. In the following `@builder` call, `n_in` is a proxy for the number of input features (which will be known at `fit!` time) and `rng` is a proxy for an RNG (which will be passed from the `rng` field of `model` defined below). 
We also have the parameter `n_out` which is the number of output features. As we are doing single target regression, the value passed will always be `1`, but the builder we define will also work for [`MultitargetNeuralNetworkRegressor`](@ref).\n\n```julia\nbuilder = MLJFlux.@builder begin\n init=Flux.glorot_uniform(rng)\n Chain(\n Dense(n_in, 64, relu, init=init),\n Dense(64, 32, relu, init=init),\n Dense(32, n_out, init=init),\n )\nend\n```\n\nInstantiating a model:\n\n```julia\nNeuralNetworkRegressor = @load NeuralNetworkRegressor pkg=MLJFlux\nmodel = NeuralNetworkRegressor(\n builder=builder,\n rng=123,\n epochs=20\n)\n```\n\nWe arrange for standardization of the target by wrapping our model in `TransformedTargetModel`, and standardization of the features by inserting the wrapped model in a pipeline:\n\n```julia\npipe = Standardizer |> TransformedTargetModel(model, target=Standardizer)\n```\n\nIf we fit with a high verbosity (>1), we will see the losses during training. We can also see the losses in the output of `report(mach)`.\n\n```julia\nmach = machine(pipe, X, y)\nfit!(mach, verbosity=2)\n\n# first element is the initial (pre-training) loss; the rest are per-epoch training losses\nreport(mach).transformed_target_model_deterministic.model.training_losses\n```\n\n## Experimenting with learning rate\n\nWe can visually compare how the learning rate affects the predictions:\n\n```julia\nusing Plots\n\nrates = [5e-5, 1e-4, 0.005, 0.001, 0.05]\nplt = plot()\n\nforeach(rates) do η\n pipe.transformed_target_model_deterministic.model.optimiser = Optimisers.Adam(η)\n fit!(mach, force=true, verbosity=0)\n losses =\n report(mach).transformed_target_model_deterministic.model.training_losses[3:end]\n plot!(1:length(losses), losses, label=η)\nend\n\nplt\n\npipe.transformed_target_model_deterministic.model.optimiser = Optimisers.Adam(0.0001)\n```\n\nWith the learning rate fixed, we compute a CV estimate of the performance (using all data bound to `mach`) and compare this with performance on the test set:\n\n```julia\n# CV estimate, based on `(X, y)`:\nevaluate!(mach, resampling=CV(nfolds=5), measure=l2)\n\n# loss for `(Xtest, ytest)`:\nfit!(mach) # train on `(X, y)`\nyhat = predict(mach, Xtest)\nl2(yhat, ytest)\n```\n\nThese losses, for the pipeline model, refer to the target on the original, unstandardized, scale.\n\nFor implementing stopping criteria and other iteration controls, refer to examples linked from the MLJFlux documentation.\n\nSee also [`MultitargetNeuralNetworkRegressor`](@ref).\n" ":name" = "NeuralNetworkRegressor" ":human_name" = "neural network regressor" ":is_supervised" = "`true`" @@ -8442,6 +8719,7 @@ ":predict_scitype" = "`ScientificTypesBase.Unknown`" ":transform_scitype" = "`ScientificTypesBase.Unknown`" ":inverse_transform_scitype" = "`ScientificTypesBase.Unknown`" +":target_in_fit" = "`true`" ":is_pure_julia" = "`false`" ":package_name" = "MLJEnsembles" ":package_license" = "unknown" diff --git a/src/registry/Models.toml b/src/registry/Models.toml index 1c6fd00..1c029f4 100644 --- a/src/registry/Models.toml +++ b/src/registry/Models.toml @@ -31,5 +31,5 @@ SelfOrganizingMaps = ["SelfOrganizingMap"] LIBSVM = ["SVC", "EpsilonSVR", "LinearSVC", "ProbabilisticSVC", "NuSVR", "NuSVC", "ProbabilisticNuSVC", "OneClassSVM"] TSVD = ["TSVDTransformer"] GLM = ["LinearBinaryClassifier", "LinearCountRegressor", "LinearRegressor"] -MLJFlux = ["MultitargetNeuralNetworkRegressor", "NeuralNetworkClassifier", "ImageClassifier", "NeuralNetworkRegressor"] +MLJFlux = ["MultitargetNeuralNetworkRegressor", 
"NeuralNetworkClassifier", "ImageClassifier", "NeuralNetworkBinaryClassifier", "NeuralNetworkRegressor"] MLJEnsembles = ["EnsembleModel"]