dump predict_or_transform_mutates in favour of is_static

ablaom · ablaom · commit 6da8531df1b0 · 2024-10-08T12:35:38.000+13:00
diff --git a/docs/src/fit_update.md b/docs/src/fit_update.md
@@ -26,6 +26,8 @@ Data slurping forms are similarly provided for updating methods.
 
 ## Typical workflows
 
+### Supervised models
+
 Supposing `Algorithm` is some supervised classifier type, with an iteration parameter `n`:
 
 ```julia
@@ -43,15 +45,32 @@ model = update(model; n=150)
 predict(model, Distribution(), X)
 ```
 
-### A static algorithm (no "learning")
+### Transformers
+
+A dimension-reducing transformer, `algorithm`, might be used in this way:
+
+```julia
+model = fit(algorithm, X)
+transform(model, X) # or `transform(model, Xnew)`
+```
+
+or, if implemented, using a single call:
+
+```julia
+transform(algorithm, X) # `fit` implied
+```
+
+### Static algorithms (no "learning")
+
+Suppose `algorithm` is some clustering algorithm that cannot be generalized to new data
+(e.g. DBSCAN):
 
 ```julia
-# Apply some clustering algorithm which cannot be generalized to new data:
 model = fit(algorithm) # no training data
-labels = predict(model, LabelAmbiguous(), X) # may mutate `model`
+labels = predict(model, X) # may mutate `model`
 
 # Or, in one line:
-labels = predict(algorithm, LabelAmbiguous(), X)
+labels = predict(algorithm, X)
 
 # But two-line version exposes byproducts of the clustering algorithm (e.g., outliers):
 LearnAPI.extras(model)
diff --git a/docs/src/traits.md b/docs/src/traits.md
@@ -13,24 +13,24 @@ training). They may also record more mundane information, such as a package lice
 In the examples column of the table below, `Continuous` is a name owned the package
 [ScientificTypesBase.jl](https://github.com/JuliaAI/ScientificTypesBase.jl/).
 
-| trait                                                        | return value                                                                                                             | fallback value                                        | example                                                    |
-|:-------------------------------------------------------------|:-------------------------------------------------------------------------------------------------------------------------|:------------------------------------------------------|:-----------------------------------------------------------|
-| [`LearnAPI.constructor`](@ref)`(algorithm)`                  | constructor for generating new or modified versions of `algorithm`                                                       | (no fallback)                                         | `RidgeRegressor`                                           |
-| [`LearnAPI.functions`](@ref)`(algorithm)`                    | functions you can apply to `algorithm` or associated model (traits excluded)                                             | `()`                                                  | `(:fit, :predict, :minimize, :(LearnAPI.algorithm), :obs)` |
-| [`LearnAPI.kinds_of_proxy`](@ref)`(algorithm)`               | instances `kind` of `KindOfProxy` for which an implementation of `LearnAPI.predict(algorithm, kind, ...)` is guaranteed. | `()`                                                  | `(Distribution(), Interval())`                             |
-| [`LearnAPI.tags`](@ref)`(algorithm)`                         | lists one or more suggestive algorithm tags from `LearnAPI.tags()`                                                       | `()`                                                  | (:regression, :probabilistic)                              |
-| [`LearnAPI.is_pure_julia`](@ref)`(algorithm)`                | `true` if implementation is 100% Julia code                                                                              | `false`                                               | `true`                                                     |
-| [`LearnAPI.pkg_name`](@ref)`(algorithm)`                     | name of package providing core code (may be different from package providing LearnAPI.jl implementation)                 | `"unknown"`                                           | `"DecisionTree"`                                           |
-| [`LearnAPI.pkg_license`](@ref)`(algorithm)`                  | name of license of package providing core code                                                                           | `"unknown"`                                           | `"MIT"`                                                    |
-| [`LearnAPI.doc_url`](@ref)`(algorithm)`                      | url providing documentation of the core code                                                                             | `"unknown"`                                           | `"https://en.wikipedia.org/wiki/Decision_tree_learning"`   |
-| [`LearnAPI.load_path`](@ref)`(algorithm)`                    | string locating name returned by `LearnAPI.constructor(algorithm)`, beginning with a package name                        | "unknown"`                                            | `FastTrees.LearnAPI.DecisionTreeClassifier`                |
-| [`LearnAPI.is_composite`](@ref)`(algorithm)`                 | `true` if one or more properties of `algorithm` may be an algorithm                                                      | `false`                                               | `true`                                                     |
-| [`LearnAPI.human_name`](@ref)`(algorithm)`                   | human name for the algorithm; should be a noun                                                                           | type name with spaces                                 | "elastic net regressor"                                    |
-| [`LearnAPI.iteration_parameter`](@ref)`(algorithm)`          | symbolic name of an iteration parameter                                                                                  | `nothing`                                             | :epochs                                                    |
-| [`LearnAPI.data_interface`](@ref)`(algorithm)`               | Interface implemented by objects returned by [`obs`](@ref)                                                               | `Base.HasLength()` (supports `MLUtils.getobs/numobs`) | `Base.SizeUnknown()` (supports `iterate`)                  |
-| [`LearnAPI.fit_observation_scitype`](@ref)`(algorithm)`      | upper bound on `scitype(observation)` for `observation` in `data` ensuring `fit(algorithm, data)` works                  | `Union{}`                                             | `Tuple{AbstractVector{Continuous}, Continuous}`            |
-| [`LearnAPI.target_observation_scitype`](@ref)`(algorithm)`   | upper bound on the scitype of each observation of the targget                                                            | `Any`                                                 | `Continuous`                                               |
-| [`LearnAPI.predict_or_transform_mutates`](@ref)`(algorithm)` | `true` if `predict` or `transform` mutates first argument                                                                | `false`                                               | `true`                                                     |
+| trait                                                      | return value                                                                                                             | fallback value                                        | example                                                    |
+|:-----------------------------------------------------------|:-------------------------------------------------------------------------------------------------------------------------|:------------------------------------------------------|:-----------------------------------------------------------|
+| [`LearnAPI.constructor`](@ref)`(algorithm)`                | constructor for generating new or modified versions of `algorithm`                                                       | (no fallback)                                         | `RidgeRegressor`                                           |
+| [`LearnAPI.functions`](@ref)`(algorithm)`                  | functions you can apply to `algorithm` or associated model (traits excluded)                                             | `()`                                                  | `(:fit, :predict, :minimize, :(LearnAPI.algorithm), :obs)` |
+| [`LearnAPI.kinds_of_proxy`](@ref)`(algorithm)`             | instances `kind` of `KindOfProxy` for which an implementation of `LearnAPI.predict(algorithm, kind, ...)` is guaranteed. | `()`                                                  | `(Distribution(), Interval())`                             |
+| [`LearnAPI.tags`](@ref)`(algorithm)`                       | lists one or more suggestive algorithm tags from `LearnAPI.tags()`                                                       | `()`                                                  | (:regression, :probabilistic)                              |
+| [`LearnAPI.is_pure_julia`](@ref)`(algorithm)`              | `true` if implementation is 100% Julia code                                                                              | `false`                                               | `true`                                                     |
+| [`LearnAPI.pkg_name`](@ref)`(algorithm)`                   | name of package providing core code (may be different from package providing LearnAPI.jl implementation)                 | `"unknown"`                                           | `"DecisionTree"`                                           |
+| [`LearnAPI.pkg_license`](@ref)`(algorithm)`                | name of license of package providing core code                                                                           | `"unknown"`                                           | `"MIT"`                                                    |
+| [`LearnAPI.doc_url`](@ref)`(algorithm)`                    | url providing documentation of the core code                                                                             | `"unknown"`                                           | `"https://en.wikipedia.org/wiki/Decision_tree_learning"`   |
+| [`LearnAPI.load_path`](@ref)`(algorithm)`                  | string locating name returned by `LearnAPI.constructor(algorithm)`, beginning with a package name                        | `"unknown"`                                           | `FastTrees.LearnAPI.DecisionTreeClassifier`                |
+| [`LearnAPI.is_composite`](@ref)`(algorithm)`               | `true` if one or more properties of `algorithm` may be an algorithm                                                      | `false`                                               | `true`                                                     |
+| [`LearnAPI.human_name`](@ref)`(algorithm)`                 | human name for the algorithm; should be a noun                                                                           | type name with spaces                                 | "elastic net regressor"                                    |
+| [`LearnAPI.iteration_parameter`](@ref)`(algorithm)`        | symbolic name of an iteration parameter                                                                                  | `nothing`                                             | :epochs                                                    |
+| [`LearnAPI.data_interface`](@ref)`(algorithm)`             | Interface implemented by objects returned by [`obs`](@ref)                                                               | `Base.HasLength()` (supports `MLUtils.getobs/numobs`) | `Base.SizeUnknown()` (supports `iterate`)                  |
+| [`LearnAPI.fit_observation_scitype`](@ref)`(algorithm)`    | upper bound on `scitype(observation)` for `observation` in `data` ensuring `fit(algorithm, data)` works                  | `Union{}`                                             | `Tuple{AbstractVector{Continuous}, Continuous}`            |
+| [`LearnAPI.target_observation_scitype`](@ref)`(algorithm)` | upper bound on the scitype of each observation of the target                                                             | `Any`                                                 | `Continuous`                                               |
+| [`LearnAPI.is_static`](@ref)`(algorithm)`                  | `true` if `fit` consumes no data                                                                                         | `false`                                               | `true`                                                     |
 
 ### Derived Traits
 
@@ -104,5 +104,5 @@ LearnAPI.data_interface
 LearnAPI.iteration_parameter
 LearnAPI.fit_observation_scitype
 LearnAPI.target_observation_scitype
-LearnAPI.predict_or_transform_mutates
+LearnAPI.is_static
 ```
diff --git a/src/clone.jl b/src/clone.jl
@@ -7,7 +7,7 @@ Return a shallow copy of `algorithm` with the specified hyperparameter replaceme
 clone(algorithm; epochs=100, learning_rate=0.01)
 ```
 
-It is guaranted that `LearnAPI.clone(algorithm) == algorithm`.
+It is guaranteed that `LearnAPI.clone(algorithm) == algorithm`.
 
 """
 function clone(algorithm; replacements...)
diff --git a/src/fit_update.jl b/src/fit_update.jl
@@ -10,8 +10,8 @@ returning an object, `model`, on which other methods, such as [`predict`](@ref)
 list of methods that can be applied to either `algorithm` or `model`.
 
 The second signature is provided by algorithms that do not generalize to new observations
-("static" algorithms). In that case, `transform(model, data)` or `predict(model, ...,
-data)` carries out the actual algorithm execution, writing any byproducts of that
+(called *static algorithms*). In that case, `transform(model, data)` or `predict(model,
+..., data)` carries out the actual algorithm execution, writing any byproducts of that
 operation to the mutable object `model` returned by `fit`.
 
 Whenever `fit` expects a tuple form of argument, `data = (X1, ..., Xn)`, then the
@@ -33,14 +33,16 @@ See also [`predict`](@ref), [`transform`](@ref), [`inverse_transform`](@ref),
 
 # New implementations
 
-Implementation is compulsory. The signature must include `verbosity`. A fallback for the
-first signature calls the second, ignoring `data`:
+Implementation is compulsory. The signature must include `verbosity`. Fallbacks provide
+the data slurping versions.  A fallback for the first signature calls the second, ignoring
+`data`:
 
 ```julia
 fit(algorithm, data; kwargs...) = fit(algorithm; kwargs...)
 ```
 
-Fallbacks also provide the data slurping versions.
+If only the `fit(algorithm)` signature is explicitly implemented, then the trait
+[`LearnAPI.is_static`](@ref) must be overloaded to return `true`.
 
 $(DOC_DATA_INTERFACE(:fit))
 
diff --git a/src/predict_transform.jl b/src/predict_transform.jl
@@ -11,11 +11,9 @@ const DOC_OPERATIONS_LIST_FUNCTION = join(map(op -> "`LearnAPI.$op`", OPERATIONS
 DOC_MUTATION(op) =
     """
 
-    If [`LearnAPI.predict_or_transform_mutates(algorithm)`](@ref) is overloaded to return
-    `true`, then `$op` may mutate it's first argument, but not in a way that alters the
-    result of a subsequent call to `predict`, `transform` or
-    `inverse_transform`. This is necessary for some non-generalizing algorithms but is
-    otherwise discouraged. See more at [`fit`](@ref).
+    If [`LearnAPI.is_static(algorithm)`](@ref) is `true`, then `$op` may mutate its first
+    argument, but not in a way that alters the result of a subsequent call to `predict`,
+    `transform` or `inverse_transform`. See more at [`fit`](@ref).
 
     """
 
@@ -86,7 +84,7 @@ If `predict` supports data in the form of a tuple `data = (X1, ..., Xn)`, then a
 signature is also provided, as in `predict(model, X1, ..., Xn)`.
 
 Note `predict ` does not mutate any argument, except in the special case
-`LearnAPI.predict_or_transform_mutates(algorithm) = true`.
+`LearnAPI.is_static(algorithm) == true`.
 
 # New implementations
 
@@ -150,7 +148,7 @@ W = transform(algorithm, X)
 ```
 
 Note `transform` does not mutate any argument, except in the special case
-`LearnAPI.predict_or_transform_mutates(algorithm) = true`.
+`LearnAPI.is_static(algorithm) == true`.
 
 See also [`fit`](@ref), [`predict`](@ref),
 [`inverse_transform`](@ref).
diff --git a/src/target_weights_features.jl b/src/target_weights_features.jl
@@ -70,4 +70,4 @@ return `nothing`.
 features(algorithm, data) = _first(data)
 _first(data) = data
 _first(data::Tuple) = first(data)
-# note the factoring above guards agains method ambiguities
+# note the factoring above guards against method ambiguities
diff --git a/src/traits.jl b/src/traits.jl
@@ -346,19 +346,30 @@ tables, and tuples of these. See the doc-string for details.
 data_interface(::Any) = LearnAPI.RandomAccess()
 
 """
-    LearnAPI.predict_or_transform_mutates(algorithm)
+    LearnAPI.is_static(algorithm)
 
-Returns `true` if [`predict`](@ref) or [`transform`](@ref) possibly mutate their first
-argument, `model`, when `LearnAPI.algorithm(model) == algorithm`. If `false`, no arguments
-are ever mutated.
+Returns `true` if [`fit`](@ref) is called with no data arguments, as in
+`fit(algorithm)`. That is, `algorithm` does not generalize to new data, and data is only
+provided at the `predict` or `transform` step.
+
+For example, some clustering algorithms are applied with this workflow, to label the
+observations in `X`:
+
+```julia
+model = fit(algorithm) # no training data
+labels = predict(model, X) # may mutate `model`!
+
+# extract some byproducts of the clustering algorithm (e.g., outliers):
+LearnAPI.extras(model)
+```
 
 # New implementations
 
 This trait, falling back to `false`, may only be overloaded when `fit` has no data
-arguments (`algorithm` does not generalize to new data). See more at [`fit`](@ref).
+arguments. See more at [`fit`](@ref).
 
 """
-predict_or_transform_mutates(::Any) = false
+is_static(::Any) = false
 
 """
     LearnAPI.iteration_parameter(algorithm)
diff --git a/test/integration/static_algorithms.jl b/test/integration/static_algorithms.jl
@@ -36,10 +36,12 @@ function LearnAPI.transform(algorithm::Selector, X)
     transform(model, X)
 end
 
+# note the necessity of overloading `is_static` (`fit` consumes no data):
 @trait(
     Selector,
     constructor = Selector,
     tags = ("feature engineering",),
+    is_static = true,
     functions = (
         :(LearnAPI.fit),
         :(LearnAPI.algorithm),
@@ -63,9 +65,7 @@ end
 # # FEATURE SELECTOR THAT REPORTS BYPRODUCTS OF SELECTION PROCESS
 
 # This a variation of `Selector` above that stores the names of rejected features in the
-# model object, for inspection by an accessor function called `rejected`. Since
-# `transform(model, X)` mutates `model` in this case, we must overload the
-# `predict_or_transform_mutates` trait.
+# output of `fit`, for inspection by an accessor function called `rejected`.
 
 struct Selector2
     names::Vector{Symbol}
@@ -101,10 +101,11 @@ function LearnAPI.transform(algorithm::Selector2, X)
     transform(model, X)
 end
 
+# note the necessity of overloading `is_static` (`fit` consumes no data):
 @trait(
     Selector2,
     constructor = Selector2,
-    predict_or_transform_mutates = true,
+    is_static = true,
     tags = ("feature engineering",),
     functions = (
         :(LearnAPI.fit),