From dd5b1348e331451909b98302859bd383c1173320 Mon Sep 17 00:00:00 2001
From: Adrian Hayler
Date: Wed, 13 May 2026 17:14:23 +0200
Subject: [PATCH] Improve feature_selection wrapper: richer return type +
 per-round verbose + KV-cache caveat
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Rewrite `feature_selection` around a `FeatureSelectionResult` dataclass.
  The wrapper now returns the fitted SFS plus the support mask, selected
  indices/names, and the pre/post CV scores it already had to compute —
  this collapses the typical caller-side mask -> names dance into one
  attribute access. Backward-incompatible: callers using
  `sfs.get_support()` directly need to switch to `result.support_mask`
  (or `result.selector.get_support()`).

- Make `n_features_to_select` a required positional argument — there is no
  sensible default.

- Expose the SFS knobs we were swallowing: `cv`, `scoring`, `direction`,
  `n_jobs`, `tol`. All keyword-only after the `*`. `cv=5` is the
  pre-existing hardcoded value, just configurable now.

- Always compute baseline (all-features) and selected (subset) CV scores
  using the same `cv` / `scoring` as SFS, and surface them on the result.

- Add `verbose: bool = True`. When set:
  - print a config header (direction, cv, scoring, k)
  - print the baseline CV score before SFS runs
  - print per-round picks ("round i/k: picked feature 'x', cv = ...") via
    a `_VerboseSFS` subclass that overrides the private
    `_get_best_new_feature_score` method (sklearn doesn't expose a
    `verbose` parameter or callback hook on SFS itself — this is the
    cleanest workaround; documented in a class docstring with the
    private-API dependency caveat)
  - print the selected names + final CV score
  `verbose=False` keeps everything silent; the scores are still available
  on the returned `FeatureSelectionResult`.

- Add a docstring note: TabPFN is very robust to noisy features in its
  in-context-learning regime, so the accuracy gain from running SFS is
  often marginal — the value is more interpretability / parsimony /
  faster predict-time. Verified by a quick noise-trajectory benchmark
  (n_features 3 -> 13, CV score stays in 0.92–0.94 throughout). Mention
  SHAP as the alternative interpretability route since it can use the KV
  cache and is generally much faster.

- Re-export `FeatureSelectionResult` from
  `tabpfn_extensions.interpretability` so callers can type-annotate
  without reaching into the submodule.

- Update `examples/interpretability/feature_selection.py` to use the new
  return shape, and align params with the public TabPFN demo notebook
  (`n_estimators=1`, `n_features_to_select=4`).

Co-Authored-By: Claude Opus 4.7 (1M context)
---
 .../interpretability/feature_selection.py |  32 +-
 .../interpretability/__init__.py          |   3 +-
 .../interpretability/feature_selection.py | 322 ++++++++++++++----
 3 files changed, 282 insertions(+), 75 deletions(-)

diff --git a/examples/interpretability/feature_selection.py b/examples/interpretability/feature_selection.py
index cda52540..7577e876 100644
--- a/examples/interpretability/feature_selection.py
+++ b/examples/interpretability/feature_selection.py
@@ -12,22 +12,28 @@
 X, y = data.data, data.target
 feature_names = data.feature_names
 
-# Initialize model
-clf = TabPFNClassifier(n_estimators=3)
+# Initialize model. Single estimator keeps the runtime manageable — feature
+# selection runs many TabPFN fits per round.
+clf = TabPFNClassifier(n_estimators=1)
 
-# Feature selection
-sfs = interpretability.feature_selection.feature_selection(
+# Feature selection. With verbose=True (the default) the wrapper prints the
+# baseline CV score on all features, the per-round picks, and the selected
+# names + CV score on the subset. The same numbers are also available on
+# the returned FeatureSelectionResult for programmatic use.
+result = interpretability.feature_selection.feature_selection(
     estimator=clf,
     X=X,
     y=y,
-    n_features_to_select=5,  # How many features to select
-    feature_names=feature_names,
+    n_features_to_select=4,
+    feature_names=list(feature_names),
 )
 
-# Print selected features
-selected_features = [
-    feature_names[i] for i in range(len(feature_names)) if sfs.get_support()[i]
-]
-print("\nSelected features:")
-for feature in selected_features:
-    print(f"- {feature}")
+# `result.selected_names` is populated because we passed `feature_names`.
+# `result.selector.transform(X)` would project to just those columns;
+# `result.support_mask` / `result.selected_indices` are also available.
+print("\nProgrammatic summary:")
+print(f"Selected features: {result.selected_names}")
+print(
+    f"CV score before / after: "
+    f"{result.baseline_score_mean:.4f} -> {result.selected_score_mean:.4f}"
+)
diff --git a/src/tabpfn_extensions/interpretability/__init__.py b/src/tabpfn_extensions/interpretability/__init__.py
index 77aa1c39..89cf518b 100644
--- a/src/tabpfn_extensions/interpretability/__init__.py
+++ b/src/tabpfn_extensions/interpretability/__init__.py
@@ -1,7 +1,8 @@
 try:
     from . import feature_selection, pdp, shapiq
+    from .feature_selection import FeatureSelectionResult
 except ImportError:
     raise ImportError(
         "Please install tabpfn-extensions with the 'interpretability' extra: pip install 'tabpfn-extensions[interpretability]'",
     )
-__all__ = ["feature_selection", "shapiq", "pdp"]
+__all__ = ["feature_selection", "shapiq", "pdp", "FeatureSelectionResult"]
diff --git a/src/tabpfn_extensions/interpretability/feature_selection.py b/src/tabpfn_extensions/interpretability/feature_selection.py
index 5aff6cff..e6da24cc 100644
--- a/src/tabpfn_extensions/interpretability/feature_selection.py
+++ b/src/tabpfn_extensions/interpretability/feature_selection.py
@@ -2,109 +2,309 @@
 # Licensed under the Apache License, Version 2.0
 from __future__ import annotations
 
-from typing import TYPE_CHECKING
+from dataclasses import dataclass
+from typing import TYPE_CHECKING, Any
 
 from sklearn.feature_selection import SequentialFeatureSelector
 from sklearn.model_selection import cross_val_score
 
 if TYPE_CHECKING:
+    from collections.abc import Callable, Iterable
+
     import numpy as np
     from sklearn.base import BaseEstimator
+    from sklearn.model_selection import BaseCrossValidator
+
+
+class _VerboseSFS(SequentialFeatureSelector):
+    """Subclass of ``SequentialFeatureSelector`` that prints which feature it
+    picked at each round, along with the CV score.
+
+    The hook is the private ``_get_best_new_feature_score`` method. It's
+    stable in current sklearn (1.6 / 1.7 / 1.8 all share the signature),
+    but it is private API — if sklearn renames or restructures it, the
+    override is simply never called: selection keeps working, the
+    per-round output silently disappears, and verbosity falls back to
+    the pre/post CV-score prints in ``_feature_selection``.
+
+    We deliberately do not override ``__init__``. sklearn's parameter
+    introspection (``get_params`` / ``clone`` / ``_validate_params``)
+    rejects subclasses whose ``__init__`` uses ``*args`` / ``**kwargs``
+    or introduces parameters not in ``_parameter_constraints``. Instead
+    the caller sets ``_verbose_feature_names`` as a plain attribute on
+    the instance after construction; the per-round counter is initialized
+    lazily inside ``_get_best_new_feature_score``.
+    """
+
+    def _get_best_new_feature_score(  # type: ignore[override]
+        self,
+        estimator: BaseEstimator,
+        X: np.ndarray,
+        y: np.ndarray,
+        cv: Any,
+        current_mask: np.ndarray,
+        **params: Any,
+    ) -> tuple[int, float]:
+        idx, score = super()._get_best_new_feature_score(
+            estimator,
+            X,
+            y,
+            cv,
+            current_mask,
+            **params,
+        )
+        self._verbose_iter = getattr(self, "_verbose_iter", 0) + 1
+        names = getattr(self, "_verbose_feature_names", None)
+        label = names[idx] if names is not None else idx
+        # Direction matters for the message: forward "picks to add",
+        # backward "picks to remove" — same _get_best_new_feature_score
+        # method but the semantics differ. The round total differs too:
+        # forward runs k rounds, backward runs (n_features_in_ - k).
+        verb = "picked" if self.direction == "forward" else "dropped"
+        n_rounds = (
+            self.n_features_to_select_
+            if self.direction == "forward"
+            else self.n_features_in_ - self.n_features_to_select_
+        )
+        print(  # noqa: T201 — intentional verbose-mode output
+            f"  round {self._verbose_iter}/{n_rounds}: "
+            f"{verb} feature {label!r}, cv score = {score:.4f}",
+        )
+        return idx, score
+
+
+@dataclass
+class FeatureSelectionResult:
+    """Result of running ``feature_selection``.
+
+    Attributes:
+        selector: The underlying fitted ``SequentialFeatureSelector``.
+            Use it for ``.transform(X)`` to project to the selected
+            columns, or for any sklearn-style downstream work.
+        support_mask: Boolean array of shape ``(n_features,)`` — ``True``
+            for the columns SFS picked.
+        selected_indices: Integer indices of the selected columns, in
+            ascending order.
+        selected_names: Selected feature names, in the same order as
+            ``selected_indices``. ``None`` iff ``feature_names`` wasn't
+            passed.
+        baseline_score_mean: Mean cross-validated score of ``estimator``
+            on **all** features, using the same ``cv`` and ``scoring`` as
+            the selection step.
+        baseline_score_std: Standard deviation across CV folds for the
+            baseline score.
+        selected_score_mean: Mean cross-validated score of ``estimator``
+            on the **selected** subset of features.
+        selected_score_std: Standard deviation across CV folds for the
+            selected-subset score.
+    """
+
+    selector: SequentialFeatureSelector
+    support_mask: np.ndarray
+    selected_indices: list[int]
+    selected_names: list[str] | None
+    baseline_score_mean: float
+    baseline_score_std: float
+    selected_score_mean: float
+    selected_score_std: float
 
 
 def feature_selection(
     estimator: BaseEstimator,
     X: np.ndarray,
     y: np.ndarray,
-    n_features_to_select: int = 3,
+    n_features_to_select: int | float | str,
     feature_names: list[str] | None = None,
-    **kwargs,
-) -> SequentialFeatureSelector:
-    """Perform feature selection to find the most important features.
+    *,
+    cv: int | BaseCrossValidator | Iterable = 5,
+    scoring: str | Callable | None = None,
+    direction: str = "forward",
+    n_jobs: int | None = None,
+    tol: float | None = None,
+    verbose: bool = True,
+    **kwargs: Any,
+) -> FeatureSelectionResult:
+    """Sequential feature selection wrapper around scikit-learn's SFS.
 
-    Uses forward sequential feature selection to identify the most important
-    features for the given estimator and data.
+    Picks a subset of features that work well for ``estimator`` by
+    repeatedly fitting ``estimator`` on candidate subsets and keeping the
+    one that maximizes a cross-validated score. Forwards the relevant
+    ``SequentialFeatureSelector`` hyperparameters; always computes the
+    baseline (all-features) and selected (subset-only) CV scores so they
+    are available on the returned object regardless of ``verbose``.
+
+    Note that while we expose feature selection here, **TabPFN is very
+    robust to noisy / uninformative features** in its native
+    in-context-learning regime, so the *accuracy gain* from running this
+    selector is often marginal — on real datasets the all-features
+    baseline and the selected subset typically score within
+    cross-validation noise of each other. The value of running selection
+    on TabPFN is usually interpretability, parsimony, and faster
+    predict-time rather than raw accuracy. Other interpretability
+    methods, such as SHAP, are also supported and are generally much
+    faster because they can use the KV cache.
+
+    Sequential feature selection is expensive: forward selection with
+    ``n_features_to_select=k`` on ``d`` features uses on the order of
+    ``cv * sum_{i=0..k-1} (d - i)`` model fits, plus two more CV runs
+    (``2 * cv`` fits) for the baseline / selected scores. For example,
+    with ``d = 30``, ``k = 4`` and ``cv = 5`` that is
+    ``5 * (30 + 29 + 28 + 27) + 10 = 580`` fits. ``n_jobs`` parallelizes
+    candidate-feature evaluation within each round; pass ``-1`` for all
+    cores. Note that TabPFN v3's KV cache does *not* help here — every
+    candidate has a different ``X_train``, so the cache invalidates
+    between fits.
 
     Args:
-        estimator: The model to use for feature selection
-        X: Input features, shape (n_samples, n_features)
-        y: Target values, shape (n_samples,)
-        n_features_to_select: Number of features to select
-        feature_names: Names of the features (optional)
-        **kwargs: Additional parameters to pass to SequentialFeatureSelector
+        estimator: The model to use for feature selection.
+        X: Input features, shape ``(n_samples, n_features)``.
+        y: Target values, shape ``(n_samples,)``.
+        n_features_to_select: Number of features to keep. ``int`` for an
+            absolute count, ``float`` for a fraction of the total, or
+            ``"auto"`` to stop based on ``tol`` (with ``tol=None``,
+            sklearn falls back to selecting half of the features).
+        feature_names: Optional list of feature names. When provided, the
+            returned ``FeatureSelectionResult`` carries the selected
+            names under ``selected_names``.
+        cv: Cross-validation folds — int (k-fold), CV generator, or
+            iterable of splits. Default 5.
+        scoring: Metric to maximize. ``str`` (e.g. ``"roc_auc"``,
+            ``"neg_log_loss"``, ``"r2"``) or a callable. Default ``None``
+            uses sklearn's per-estimator default (``accuracy`` for
+            classifiers, ``r2`` for regressors).
+        direction: ``"forward"`` (start empty, add features) or
+            ``"backward"`` (start full, remove features). Backward is
+            much more expensive when few features are kept, but is
+            sometimes preferred when features are redundant.
+        n_jobs: Parallelism over candidate features in each round.
+            ``-1`` uses all cores. Default ``None`` is single-threaded.
+        tol: Stopping condition for auto selection — only used when
+            ``n_features_to_select="auto"``. Forward selection stops
+            when adding a feature improves the CV score by less than
+            ``tol``.
+        verbose: When ``True`` (default), print the pre- and
+            post-selection CV scores and the names of the selected
+            features. The scores are computed and returned regardless.
+        **kwargs: Forwarded to ``SequentialFeatureSelector`` for forward
+            compatibility with future sklearn options.
 
     Returns:
-        SequentialFeatureSelector: Fitted feature selector that can be used
-        to transform data to use only the selected features
+        FeatureSelectionResult: a dataclass with the fitted selector,
+        the boolean support mask, the selected indices and names, and
+        the baseline / selected CV scores.
""" if hasattr(estimator, "show_progress"): - show_progress_ = estimator.show_progress + prev_show_progress = estimator.show_progress estimator.show_progress = False try: return _feature_selection( estimator, X, y, - n_features_to_select, - feature_names, + n_features_to_select=n_features_to_select, + feature_names=feature_names, + cv=cv, + scoring=scoring, + direction=direction, + n_jobs=n_jobs, + tol=tol, + verbose=verbose, **kwargs, ) finally: - estimator.show_progress = show_progress_ - else: - return _feature_selection( - estimator, - X, - y, - n_features_to_select, - feature_names, - **kwargs, - ) + estimator.show_progress = prev_show_progress + return _feature_selection( + estimator, + X, + y, + n_features_to_select=n_features_to_select, + feature_names=feature_names, + cv=cv, + scoring=scoring, + direction=direction, + n_jobs=n_jobs, + tol=tol, + verbose=verbose, + **kwargs, + ) def _feature_selection( estimator: BaseEstimator, X: np.ndarray, y: np.ndarray, - n_features_to_select: int = 3, - feature_names: list[str] | None = None, - **kwargs, -) -> SequentialFeatureSelector: - """Internal implementation of feature selection. - - Args: - estimator: The model to use for feature selection - X: Input features - y: Target values - n_features_to_select: Number of features to select - feature_names: Names of the features - **kwargs: Additional parameters for SequentialFeatureSelector - - Returns: - SequentialFeatureSelector: Fitted feature selector - """ - # TODO: Try https://rasbt.github.io/mlxtend/api_subpackages/mlxtend.feature_selection/#sequentialfeatureselector - # TODO: Could use more feature in training, but only keep fewer in test - # TODO: the fit function is somehow still called; We need to to change the feature selection - # method so it sets feature to none in test; Could be done with a wrapper that sets the feature subsets in fit - # and predict - CV_FOLDS = 5 + *, + n_features_to_select: int | float | str, + feature_names: list[str] | None, + cv: int | BaseCrossValidator | Iterable, + scoring: str | Callable | None, + direction: str, + n_jobs: int | None, + tol: float | None, + verbose: bool, + **kwargs: Any, +) -> FeatureSelectionResult: + """Internal implementation; ``feature_selection`` is the public entry.""" + scoring_desc = f"scoring={scoring!r}" if scoring is not None else "scoring=default" + if verbose: + print( # noqa: T201 + f"Feature selection: direction={direction!r}, cv={cv}, " + f"{scoring_desc}, n_features_to_select={n_features_to_select!r}" + ) - cross_val_score(estimator, X, y, cv=CV_FOLDS) + # Baseline: how well does the model do with every feature available? + baseline_scores = cross_val_score( + estimator, + X, + y, + cv=cv, + scoring=scoring, + n_jobs=n_jobs, + ) + if verbose: + print( # noqa: T201 + f"Baseline CV score on all {X.shape[1]} features: " + f"{baseline_scores.mean():.4f} ± {baseline_scores.std():.4f}" + ) - # TODO: Feature selection is done without CV, i.e. final CV scores might be biased (too good) - sfs = SequentialFeatureSelector( + sfs_cls = _VerboseSFS if verbose else SequentialFeatureSelector + sfs = sfs_cls( estimator, n_features_to_select=n_features_to_select, - direction="forward", + tol=tol, + direction=direction, + scoring=scoring, + cv=cv, + n_jobs=n_jobs, + **kwargs, ) + if verbose: + # Plain attributes, not constructor args — sklearn's get_params + # introspects __init__ for parameter discovery and rejects extras. 
+        sfs._verbose_feature_names = feature_names  # type: ignore[attr-defined]
     sfs.fit(X, y)
 
-    sfs.get_support()
-    X_transformed = sfs.transform(X)
-    cross_val_score(estimator, X_transformed, y, cv=CV_FOLDS)
+    support_mask = sfs.get_support()
+    selected_indices = [i for i, keep in enumerate(support_mask) if keep]
+    selected_names = (
+        [feature_names[i] for i in selected_indices]
+        if feature_names is not None
+        else None
+    )
+
+    selected_scores = cross_val_score(
+        estimator,
+        sfs.transform(X),
+        y,
+        cv=cv,
+        scoring=scoring,
+        n_jobs=n_jobs,
+    )
 
-    if feature_names is not None:
-        pass
+    if verbose:
+        display = selected_names if selected_names is not None else selected_indices
+        print(  # noqa: T201
+            f"Selected {sfs.n_features_to_select_} feature(s): {display}"
+        )
+        print(  # noqa: T201
+            f"CV score on selected features: "
+            f"{selected_scores.mean():.4f} ± {selected_scores.std():.4f}"
+        )
 
-    return sfs
+    return FeatureSelectionResult(
+        selector=sfs,
+        support_mask=support_mask,
+        selected_indices=selected_indices,
+        selected_names=selected_names,
+        baseline_score_mean=float(baseline_scores.mean()),
+        baseline_score_std=float(baseline_scores.std()),
+        selected_score_mean=float(selected_scores.mean()),
+        selected_score_std=float(selected_scores.std()),
+    )
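
A minimal usage sketch of the new API for reviewers, assuming the
breast-cancer setup from the updated example. The dataset and variable names
here are illustrative; the wrapper signature and FeatureSelectionResult
attributes are the ones introduced above.

    from sklearn.datasets import load_breast_cancer
    from tabpfn import TabPFNClassifier
    from tabpfn_extensions.interpretability import feature_selection

    data = load_breast_cancer()

    # verbose=False keeps the run silent; both CV scores still land on the result.
    result = feature_selection.feature_selection(
        estimator=TabPFNClassifier(n_estimators=1),
        X=data.data,
        y=data.target,
        n_features_to_select=4,
        feature_names=list(data.feature_names),
        verbose=False,
    )

    X_selected = result.selector.transform(data.data)  # only the 4 picked columns
    print(result.selected_names)
    print(result.baseline_score_mean, result.selected_score_mean)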
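
The "plain attribute" workaround in _VerboseSFS can be checked against stock
sklearn. A short sketch of the constraint it routes around; the Bad subclass
is hypothetical, and the quoted error text is paraphrased from
BaseEstimator._get_param_names:

    from sklearn.base import clone
    from sklearn.feature_selection import SequentialFeatureSelector
    from sklearn.linear_model import LogisticRegression

    class Bad(SequentialFeatureSelector):
        # Extra constructor parameters smuggled in via *args/**kwargs break
        # sklearn's parameter introspection.
        def __init__(self, *args, verbose_names=None, **kwargs):
            super().__init__(*args, **kwargs)
            self.verbose_names = verbose_names

    try:
        Bad(LogisticRegression(), n_features_to_select=2).get_params()
    except RuntimeError as err:
        # "scikit-learn estimators should always specify their parameters
        # in the signature of their __init__ (no varargs)." (paraphrased)
        print(err)

    # A plain attribute is invisible to get_params and dropped by clone(),
    # which is why _VerboseSFS reads it back with getattr(..., None).
    sfs = SequentialFeatureSelector(LogisticRegression(), n_features_to_select=2)
    sfs._verbose_feature_names = ["a", "b", "c"]
    assert not hasattr(clone(sfs), "_verbose_feature_names")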