scikit-learn
diff --git a/‎dev/_downloads/07fcc19ba03226cd3d83d4e40ec44385/auto_examples_python.zip
685 Bytes b/‎dev/_downloads/07fcc19ba03226cd3d83d4e40ec44385/auto_examples_python.zip
685 Bytes
diff --git a/‎dev/_downloads/1b3f17ff0f112d5b77cbdb90f1c17046/plot_set_output.py
Lines changed: 23 additions & 1 deletion b/‎dev/_downloads/1b3f17ff0f112d5b77cbdb90f1c17046/plot_set_output.py
Lines changed: 23 additions & 1 deletion
diff --git a/‎dev/_downloads/6f1e7a639e0699d6164445b55e6c116d/auto_examples_jupyter.zip
1.4 KB b/‎dev/_downloads/6f1e7a639e0699d6164445b55e6c116d/auto_examples_jupyter.zip
1.4 KB
diff --git a/‎dev/_downloads/e23929e86fa0a415fb85ef2834a3ff7d/plot_set_output.ipynb
Lines changed: 48 additions & 1 deletion b/‎dev/_downloads/e23929e86fa0a415fb85ef2834a3ff7d/plot_set_output.ipynb
Lines changed: 48 additions & 1 deletion
diff --git a/‎dev/_downloads/scikit-learn-docs.zip
-3.96 KB b/‎dev/_downloads/scikit-learn-docs.zip
-3.96 KB
diff --git a/‎dev/_images/sphx_glr_plot_agglomerative_clustering_001.png
187 Bytes b/‎dev/_images/sphx_glr_plot_agglomerative_clustering_001.png
187 Bytes
diff --git a/‎dev/_images/sphx_glr_plot_agglomerative_clustering_002.png
-1 Bytes b/‎dev/_images/sphx_glr_plot_agglomerative_clustering_002.png
-1 Bytes
diff --git a/‎dev/_images/sphx_glr_plot_agglomerative_clustering_003.png
202 Bytes b/‎dev/_images/sphx_glr_plot_agglomerative_clustering_003.png
202 Bytes
diff --git a/‎dev/_images/sphx_glr_plot_agglomerative_clustering_004.png
148 Bytes b/‎dev/_images/sphx_glr_plot_agglomerative_clustering_004.png
148 Bytes
diff --git a/‎dev/_images/sphx_glr_plot_agglomerative_clustering_thumb.png
80 Bytes b/‎dev/_images/sphx_glr_plot_agglomerative_clustering_thumb.png
80 Bytes
@@ -84,9 +84,10 @@
 set_config(transform_output="pandas")
 
 num_pipe = make_pipeline(SimpleImputer(), StandardScaler())
+num_cols = ["age", "fare"]
 ct = ColumnTransformer(
     (
-        ("numerical", num_pipe, ["age", "fare"]),
+        ("numerical", num_pipe, num_cols),
         (
             "categorical",
             OneHotEncoder(
@@ -114,3 +115,24 @@
 # This resets `transform_output` to its default value to avoid impacting other
 # examples when generating the scikit-learn documentation
 set_config(transform_output="default")
+
+# %%
+# When configuring the output type with :func:`config_context`, the
+# configuration in effect when `transform` or `fit_transform` is
+# called is what counts. Setting it only when you construct or fit
+# the transformer has no effect.
+from sklearn import config_context
+
+scaler = StandardScaler()
+scaler.fit(X_train[num_cols])
+
+# %%
+with config_context(transform_output="pandas"):
+    # the output of transform will be a Pandas DataFrame
+    X_test_scaled = scaler.transform(X_test[num_cols])
+X_test_scaled.head()
+
+# %%
+# Outside of the context manager, the output will be a NumPy array.
+X_test_scaled = scaler.transform(X_test[num_cols])
+X_test_scaled[:5]
@@ -141,7 +141,7 @@
       },
       "outputs": [],
       "source": [
-        "from sklearn.compose import ColumnTransformer\nfrom sklearn.preprocessing import OneHotEncoder, StandardScaler\nfrom sklearn.impute import SimpleImputer\nfrom sklearn import set_config\n\nset_config(transform_output=\"pandas\")\n\nnum_pipe = make_pipeline(SimpleImputer(), StandardScaler())\nct = ColumnTransformer(\n    (\n        (\"numerical\", num_pipe, [\"age\", \"fare\"]),\n        (\n            \"categorical\",\n            OneHotEncoder(\n                sparse_output=False, drop=\"if_binary\", handle_unknown=\"ignore\"\n            ),\n            [\"embarked\", \"sex\", \"pclass\"],\n        ),\n    ),\n    verbose_feature_names_out=False,\n)\nclf = make_pipeline(ct, SelectPercentile(percentile=50), LogisticRegression())\nclf.fit(X_train, y_train)\nclf.score(X_test, y_test)"
+        "from sklearn.compose import ColumnTransformer\nfrom sklearn.preprocessing import OneHotEncoder, StandardScaler\nfrom sklearn.impute import SimpleImputer\nfrom sklearn import set_config\n\nset_config(transform_output=\"pandas\")\n\nnum_pipe = make_pipeline(SimpleImputer(), StandardScaler())\nnum_cols = [\"age\", \"fare\"]\nct = ColumnTransformer(\n    (\n        (\"numerical\", num_pipe, num_cols),\n        (\n            \"categorical\",\n            OneHotEncoder(\n                sparse_output=False, drop=\"if_binary\", handle_unknown=\"ignore\"\n            ),\n            [\"embarked\", \"sex\", \"pclass\"],\n        ),\n    ),\n    verbose_feature_names_out=False,\n)\nclf = make_pipeline(ct, SelectPercentile(percentile=50), LogisticRegression())\nclf.fit(X_train, y_train)\nclf.score(X_test, y_test)"
       ]
     },
     {
@@ -179,6 +179,53 @@
       "source": [
         "set_config(transform_output=\"default\")"
       ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "When configuring the output type with `config_context`, the\nconfiguration in effect when `transform` or `fit_transform` is\ncalled is what counts. Setting it only when you construct or fit\nthe transformer has no effect.\n\n"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "collapsed": false
+      },
+      "outputs": [],
+      "source": [
+        "from sklearn import config_context\n\nscaler = StandardScaler()\nscaler.fit(X_train[num_cols])"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "collapsed": false
+      },
+      "outputs": [],
+      "source": [
+        "with config_context(transform_output=\"pandas\"):\n    # the output of transform will be a Pandas DataFrame\n    X_test_scaled = scaler.transform(X_test[num_cols])\nX_test_scaled.head()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Outside of the context manager, the output will be a NumPy array.\n\n"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "collapsed": false
+      },
+      "outputs": [],
+      "source": [
+        "X_test_scaled = scaler.transform(X_test[num_cols])\nX_test_scaled[:5]"
+      ]
     }
   ],
   "metadata": {