scikit-learn
diff --git a/‎dev/_downloads/07fcc19ba03226cd3d83d4e40ec44385/auto_examples_python.zip
2.21 KB b/‎dev/_downloads/07fcc19ba03226cd3d83d4e40ec44385/auto_examples_python.zip
2.21 KB
diff --git a/‎dev/_downloads/1054d40caffbd65c52b20dac784c7c5c/plot_elastic_net_precomputed_gram_matrix_with_weighted_samples.ipynb
Lines changed: 108 additions & 0 deletions b/‎dev/_downloads/1054d40caffbd65c52b20dac784c7c5c/plot_elastic_net_precomputed_gram_matrix_with_weighted_samples.ipynb
Lines changed: 108 additions & 0 deletions
diff --git a/‎dev/_downloads/6f1e7a639e0699d6164445b55e6c116d/auto_examples_jupyter.zip
3.92 KB b/‎dev/_downloads/6f1e7a639e0699d6164445b55e6c116d/auto_examples_jupyter.zip
3.92 KB
diff --git a/‎dev/_downloads/c50f4529d4a653ccd8d5117ec9300975/plot_elastic_net_precomputed_gram_matrix_with_weighted_samples.py
Lines changed: 53 additions & 0 deletions b/‎dev/_downloads/c50f4529d4a653ccd8d5117ec9300975/plot_elastic_net_precomputed_gram_matrix_with_weighted_samples.py
Lines changed: 53 additions & 0 deletions
diff --git a/‎dev/_downloads/scikit-learn-docs.pdf
5.36 KB b/‎dev/_downloads/scikit-learn-docs.pdf
5.36 KB
diff --git a/‎dev/_images/binder_badge_logo.png
0 Bytes b/‎dev/_images/binder_badge_logo.png
0 Bytes
diff --git a/‎dev/_images/iris.png
0 Bytes b/‎dev/_images/iris.png
0 Bytes
diff --git a/‎dev/_images/sphx_glr_plot_agglomerative_clustering_001.png
-337 Bytes b/‎dev/_images/sphx_glr_plot_agglomerative_clustering_001.png
-337 Bytes
diff --git a/‎dev/_images/sphx_glr_plot_agglomerative_clustering_0011.png
-337 Bytes b/‎dev/_images/sphx_glr_plot_agglomerative_clustering_0011.png
-337 Bytes
diff --git a/‎dev/_images/sphx_glr_plot_agglomerative_clustering_002.png
-311 Bytes b/‎dev/_images/sphx_glr_plot_agglomerative_clustering_002.png
-311 Bytes
@@ -0,0 +1,108 @@
+{
+  "cells": [
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "collapsed": false
+      },
+      "outputs": [],
+      "source": [
+        "%matplotlib inline"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "\n# Fitting an Elastic Net with a precomputed Gram Matrix and Weighted Samples\n\nThe following example shows how to precompute the gram matrix\nwhile using weighted samples with an ElasticNet.\n\nIf weighted samples are used, the design matrix must be centered and then\nrescaled by the square root of the weight vector before the gram matrix\nis computed.\n\n<div class=\"alert alert-info\"><h4>Note</h4><p>`sample_weight` vector is also rescaled to sum to `n_samples`, see the\n   documentation for the `sample_weight` parameter to\n   :func:`linear_model.ElasticNet.fit`.</p></div>\n"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "collapsed": false
+      },
+      "outputs": [],
+      "source": [
+        "print(__doc__)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Let's start by loading the dataset and creating some sample weights.\n\n"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "collapsed": false
+      },
+      "outputs": [],
+      "source": [
+        "import numpy as np\nfrom sklearn.datasets import make_regression\n\nrng = np.random.RandomState(0)\n\nn_samples = int(1e5)\nX, y = make_regression(n_samples=n_samples, noise=0.5, random_state=rng)\n\nsample_weight = rng.lognormal(size=n_samples)\n# normalize the sample weights\nnormalized_weights = sample_weight * (n_samples / (sample_weight.sum()))"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "To fit the elastic net using the `precompute` option together with the sample\nweights, we must first center the design matrix, and rescale it by the\nsquare root of the normalized weights prior to computing the gram matrix.\n\n"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "collapsed": false
+      },
+      "outputs": [],
+      "source": [
+        "X_offset = np.average(X, axis=0, weights=normalized_weights)\nX_centered = (X - np.average(X, axis=0, weights=normalized_weights))\nX_scaled = X_centered * np.sqrt(normalized_weights)[:, np.newaxis]\ngram = np.dot(X_scaled.T, X_scaled)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "We can now proceed with fitting. We must pass the centered design matrix to\n`fit`, otherwise the elastic net estimator will detect that it is uncentered\nand discard the gram matrix we passed. However, if we pass the scaled design\nmatrix, the preprocessing code will incorrectly rescale it a second time.\n\n"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "collapsed": false
+      },
+      "outputs": [],
+      "source": [
+        "from sklearn.linear_model import ElasticNet\n\nlm = ElasticNet(alpha=0.01, precompute=gram)\nlm.fit(X_centered, y, sample_weight=normalized_weights)"
+      ]
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "Python 3",
+      "language": "python",
+      "name": "python3"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.9.1"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 0
+}
@@ -0,0 +1,53 @@
+"""
+==========================================================================
+Fitting an Elastic Net with a precomputed Gram Matrix and Weighted Samples
+==========================================================================
+
+The following example shows how to precompute the gram matrix
+while using weighted samples with an ElasticNet.
+
+If weighted samples are used, the design matrix must be centered and then
+rescaled by the square root of the weight vector before the gram matrix
+is computed.
+
+.. note::
+   `sample_weight` vector is also rescaled to sum to `n_samples`, see the
+   documentation for the `sample_weight` parameter to
+   :func:`linear_model.ElasticNet.fit`.
+
+"""
+
+print(__doc__)
+
+# %%
+# Let's start by loading the dataset and creating some sample weights.
+import numpy as np
+from sklearn.datasets import make_regression
+
+rng = np.random.RandomState(0)
+
+n_samples = int(1e5)
+X, y = make_regression(n_samples=n_samples, noise=0.5, random_state=rng)
+
+sample_weight = rng.lognormal(size=n_samples)
+# normalize the sample weights
+normalized_weights = sample_weight * (n_samples / (sample_weight.sum()))
+
+# %%
+# To fit the elastic net using the `precompute` option together with the sample
+# weights, we must first center the design matrix,  and rescale it by the
+# normalized weights prior to computing the gram matrix.
+X_offset = np.average(X, axis=0, weights=normalized_weights)
+X_centered = (X - np.average(X, axis=0, weights=normalized_weights))
+X_scaled = X_centered * np.sqrt(normalized_weights)[:, np.newaxis]
+gram = np.dot(X_scaled.T, X_scaled)
+
+# %%
+# We can now proceed with fitting. We must pass the centered design matrix to
+# `fit`, otherwise the elastic net estimator will detect that it is uncentered
+# and discard the gram matrix we passed. However, if we pass the scaled design
+# matrix, the preprocessing code will incorrectly rescale it a second time.
+from sklearn.linear_model import ElasticNet
+
+lm = ElasticNet(alpha=0.01, precompute=gram)
+lm.fit(X_centered, y, sample_weight=normalized_weights)