Skip to content

Commit 40d43fe

Browse files
committed
Pushing the docs for revision for branch: master, commit eb464fbc98efbab155ce24f4a9660464bd7d838d
1 parent 122a2ce commit 40d43fe

File tree

858 files changed

+2858
-2850
lines changed

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

858 files changed

+2858
-2850
lines changed

dev/_downloads/plot_prediction_latency.py

Lines changed: 17 additions & 19 deletions
Original file line number | Diff line number | Diff line change
@@ -24,12 +24,15 @@
2424
import numpy as np
2525
import matplotlib.pyplot as plt
2626

27+
from sklearn.preprocessing import StandardScaler
28+
from sklearn.model_selection import train_test_split
2729
from scipy.stats import scoreatpercentile
2830
from sklearn.datasets.samples_generator import make_regression
2931
from sklearn.ensemble.forest import RandomForestRegressor
3032
from sklearn.linear_model.ridge import Ridge
3133
from sklearn.linear_model.stochastic_gradient import SGDRegressor
3234
from sklearn.svm.classes import SVR
35+
from sklearn.utils import shuffle
3336

3437

3538
def _not_in_sphinx():
@@ -93,27 +96,22 @@ def generate_dataset(n_train, n_test, n_features, noise=0.1, verbose=False):
9396
"""Generate a regression dataset with the given parameters."""
9497
if verbose:
9598
print("generating dataset...")
99+
96100
X, y, coef = make_regression(n_samples=n_train + n_test,
97101
n_features=n_features, noise=noise, coef=True)
98-
X_train = X[:n_train]
99-
y_train = y[:n_train]
100-
X_test = X[n_train:]
101-
y_test = y[n_train:]
102-
idx = np.arange(n_train)
103-
np.random.seed(13)
104-
np.random.shuffle(idx)
105-
X_train = X_train[idx]
106-
y_train = y_train[idx]
107-
108-
std = X_train.std(axis=0)
109-
mean = X_train.mean(axis=0)
110-
X_train = (X_train - mean) / std
111-
X_test = (X_test - mean) / std
112-
113-
std = y_train.std(axis=0)
114-
mean = y_train.mean(axis=0)
115-
y_train = (y_train - mean) / std
116-
y_test = (y_test - mean) / std
102+
103+
random_seed = 13
104+
X_train, X_test, y_train, y_test = train_test_split(
105+
X, y, train_size=n_train, random_state=random_seed)
106+
X_train, y_train = shuffle(X_train, y_train, random_state=random_seed)
107+
108+
X_scaler = StandardScaler()
109+
X_train = X_scaler.fit_transform(X_train)
110+
X_test = X_scaler.transform(X_test)
111+
112+
y_scaler = StandardScaler()
113+
y_train = y_scaler.fit_transform(y_train[:, None])[:, 0]
114+
y_test = y_scaler.transform(y_test[:, None])[:, 0]
117115

118116
gc.collect()
119117
if verbose:
155 Bytes
155 Bytes
736 Bytes
736 Bytes
678 Bytes
678 Bytes
191 Bytes
191 Bytes
108 Bytes

0 commit comments

Comments
 (0)