# StandardScaler

In [1]:
import pandas as pd  # data processing
from sklearn.datasets import load_breast_cancer  # loading the dataset
from sklearn.model_selection import train_test_split  # splitting the dataset
from sklearn.preprocessing import StandardScaler  # scaling the dataset

In [3]:
df = pd.read_csv("../../Datasets/SocialNetworkAds.csv")
df.head()

Unnamed: 0,Gender,Age,EstimatedSalary,Purchased
0,1,19,19000,0
1,1,35,20000,0
2,2,26,43000,0
3,2,27,57000,0
4,1,19,76000,0


In [4]:
X = df.iloc[:, :-1].values
y = df.iloc[:, -1].values

In [5]:
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.1, random_state=0)

The `StandardScaler` class in scikit-learn has two main parameters:

- `with_mean`: This is a boolean parameter that specifies whether to center the data before scaling. The default value is `True`, which means that the data will be centered before scaling.

- `with_std`: This is a boolean parameter that specifies whether to scale the data to unit variance. The default value is `True`, which means that the data will be scaled to unit variance.

You can also specify the `copy` parameter, which is a boolean that specifies whether to make a copy of the data before scaling. The default value is `True`, which means that a copy will be made. 

Here is an example of how to create a `StandardScaler` object with the default parameters:



In [6]:
scaler = StandardScaler()
X_train = scaler.fit_transform(X_train)
X_test = scaler.transform(X_test)

In [7]:
X_train

array([[-1.02817453, -1.05714987,  0.53420426],
       [-1.02817453,  0.2798728 , -0.51764734],
       [ 0.97259753, -1.05714987,  0.41733186],
       ...,
       [-1.02817453, -0.19763529, -0.51764734],
       [ 0.97259753, -1.05714987, -0.45921114],
       [ 0.97259753, -1.15265148,  1.41074727]])

In [8]:
X_test

array([[-1.02817453, -0.77064501,  0.50498616],
       [ 0.97259753, -0.00663206, -0.57608354],
       [-1.02817453, -0.29313691,  0.15436896],
       [ 0.97259753, -0.77064501,  0.27124136],
       [ 0.97259753, -0.29313691, -0.57608354],
       [-1.02817453, -1.05714987, -1.45262654],
       [ 0.97259753, -0.67514339, -1.59871705],
       [-1.02817453, -0.19763529,  2.17041787],
       [ 0.97259753, -1.91666444, -0.05015774],
       [-1.02817453,  0.85288251, -0.78061024],
       [-1.02817453, -0.77064501, -0.60530164],
       [ 0.97259753, -0.96164825, -0.42999304],
       [-1.02817453, -0.10213368, -0.42999304],
       [-1.02817453,  0.08886956,  0.21280516],
       [-1.02817453, -1.7256612 ,  0.47576806],
       [ 0.97259753, -0.57964177,  1.38152917],
       [-1.02817453, -0.10213368,  0.21280516],
       [-1.02817453, -1.82116282,  0.44654996],
       [ 0.97259753,  1.61689547,  1.76136447],
       [-1.02817453, -0.29313691, -1.39419034],
       [ 0.97259753, -0.29313691, -0.663