In [1]:
import numpy as np
import pandas as pd
from sklearn.datasets import load_iris, load_wine
from sklearn.preprocessing import MinMaxScaler, StandardScaler, RobustScaler, MaxAbsScaler

In [2]:
# Load both bundled scikit-learn toy datasets in one step; each result exposes
# the feature matrix as `.data` and the column labels as `.feature_names`.
iris, wine = load_iris(), load_wine()

In [3]:
# Wrap each raw feature matrix in a DataFrame labelled with the dataset's own
# feature names so later cells can refer to columns by name.
iris_df = pd.DataFrame(data=iris["data"], columns=iris["feature_names"])
wine_df = pd.DataFrame(data=wine["data"], columns=wine["feature_names"])

In [4]:
# Preview the first five unscaled iris rows.
iris_df.head(n=5)

Unnamed: 0,sepal length (cm),sepal width (cm),petal length (cm),petal width (cm)
0,5.1,3.5,1.4,0.2
1,4.9,3.0,1.4,0.2
2,4.7,3.2,1.3,0.2
3,4.6,3.1,1.5,0.2
4,5.0,3.6,1.4,0.2


In [5]:
# Preview the first five unscaled wine rows.
wine_df.head(n=5)

Unnamed: 0,alcohol,malic_acid,ash,alcalinity_of_ash,magnesium,total_phenols,flavanoids,nonflavanoid_phenols,proanthocyanins,color_intensity,hue,od280/od315_of_diluted_wines,proline
0,14.23,1.71,2.43,15.6,127.0,2.8,3.06,0.28,2.29,5.64,1.04,3.92,1065.0
1,13.2,1.78,2.14,11.2,100.0,2.65,2.76,0.26,1.28,4.38,1.05,3.4,1050.0
2,13.16,2.36,2.67,18.6,101.0,2.8,3.24,0.3,2.81,5.68,1.03,3.17,1185.0
3,14.37,1.95,2.5,16.8,113.0,3.85,3.49,0.24,2.18,7.8,0.86,3.45,1480.0
4,13.24,2.59,2.87,21.0,118.0,2.8,2.69,0.39,1.82,4.32,1.04,2.93,735.0


# MinMax Scaling

Rescales each feature independently to the [0, 1] range: `x' = (x - min) / (max - min)`.

In [6]:
# Min-max scaler with its default target range spelled out: every feature is
# mapped linearly onto [0, 1].
min_max_scaler = MinMaxScaler(feature_range=(0, 1))

In [7]:
# Learn per-feature min/max from iris and rescale it in one pass; the result is
# a bare NumPy array, so re-attach the original column labels afterwards.
iris_min_max_scaled = min_max_scaler.fit_transform(iris_df)
iris_min_max_scaled_df = pd.DataFrame(
    data=iris_min_max_scaled,
    columns=iris_df.columns,
)

In [8]:
# Use a dedicated scaler for wine. Refitting the shared `min_max_scaler` here
# would overwrite the per-feature min/max it learned from iris, leaving it
# inconsistent with `iris_min_max_scaled` (e.g. for a later `transform` or
# `inverse_transform` on iris data). The scaled values are unchanged.
wine_min_max_scaler = MinMaxScaler()
wine_min_max_scaled = wine_min_max_scaler.fit_transform(wine_df)
# fit_transform returns a plain array; restore the wine column labels.
wine_min_max_scaled_df = pd.DataFrame(wine_min_max_scaled, columns=wine.feature_names)

In [9]:
# Display the MinMax-scaled iris frame as this cell's output; pandas elides the
# middle rows of a long frame (the "..." row in the rendered table).
# NOTE(review): the other preview cells use .head(); consider doing the same here.
iris_min_max_scaled_df

Unnamed: 0,sepal length (cm),sepal width (cm),petal length (cm),petal width (cm)
0,0.222222,0.625000,0.067797,0.041667
1,0.166667,0.416667,0.067797,0.041667
2,0.111111,0.500000,0.050847,0.041667
3,0.083333,0.458333,0.084746,0.041667
4,0.194444,0.666667,0.067797,0.041667
...,...,...,...,...
145,0.666667,0.416667,0.711864,0.916667
146,0.555556,0.208333,0.677966,0.750000
147,0.611111,0.416667,0.711864,0.791667
148,0.527778,0.583333,0.745763,0.916667


In [10]:
# Display the MinMax-scaled wine frame as this cell's output; pandas elides the
# middle rows of a long frame (the "..." row in the rendered table).
# NOTE(review): the other preview cells use .head(); consider doing the same here.
wine_min_max_scaled_df

Unnamed: 0,alcohol,malic_acid,ash,alcalinity_of_ash,magnesium,total_phenols,flavanoids,nonflavanoid_phenols,proanthocyanins,color_intensity,hue,od280/od315_of_diluted_wines,proline
0,0.842105,0.191700,0.572193,0.257732,0.619565,0.627586,0.573840,0.283019,0.593060,0.372014,0.455285,0.970696,0.561341
1,0.571053,0.205534,0.417112,0.030928,0.326087,0.575862,0.510549,0.245283,0.274448,0.264505,0.463415,0.780220,0.550642
2,0.560526,0.320158,0.700535,0.412371,0.336957,0.627586,0.611814,0.320755,0.757098,0.375427,0.447154,0.695971,0.646933
3,0.878947,0.239130,0.609626,0.319588,0.467391,0.989655,0.664557,0.207547,0.558360,0.556314,0.308943,0.798535,0.857347
4,0.581579,0.365613,0.807487,0.536082,0.521739,0.627586,0.495781,0.490566,0.444795,0.259386,0.455285,0.608059,0.325963
...,...,...,...,...,...,...,...,...,...,...,...,...,...
173,0.705263,0.970356,0.582888,0.510309,0.271739,0.241379,0.056962,0.735849,0.205047,0.547782,0.130081,0.172161,0.329529
174,0.623684,0.626482,0.598930,0.639175,0.347826,0.282759,0.086498,0.566038,0.315457,0.513652,0.178862,0.106227,0.336662
175,0.589474,0.699605,0.481283,0.484536,0.543478,0.210345,0.073840,0.566038,0.296530,0.761092,0.089431,0.106227,0.397290
176,0.563158,0.365613,0.540107,0.484536,0.543478,0.231034,0.071730,0.754717,0.331230,0.684300,0.097561,0.128205,0.400856


# Standard Scaler

Standardizes each feature to zero mean and unit variance: `z = (x - mean) / std`.

In [11]:
# Standardizer with its defaults spelled out: subtract each feature's mean and
# divide by its standard deviation.
standard_scaler = StandardScaler(with_mean=True, with_std=True)

In [12]:
# Learn per-feature mean/std from iris and standardize it in one pass; the
# result is a bare NumPy array, so re-attach the original column labels.
iris_standard_scaled = standard_scaler.fit_transform(iris_df)
iris_standard_scaled_df = pd.DataFrame(
    data=iris_standard_scaled,
    columns=iris_df.columns,
)

In [13]:
# Use a dedicated scaler for wine. Refitting the shared `standard_scaler` here
# would overwrite the per-feature mean/std it learned from iris, leaving it
# inconsistent with `iris_standard_scaled` (e.g. for a later `transform` or
# `inverse_transform` on iris data). The scaled values are unchanged.
wine_standard_scaler = StandardScaler()
wine_standard_scaled = wine_standard_scaler.fit_transform(wine_df)
# fit_transform returns a plain array; restore the wine column labels.
wine_standard_scaled_df = pd.DataFrame(wine_standard_scaled, columns=wine.feature_names)

In [14]:
# Plain-text preview of the first five standardized iris rows.
print(
    "Standard Scaled Iris Dataset:\n",
    iris_standard_scaled_df.head(n=5),
)

Standard Scaled Iris Dataset:
    sepal length (cm)  sepal width (cm)  petal length (cm)  petal width (cm)
0          -0.900681          1.019004          -1.340227         -1.315444
1          -1.143017         -0.131979          -1.340227         -1.315444
2          -1.385353          0.328414          -1.397064         -1.315444
3          -1.506521          0.098217          -1.283389         -1.315444
4          -1.021849          1.249201          -1.340227         -1.315444


In [15]:
# Plain-text preview of the first five standardized wine rows (pandas wraps the
# wide frame across several column groups).
print(
    "\nStandard Scaled Wine Dataset:\n",
    wine_standard_scaled_df.head(n=5),
)


Standard Scaled Wine Dataset:
     alcohol  malic_acid       ash  alcalinity_of_ash  magnesium  \
0  1.518613   -0.562250  0.232053          -1.169593   1.913905   
1  0.246290   -0.499413 -0.827996          -2.490847   0.018145   
2  0.196879    0.021231  1.109334          -0.268738   0.088358   
3  1.691550   -0.346811  0.487926          -0.809251   0.930918   
4  0.295700    0.227694  1.840403           0.451946   1.281985   

   total_phenols  flavanoids  nonflavanoid_phenols  proanthocyanins  \
0       0.808997    1.034819             -0.659563         1.224884   
1       0.568648    0.733629             -0.820719        -0.544721   
2       0.808997    1.215533             -0.498407         2.135968   
3       2.491446    1.466525             -0.981875         1.032155   
4       0.808997    0.663351              0.226796         0.401404   

   color_intensity       hue  od280/od315_of_diluted_wines   proline  
0         0.251717  0.362177                      1.847920  1.01300

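# Robust Scaler

Centers each feature on its median and divides by its interquartile range (IQR), so outliers have less influence than with mean/variance scaling.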

In [17]:
# Robust scaler with its defaults spelled out: centre on the median and scale
# by the 25th-75th percentile range (IQR).
robust_scaler = RobustScaler(
    with_centering=True,
    with_scaling=True,
    quantile_range=(25.0, 75.0),
)

In [18]:
# Learn per-feature median/IQR from iris and rescale it in one pass; the result
# is a bare NumPy array, so re-attach the original column labels.
iris_robust_scaled = robust_scaler.fit_transform(iris_df)
iris_robust_scaled_df = pd.DataFrame(
    data=iris_robust_scaled,
    columns=iris_df.columns,
)

In [19]:
# Use a dedicated scaler for wine. Refitting the shared `robust_scaler` here
# would overwrite the per-feature median/IQR it learned from iris, leaving it
# inconsistent with `iris_robust_scaled` (e.g. for a later `transform` or
# `inverse_transform` on iris data). The scaled values are unchanged.
wine_robust_scaler = RobustScaler()
wine_robust_scaled = wine_robust_scaler.fit_transform(wine_df)
# fit_transform returns a plain array; restore the wine column labels.
wine_robust_scaled_df = pd.DataFrame(wine_robust_scaled, columns=wine.feature_names)

In [20]:
# Plain-text preview of the first five robust-scaled iris rows.
print(
    "Robust Scaled Iris Dataset:\n",
    iris_robust_scaled_df.head(n=5),
)

Robust Scaled Iris Dataset:
    sepal length (cm)  sepal width (cm)  petal length (cm)  petal width (cm)
0          -0.538462               1.0          -0.842857         -0.733333
1          -0.692308               0.0          -0.842857         -0.733333
2          -0.846154               0.4          -0.871429         -0.733333
3          -0.923077               0.2          -0.814286         -0.733333
4          -0.615385               1.2          -0.842857         -0.733333


In [21]:
# Plain-text preview of the first five robust-scaled wine rows (pandas wraps
# the wide frame across several column groups).
print(
    "\nRobust Scaled Wine Dataset:\n",
    wine_robust_scaled_df.head(n=5),
)


Robust Scaled Wine Dataset:
     alcohol  malic_acid       ash  alcalinity_of_ash  magnesium  \
0  0.897338   -0.104730  0.201439          -0.906977   1.526316   
1  0.114068   -0.057432 -0.633094          -1.930233   0.105263   
2  0.083650    0.334459  0.892086          -0.209302   0.157895   
3  1.003802    0.057432  0.402878          -0.627907   0.789474   
4  0.144487    0.489865  1.467626           0.348837   1.052632   

   total_phenols  flavanoids  nonflavanoid_phenols  proanthocyanins  \
0       0.420804    0.553892             -0.358209         1.050000   
1       0.278960    0.374251             -0.477612        -0.392857   
2       0.420804    0.661677             -0.238806         1.792857   
3       1.413712    0.811377             -0.597015         0.892857   
4       0.420804    0.332335              0.298507         0.378571   

   color_intensity       hue  od280/od315_of_diluted_wines   proline  
0         0.318792  0.222222                      0.924949  0.808050 

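# MaxAbs Scaler

Divides each feature by its maximum absolute value, mapping it into [-1, 1] without shifting (centering) the data.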

In [22]:
# Max-abs scaler with its only option spelled out: divide each feature by its
# largest absolute value, working on a copy of the input.
max_abs_scaler = MaxAbsScaler(copy=True)

In [23]:
# Learn each feature's maximum absolute value from iris and rescale it in one
# pass; the result is a bare NumPy array, so re-attach the column labels.
iris_max_abs_scaled = max_abs_scaler.fit_transform(iris_df)
iris_max_abs_scaled_df = pd.DataFrame(
    data=iris_max_abs_scaled,
    columns=iris_df.columns,
)

In [24]:
# Use a dedicated scaler for wine. Refitting the shared `max_abs_scaler` here
# would overwrite the per-feature maximum absolute values it learned from iris,
# leaving it inconsistent with `iris_max_abs_scaled` (e.g. for a later
# `transform` or `inverse_transform` on iris data). The scaled values are
# unchanged.
wine_max_abs_scaler = MaxAbsScaler()
wine_max_abs_scaled = wine_max_abs_scaler.fit_transform(wine_df)
# fit_transform returns a plain array; restore the wine column labels.
wine_max_abs_scaled_df = pd.DataFrame(wine_max_abs_scaled, columns=wine.feature_names)

In [25]:
# Plain-text preview of the first five max-abs-scaled iris rows.
print(
    "MaxAbs Scaled Iris Dataset:\n",
    iris_max_abs_scaled_df.head(n=5),
)

MaxAbs Scaled Iris Dataset:
    sepal length (cm)  sepal width (cm)  petal length (cm)  petal width (cm)
0           0.645570          0.795455           0.202899              0.08
1           0.620253          0.681818           0.202899              0.08
2           0.594937          0.727273           0.188406              0.08
3           0.582278          0.704545           0.217391              0.08
4           0.632911          0.818182           0.202899              0.08


In [26]:
# Plain-text preview of the first five max-abs-scaled wine rows (pandas wraps
# the wide frame across several column groups).
print(
    "\nMaxAbs Scaled Wine Dataset:\n",
    wine_max_abs_scaled_df.head(n=5),
)


MaxAbs Scaled Wine Dataset:
     alcohol  malic_acid       ash  alcalinity_of_ash  magnesium  \
0  0.959541    0.294828  0.752322           0.520000   0.783951   
1  0.890088    0.306897  0.662539           0.373333   0.617284   
2  0.887390    0.406897  0.826625           0.620000   0.623457   
3  0.968982    0.336207  0.773994           0.560000   0.697531   
4  0.892785    0.446552  0.888545           0.700000   0.728395   

   total_phenols  flavanoids  nonflavanoid_phenols  proanthocyanins  \
0       0.721649    0.602362              0.424242         0.639665   
1       0.682990    0.543307              0.393939         0.357542   
2       0.721649    0.637795              0.454545         0.784916   
3       0.992268    0.687008              0.363636         0.608939   
4       0.721649    0.529528              0.590909         0.508380   

   color_intensity       hue  od280/od315_of_diluted_wines   proline  
0         0.433846  0.608187                        0.9800  0.633929 