In [1]:
# Importing all required modules
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import warnings
warnings.filterwarnings('ignore')

In [2]:
df = pd.read_csv('supershops.csv') # Load Dataset
selected_columns = (df.iloc[:,0:-1]).select_dtypes(include=['float64']) # Select all features except Target columns that contains float values

# Normalization

In [3]:
from sklearn.preprocessing import MinMaxScaler # import normalization scaler
normalized = MinMaxScaler() # create object for normalization scaler
normalized_columns = normalized.fit_transform(selected_columns) # converted all selected feature values to normalised scale
normalized_df = pd.concat((pd.DataFrame(normalized_columns, columns=df.columns[1:4]), df.Area, df.Profit), 1) # add converted values to dataframe
print(normalized_df) # print the converted dataframe

    Administration  Transport      Area     Area     Profit
0         0.692617   0.651744  1.000000    Dhaka  192261.83
1         0.983359   0.761972  0.940893      Ctg  191792.06
2         0.927985   0.379579  0.864664  Rangpur  191050.39
3         0.873136   0.512998  0.812235    Dhaka  182901.99
4         0.859438   0.305328  0.776136  Rangpur  166187.94
5         0.797566   0.369448  0.769126    Dhaka  156991.12
6         0.814128   0.730161  0.270710      Ctg  156122.51
7         0.788018   0.717457  0.686493  Rangpur  155752.60
8         0.729018   0.741733  0.660500    Dhaka  152211.77
9         0.745906   0.436929  0.646443      Ctg  149759.96
10        0.616351   0.451506  0.485733  Rangpur  146121.95
11        0.608845   0.308364  0.529362      Ctg  144259.40
12        0.567670   0.578836  0.529563  Rangpur  141585.52
13        0.556352   0.641066  0.535552      Ctg  134307.35
14        0.725394   0.801327  0.543708  Rangpur  132602.65
15        1.000000   0.543030  0.554864 

# Standardization

In [4]:
from sklearn.preprocessing import StandardScaler 
standardized = StandardScaler() 
standardized_columns = standardized.fit_transform(selected_columns)
standardized_df = pd.concat((pd.DataFrame(standardized_columns, columns=df.columns[1:4]), df.Area, df.Profit), 1)
print(standardized_df)

    Administration  Transport      Area     Area     Profit
0         0.897913   0.560753  2.165287    Dhaka  192261.83
1         1.955860   1.082807  1.929843      Ctg  191792.06
2         1.754364  -0.728257  1.626191  Rangpur  191050.39
3         1.554784  -0.096365  1.417348    Dhaka  182901.99
4         1.504937  -1.079919  1.273550  Rangpur  166187.94
5         1.279800  -0.776239  1.245627    Dhaka  156991.12
6         1.340066   0.932147 -0.739753      Ctg  156122.51
7         1.245057   0.871980  0.916470  Rangpur  155752.60
8         1.030369   0.986952  0.812928    Dhaka  152211.77
9         1.091819  -0.456640  0.756935      Ctg  149759.96
10        0.620398  -0.387599  0.116763  Rangpur  146121.95
11        0.593085  -1.065540  0.290555      Ctg  144259.40
12        0.443260   0.215449  0.291357  Rangpur  141585.52
13        0.402078   0.510179  0.315213      Ctg  134307.35
14        1.017181   1.269199  0.347702  Rangpur  132602.65
15        2.016411   0.045868  0.392142 

# Robust Scaler

In [5]:
from sklearn.preprocessing import RobustScaler
robust_scaled = RobustScaler()
robust_scaled_columns = robust_scaled.fit_transform(selected_columns)
robust_scaled_df = pd.concat((pd.DataFrame(robust_scaled_columns, columns=df.columns[1:4]), df.Area, df.Profit), 1)
print(robust_scaled_df)

    Administration  Transport      Area     Area     Profit
0         0.672530   0.345355  1.552016    Dhaka  192261.83
1         1.452113   0.697565  1.383714      Ctg  191792.06
2         1.303634  -0.524290  1.166654  Rangpur  191050.39
3         1.156567  -0.097977  1.017368    Dhaka  182901.99
4         1.119836  -0.761543  0.914576  Rangpur  166187.94
5         0.953936  -0.556662  0.894617    Dhaka  156991.12
6         0.998345   0.595921 -0.524591      Ctg  156122.51
7         0.928334   0.555328  0.659326  Rangpur  155752.60
8         0.770134   0.632895  0.585311    Dhaka  152211.77
9         0.815416  -0.341041  0.545285      Ctg  149759.96
10        0.468034  -0.294461  0.087672  Rangpur  146121.95
11        0.447908  -0.751841  0.211904      Ctg  144259.40
12        0.337504   0.112392  0.212476  Rangpur  141585.52
13        0.307158   0.311235  0.229530      Ctg  134307.35
14        0.760416   0.823317  0.252754  Rangpur  132602.65
15        1.496732  -0.002018  0.284521 

# Max Absolute Scaler

In [6]:
from sklearn.preprocessing import MaxAbsScaler
maxAbs_scaled = MaxAbsScaler()
maxAbs_scaled_columns = maxAbs_scaled.fit_transform(selected_columns)
maxAbs_scaled_df = pd.concat((pd.DataFrame(maxAbs_scaled_columns, columns=df.columns[1:4]), df.Area, df.Profit), 1)
print(maxAbs_scaled_df)

    Administration  Transport      Area     Area     Profit
0         0.692617   0.749527  1.000000    Dhaka  192261.83
1         0.983359   0.828805  0.940893      Ctg  191792.06
2         0.927985   0.553781  0.864664  Rangpur  191050.39
3         0.873136   0.649738  0.812235    Dhaka  182901.99
4         0.859438   0.500378  0.776136  Rangpur  166187.94
5         0.797566   0.546494  0.769126    Dhaka  156991.12
6         0.814128   0.805926  0.270710      Ctg  156122.51
7         0.788018   0.796789  0.686493  Rangpur  155752.60
8         0.729018   0.814249  0.660500    Dhaka  152211.77
9         0.745906   0.595028  0.646443      Ctg  149759.96
10        0.616351   0.605512  0.485733  Rangpur  146121.95
11        0.608845   0.502561  0.529362      Ctg  144259.40
12        0.567670   0.697090  0.529563  Rangpur  141585.52
13        0.556352   0.741847  0.535552      Ctg  134307.35
14        0.725394   0.857110  0.543708  Rangpur  132602.65
15        1.000000   0.671338  0.554864 