# **Normalization**

**Min-max scaling**

In [2]:
import pandas as pd

from sklearn.preprocessing import MinMaxScaler
# Min-max scaling cell: load the Toyota listings, rescale the selected numeric
# columns with scikit-learn's MinMaxScaler, and write the result to
# "scaled_toyota.csv" in the current working directory.
DATA_PATH = "/content/drive/MyDrive/Datasets/toyota.csv"

data = pd.read_csv(DATA_PATH)
print("Original Data:")
print(data.head())

columns_to_scale = ["mileage", "price"]

# Validate up front and raise instead of calling exit(): an exception stops the
# cell with a clear message, reports every missing column at once, and does not
# ask the interpreter/kernel session to shut down.
missing_columns = [name for name in columns_to_scale if name not in data.columns]
if missing_columns:
    raise KeyError(f"Column(s) {missing_columns} not found in the dataset.")

# Fit on the selected columns and overwrite them in `data` with the scaled
# values; all other columns are left untouched.
scaler = MinMaxScaler()
data[columns_to_scale] = scaler.fit_transform(data[columns_to_scale])

print("Scaled Data:")
print(data.head())

data.to_csv("scaled_toyota.csv", index=False)
print("Scaled data saved to 'scaled_toyota.csv'")

Original Data:
   model  year  price transmission  mileage fuelType  tax   mpg  engineSize
0   GT86  2016  16000       Manual    24089   Petrol  265  36.2         2.0
1   GT86  2017  15995       Manual    18615   Petrol  145  36.2         2.0
2   GT86  2015  13998       Manual    27469   Petrol  265  36.2         2.0
3   GT86  2017  18998       Manual    14736   Petrol  150  36.2         2.0
4   GT86  2017  17498       Manual    36284   Petrol  145  36.2         2.0
Scaled Data:
   model  year     price transmission   mileage fuelType  tax   mpg  \
0   GT86  2016  0.256150       Manual  0.138100   Petrol  265  36.2   
1   GT86  2017  0.256066       Manual  0.106716   Petrol  145  36.2   
2   GT86  2015  0.222301       Manual  0.157479   Petrol  265  36.2   
3   GT86  2017  0.306839       Manual  0.084476   Petrol  150  36.2   
4   GT86  2017  0.281478       Manual  0.208019   Petrol  145  36.2   

   engineSize  
0         2.0  
1         2.0  
2         2.0  
3         2.0  
4        

**Z-score standardization**

In [3]:
import pandas as pd

from sklearn.preprocessing import StandardScaler

# Z-score cell: reload the Toyota listings, standardize the selected numeric
# columns with scikit-learn's StandardScaler, and write the result to
# "normalized_toyota.csv" in the current working directory.
DATA_PATH = "/content/drive/MyDrive/Datasets/toyota.csv"

data = pd.read_csv(DATA_PATH)
print("Original Data:")
print(data.head())

columns_to_normalize = ["mileage", "price"]

# Validate up front and raise instead of calling exit(): an exception stops the
# cell with a clear message, reports every missing column at once, and does not
# ask the interpreter/kernel session to shut down.
missing_columns = [name for name in columns_to_normalize if name not in data.columns]
if missing_columns:
    raise KeyError(f"Column(s) {missing_columns} not found in the dataset.")

# Fit on the selected columns and overwrite them in `data` with the
# standardized values; all other columns are left untouched.
scaler = StandardScaler()
data[columns_to_normalize] = scaler.fit_transform(data[columns_to_normalize])

print("Normalized Data:")
print(data.head())

data.to_csv("normalized_toyota.csv", index=False)
print("Normalized data saved to 'normalized_toyota.csv'")

Original Data:
   model  year  price transmission  mileage fuelType  tax   mpg  engineSize
0   GT86  2016  16000       Manual    24089   Petrol  265  36.2         2.0
1   GT86  2017  15995       Manual    18615   Petrol  145  36.2         2.0
2   GT86  2015  13998       Manual    27469   Petrol  265  36.2         2.0
3   GT86  2017  18998       Manual    14736   Petrol  150  36.2         2.0
4   GT86  2017  17498       Manual    36284   Petrol  145  36.2         2.0
Normalized Data:
   model  year     price transmission   mileage fuelType  tax   mpg  \
0   GT86  2016  0.548126       Manual  0.064400   Petrol  265  36.2   
1   GT86  2017  0.547338       Manual -0.221837   Petrol  145  36.2   
2   GT86  2015  0.232579       Manual  0.241141   Petrol  265  36.2   
3   GT86  2017  1.020657       Manual -0.424670   Petrol  150  36.2   
4   GT86  2017  0.784234       Manual  0.702079   Petrol  145  36.2   

   engineSize  
0         2.0  
1         2.0  
2         2.0  
3         2.0  
4    

**Decimal scaling**

In [4]:
import pandas as pd
# Decimal scaling cell: reload the Toyota listings and divide each selected
# column by a power of ten chosen from the digit count of its largest absolute
# value. The result is only printed, not written to disk.
DATA_PATH = "/content/drive/MyDrive/Datasets/toyota.csv"

data = pd.read_csv(DATA_PATH)
print("Original Data:")
print(data.head())

columns_to_normalize = ["mileage", "price"]

# Validate up front and raise instead of calling exit(): an exception stops the
# cell with a clear message, reports every missing column at once, and does not
# ask the interpreter/kernel session to shut down.
missing_columns = [name for name in columns_to_normalize if name not in data.columns]
if missing_columns:
    raise KeyError(f"Column(s) {missing_columns} not found in the dataset.")

for col in columns_to_normalize:
    max_abs_value = data[col].abs().max()

    # The exponent is the number of digits in the integer part of the largest
    # magnitude, e.g. a maximum of 36284 has 5 digits, so the column is divided
    # by 10**5 and every value ends up below 1 in absolute value.
    # NOTE: a maximum below 1 truncates to 0 (one digit), so the column is still
    # divided by 10; an empty or all-NaN column makes int() raise here.
    integer_digit_count = len(str(int(max_abs_value)))
    scaling_factor = 10 ** integer_digit_count

    data[col] = data[col] / scaling_factor

print("Decimal Scaled Data:")
print(data.head())

Original Data:
   model  year  price transmission  mileage fuelType  tax   mpg  engineSize
0   GT86  2016  16000       Manual    24089   Petrol  265  36.2         2.0
1   GT86  2017  15995       Manual    18615   Petrol  145  36.2         2.0
2   GT86  2015  13998       Manual    27469   Petrol  265  36.2         2.0
3   GT86  2017  18998       Manual    14736   Petrol  150  36.2         2.0
4   GT86  2017  17498       Manual    36284   Petrol  145  36.2         2.0
Decimal Scaled Data:
   model  year    price transmission   mileage fuelType  tax   mpg  engineSize
0   GT86  2016  0.16000       Manual  0.024089   Petrol  265  36.2         2.0
1   GT86  2017  0.15995       Manual  0.018615   Petrol  145  36.2         2.0
2   GT86  2015  0.13998       Manual  0.027469   Petrol  265  36.2         2.0
3   GT86  2017  0.18998       Manual  0.014736   Petrol  150  36.2         2.0
4   GT86  2017  0.17498       Manual  0.036284   Petrol  145  36.2         2.0
