In [2]:
# Feature Scaling & Encoding

# Objective: Learn to scale numerical features and encode categorical features for better model performance.
# Instructions:
# For each example, perform the following steps:
#     1. Load the Dataset: Load the dataset into your environment.
#     2. Feature Scaling: Apply scaling methods (StandardScaler or MinMaxScaler) to specified numerical columns.
#     3. Feature Encoding: Apply encoding methods (One-Hot Encoding or Label Encoding) to specified categorical columns.
#     4. Verify Changes: Check the data to ensure proper scaling and encoding. 


# Task:
#   Dataset: car_features.csv (obtain it yourself; it must include the Mileage, Horsepower, and Fuel_Type columns)
    # Columns to scale: Mileage, Horsepower
    # Column to encode: Fuel_Type
    # Steps:
    #     1. Load car_features.csv .
    #     2. Scale Mileage and Horsepower using StandardScaler.
    #     3. Encode Fuel_Type using Label Encoding.
    #     4. Confirm scaling and encoding by checking these columns.





    






    


    






import pandas as pd
from sklearn.preprocessing import StandardScaler, LabelEncoder

# Feature scaling and label encoding walkthrough for car_features.csv.
#
# Standardizes the numeric columns with StandardScaler, label-encodes the
# categorical column into a new "<column>_Encoded" column, and prints the data
# before and after so the transformations can be checked by eye.

CSV_PATH = "car_features.csv"
NUMERIC_COLUMNS = ["Mileage", "Horsepower"]
CATEGORICAL_COLUMN = "Fuel_Type"

# Step 1: Sample data used only as a fallback when no dataset is on disk.
data = {
    "Mileage": [20, 30, 25, 35, 28, 40],
    "Horsepower": [150, 200, 180, 220, 160, 210],
    "Fuel_Type": ["Petrol", "Diesel", "Petrol", "Diesel", "CNG", "Petrol"],
}

# Load the dataset. The sample file is written only if the CSV is missing, so
# a real car_features.csv supplied for the task is never overwritten.
try:
    df = pd.read_csv(CSV_PATH)
except FileNotFoundError:
    pd.DataFrame(data).to_csv(CSV_PATH, index=False)
    # Re-read so the sample goes through the same CSV parsing as a real file.
    df = pd.read_csv(CSV_PATH)

# Fail early with a clear message if the loaded file lacks a required column.
missing_columns = [
    column
    for column in [*NUMERIC_COLUMNS, CATEGORICAL_COLUMN]
    if column not in df.columns
]
if missing_columns:
    raise KeyError(f"{CSV_PATH} is missing required column(s): {missing_columns}")

print("Original Data:")
print(df)

# Step 2: Scale Mileage and Horsepower using StandardScaler
# (each column is replaced in place by its standardized values).
scaler = StandardScaler()
df[NUMERIC_COLUMNS] = scaler.fit_transform(df[NUMERIC_COLUMNS])

# Step 3: Encode Fuel_Type using LabelEncoder.
# The original text column is kept next to the new integer column so the
# encoding can be checked row by row.
label_encoder = LabelEncoder()
df[f"{CATEGORICAL_COLUMN}_Encoded"] = label_encoder.fit_transform(df[CATEGORICAL_COLUMN])

# Step 4: Confirm scaling and encoding
print("\nTransformed Data:")
print(df)

print("\nFuel Type Mapping:")
# A label's code is its position in classes_, so enumerate gives the mapping
# directly; tolist() yields plain Python values, so the dict prints as
# {'CNG': 0, ...} rather than with NumPy scalar reprs on newer NumPy versions.
mapping = {label: code for code, label in enumerate(label_encoder.classes_.tolist())}
print(mapping)





    







    
    


Original Data:
   Mileage  Horsepower Fuel_Type
0       20         150    Petrol
1       30         200    Diesel
2       25         180    Petrol
3       35         220    Diesel
4       28         160       CNG
5       40         210    Petrol

Transformed Data:
    Mileage  Horsepower Fuel_Type  Fuel_Type_Encoded
0 -1.487669   -1.432078    Petrol                  2
1  0.051299    0.520756    Diesel                  1
2 -0.718185   -0.260378    Petrol                  2
3  0.820783    1.301889    Diesel                  1
4 -0.256495   -1.041511       CNG                  0
5  1.590266    0.911322    Petrol                  2

Fuel Type Mapping:
{'CNG': 0, 'Diesel': 1, 'Petrol': 2}
