In [None]:
# Feature Scaling & Encoding

# Objective: Learn to scale numerical features and encode categorical features for better model performance.
# Instructions:
# For each example, perform the following steps:
#     1. Load the Dataset: Load the dataset into your environment.
#     2. Feature Scaling: Apply scaling methods (StandardScaler or MinMaxScaler) to specified numerical columns.
#     3. Feature Encoding: Apply encoding methods (One-Hot Encoding or Label Encoding) to specified categorical columns.
#     4. Verify Changes: Check the data to ensure proper scaling and encoding. 


# Task:
#   Dataset: car_features.csv (obtain or create it yourself; it includes the Mileage, Horsepower, and Fuel_Type columns)
    # Columns to scale: Mileage, Horsepower
    # Column to encode: Fuel_Type
    # Steps:
    #     1. Load car_features.csv.
    #     2. Scale Mileage and Horsepower using StandardScaler.
    #     3. Encode Fuel_Type using Label Encoding.
    #     4. Confirm scaling and encoding by checking these columns.



    
    
    

In [1]:
import pandas as pd
from sklearn.preprocessing import StandardScaler, LabelEncoder

# 🔹 Step 1: Simulate a dataset
# A small in-memory frame stands in for car_features.csv; it carries the three
# columns the exercise works on (two numeric, one categorical).
data = {
    'Mileage': [15, 18, 22, 30, 25],
    'Horsepower': [100, 120, 150, 200, 180],
    'Fuel_Type': ['Petrol', 'Diesel', 'Petrol', 'Diesel', 'CNG']
}

df = pd.DataFrame(data)
print("Original DataFrame:\n", df)

# Columns to standardise, named once so scaling and verification stay in sync.
numeric_cols = ['Mileage', 'Horsepower']
# Snapshot of the raw category labels, taken before the column is overwritten,
# so the encoding can be verified by a round trip in Step 4.
fuel_labels = df['Fuel_Type'].tolist()

# 🔹 Step 2: Scale Mileage and Horsepower using StandardScaler
# Each column is transformed to (x - mean) / std, replacing the raw values.
scaler = StandardScaler()
df[numeric_cols] = scaler.fit_transform(df[numeric_cols])
print("\nAfter Scaling:\n", df[['Mileage', 'Horsepower']])

# 🔹 Step 3: Encode Fuel_Type using LabelEncoder
# NOTE: scikit-learn documents LabelEncoder as intended for target values; it is
# used on a feature here because the exercise asks for Label Encoding. The
# integer codes follow the sorted class order and carry no real ranking.
encoder = LabelEncoder()
df['Fuel_Type'] = encoder.fit_transform(df['Fuel_Type'])
print("\nAfter Encoding:\n", df['Fuel_Type'])

# 🔹 Step 4: Confirm the final DataFrame
# Printing alone does not confirm anything, so check the invariants explicitly.
scaled = df[numeric_cols]
assert (scaled.mean().abs() < 1e-9).all(), "scaled columns should have mean 0"
# StandardScaler divides by the population std, so compare with ddof=0
# (pandas' default ddof=1 would give a value slightly above 1).
assert ((scaled.std(ddof=0) - 1).abs() < 1e-9).all(), "scaled columns should have unit variance"
# Decoding the integer codes must give back exactly the original labels.
assert encoder.inverse_transform(df['Fuel_Type']).tolist() == fuel_labels, \
    "Fuel_Type codes do not map back to the original labels"

print("\nTransformed DataFrame:\n", df)


Original DataFrame:
    Mileage  Horsepower Fuel_Type
0       15         100    Petrol
1       18         120    Diesel
2       22         150    Petrol
3       30         200    Diesel
4       25         180       CNG

After Scaling:
     Mileage  Horsepower
0 -1.332427   -1.355815
1 -0.761387   -0.813489
2  0.000000    0.000000
3  1.522774    1.355815
4  0.571040    0.813489

After Encoding:
 0    2
1    1
2    2
3    1
4    0
Name: Fuel_Type, dtype: int64

Transformed DataFrame:
     Mileage  Horsepower  Fuel_Type
0 -1.332427   -1.355815          2
1 -0.761387   -0.813489          1
2  0.000000    0.000000          2
3  1.522774    1.355815          1
4  0.571040    0.813489          0
