In [None]:
# Feature Scaling & Encoding

# Objective: Learn to scale numerical features and encode categorical features for better model performance.
# Instructions:
# For each example, perform the following steps:
#     1. Load the Dataset: Load the dataset into your environment.
#     2. Feature Scaling: Apply scaling methods (StandardScaler or MinMaxScaler) to specified numerical columns.
#     3. Feature Encoding: Apply encoding methods (One-Hot Encoding or Label Encoding) to specified categorical columns.
#     4. Verify Changes: Check the data to ensure proper scaling and encoding. 


# Task:
#   Dataset: car_features.csv (obtain or create it yourself; it includes the columns Mileage, Horsepower, and Fuel_Type)
    # Columns to scale: Mileage, Horsepower
    # Column to encode: Fuel_Type
    # Steps:
    #     1. Load car_features.csv.
    #     2. Scale Mileage and Horsepower using StandardScaler.
    #     3. Encode Fuel_Type using Label Encoding.
    #     4. Confirm scaling and encoding by checking these columns.



    
    
    

In [2]:
import pandas as pd
import numpy as np
from sklearn.preprocessing import StandardScaler, LabelEncoder

# Step 1: Create a sample dataset and save to 'car_features.csv'
# A fixed seed makes the generated sample (and therefore every number printed
# below) identical on each Restart & Run All.
SEED = 42
rng = np.random.default_rng(SEED)

data = {
    # Generator.integers excludes the upper bound, matching np.random.randint.
    'Mileage': rng.integers(10, 30, size=10),
    'Horsepower': rng.integers(60, 200, size=10),
    'Fuel_Type': ['Petrol', 'Diesel', 'Petrol', 'Electric', 'Diesel',
                  'Petrol', 'Electric', 'Diesel', 'Petrol', 'Electric']
}

df = pd.DataFrame(data)
df.to_csv('car_features.csv', index=False)
print("✅ Created and saved 'car_features.csv':\n")
print(df)

# Step 2: Load the dataset
df = pd.read_csv('car_features.csv')

# Step 3: Apply StandardScaler to 'Mileage' and 'Horsepower'
# The scaled values go into new columns so the raw values stay available
# for side-by-side comparison.
numeric_cols = ['Mileage', 'Horsepower']
scaled_cols = ['Mileage_scaled', 'Horsepower_scaled']
scaler = StandardScaler()
df[scaled_cols] = scaler.fit_transform(df[numeric_cols])

# Step 4: Apply Label Encoding to 'Fuel_Type'
label_encoder = LabelEncoder()
df['Fuel_Type_Encoded'] = label_encoder.fit_transform(df['Fuel_Type'])

# Step 5: Confirm changes
# StandardScaler standardizes with the population standard deviation, so the
# check must use ddof=0 (pandas defaults to ddof=1).
scaled_mean = df[scaled_cols].mean()
scaled_std = df[scaled_cols].std(ddof=0)
assert np.allclose(scaled_mean, 0.0), "scaled columns should have mean 0"
assert np.allclose(scaled_std, 1.0), "scaled columns should have unit variance"

# LabelEncoder assigns each label its position in the sorted `classes_` array.
fuel_type_codes = {str(label): code
                   for code, label in enumerate(label_encoder.classes_)}
assert df['Fuel_Type_Encoded'].nunique() == df['Fuel_Type'].nunique(), \
    "each fuel type should map to exactly one integer code"

print("\n✅ Transformed Data:\n")
print(df)
print("\nScaled column means (expected ~0):")
print(scaled_mean)
print("\nScaled column standard deviations, ddof=0 (expected ~1):")
print(scaled_std)
print("\nFuel_Type label mapping:", fuel_type_codes)


✅ Created and saved 'car_features.csv':

   Mileage  Horsepower Fuel_Type
0       27         106    Petrol
1       21         187    Diesel
2       16         100    Petrol
3       20         111  Electric
4       27         104    Diesel
5       26          82    Petrol
6       26          83  Electric
7       28         102    Diesel
8       13         145    Petrol
9       21         112  Electric

✅ Transformed Data:

   Mileage  Horsepower Fuel_Type  Mileage_scaled  Horsepower_scaled  \
0       27         106    Petrol        0.921443          -0.242911   
1       21         187    Diesel       -0.307148           2.489835   
2       16         100    Petrol       -1.330973          -0.445336   
3       20         111  Electric       -0.511913          -0.074223   
4       27         104    Diesel        0.921443          -0.310386   
5       26          82    Petrol        0.716678          -1.052613   
6       26          83  Electric        0.716678          -1.018876   
7     