In [None]:
# Feature Scaling & Encoding

# Objective: Learn to scale numerical features and encode categorical features for better model performance.
# Instructions:
# For each example, perform the following steps:
#     1. Load the Dataset: Load the dataset into your environment.
#     2. Feature Scaling: Apply scaling methods (StandardScaler or MinMaxScaler) to specified numerical columns.
#     3. Feature Encoding: Apply encoding methods (One-Hot Encoding or Label Encoding) to specified categorical columns.
#     4. Verify Changes: Check the data to ensure proper scaling and encoding. 


# Task:
#   Dataset: car_features.csv (obtain it yourself; it must include the columns Mileage, Horsepower and Fuel_Type)
    # Columns to scale: Mileage , Horsepower
    # Column to encode: Fuel_Type
    # Steps:
    #     1. Load car_features.csv .
    #     2. Scale Mileage and Horsepower using StandardScaler.
    #     3. Encode Fuel_Type using Label Encoding.
    #     4. Confirm scaling and encoding by checking these columns.


import pandas as pd
from sklearn.preprocessing import StandardScaler, LabelEncoder

# 1. Load car_features.csv
# Abort by raising SystemExit instead of calling exit(): exit() is a helper the
# `site` module installs for interactive use and is not guaranteed to halt
# execution in every environment (for example inside a notebook cell), which
# would let the code below run without `df` being defined.
try:
    df = pd.read_csv('car_features.csv')
except FileNotFoundError:
    raise SystemExit(
        "Error: car_features.csv not found. Please make sure the file is in the correct directory."
    ) from None

# Ensure the columns exist, and report exactly which ones are absent so the
# dataset can be fixed without guessing.
required_columns = ['Mileage', 'Horsepower', 'Fuel_Type']
missing_columns = [col for col in required_columns if col not in df.columns]
if missing_columns:
    raise SystemExit(
        "Error: One or more required columns ('Mileage', 'Horsepower', 'Fuel_Type') "
        f"not found in the dataset. Missing: {missing_columns}"
    )

# 2. Scale Mileage and Horsepower using StandardScaler
# The scaled values overwrite the original columns in place.
numeric_columns = ['Mileage', 'Horsepower']
scaler = StandardScaler()
df[numeric_columns] = scaler.fit_transform(df[numeric_columns])

# 3. Encode Fuel_Type using Label Encoding
# The encoded values go to a new column so the original labels stay available
# for the side-by-side comparison printed below.
label_encoder = LabelEncoder()
df['Fuel_Type_Encoded'] = label_encoder.fit_transform(df['Fuel_Type'])

# 4. Confirm scaling and encoding by checking these columns
print("Transformed Dataset Head:")
print(df.head())

# Expect mean ~0 for both columns. The std shown by describe() is the sample
# std (ddof=1) whereas StandardScaler normalises with the population std
# (ddof=0), so it will read slightly above 1 on small datasets.
print("\nSummary Statistics of Scaled Numerical Features (Mileage, Horsepower):")
print(df[numeric_columns].describe())

print("\nValue Counts of Original and Encoded Fuel_Type:")
print("Original Fuel_Type:")
print(df['Fuel_Type'].value_counts())
print("\nEncoded Fuel_Type:")
print(df['Fuel_Type_Encoded'].value_counts())
print("\nLabel Encoding Mapping for Fuel_Type:")
# LabelEncoder assigns each class its index in classes_, so the mapping can be
# read off directly without another transform() call.
print({label: code for code, label in enumerate(label_encoder.classes_)})

print("\nInformation about the Transformed Dataset:")
df.info()
    
    
    

Error: car_features.csv not found. Please make sure the file is in the correct directory.


NameError: name 'df' is not defined

: 