In [1]:
import pandas as pd
import numpy as np

# Load the raw cars CSV, show a quick overview, strip stray whitespace and
# save a UTF-8 copy.


def read_csv_with_fallback(path, encodings=('utf-8', 'cp1252', 'latin1')):
    """Read a CSV file, trying each encoding in order until one decodes.

    The order matters: ``latin1`` maps every possible byte to a character, so
    it can never raise ``UnicodeDecodeError`` and must come last. Anything
    listed after it would never be tried. ``cp1252`` goes before it so that
    Windows-specific bytes (euro sign, curly quotes, dashes) are decoded as
    the intended characters instead of control codes.

    Parameters
    ----------
    path : str or path-like
        Location of the CSV file.
    encodings : iterable of str
        Candidate encodings, tried in the given order.

    Returns
    -------
    (pandas.DataFrame, str)
        The parsed frame and the name of the encoding that worked.

    Raises
    ------
    ValueError
        If none of the encodings can decode the file (or none were given).
    """
    candidates = list(encodings)
    last_error = None
    for encoding in candidates:
        try:
            return pd.read_csv(path, encoding=encoding), encoding
        except UnicodeDecodeError as exc:
            last_error = exc
    raise ValueError(
        f"Could not decode {path!r} with any of: {', '.join(candidates)}"
    ) from last_error


def strip_string_values(frame):
    """Return a copy of ``frame`` with whitespace stripped from string cells.

    Only real ``str`` values are touched. Numbers, ``None``/NaN and other
    objects living in an object-dtype column are passed through unchanged
    (a plain ``.str.strip()`` would silently replace them with NaN).
    Columns using pandas' dedicated string dtype are stripped as well.
    """
    def _strip_column(column):
        if isinstance(column.dtype, pd.StringDtype):
            return column.str.strip()
        if column.dtype == object:
            stripped = column.map(
                lambda value: value.strip() if isinstance(value, str) else value
            )
            # Keep the column's dtype stable regardless of what map() inferred.
            return stripped.astype(object)
        return column

    return frame.apply(_strip_column)


try:
    df, used_encoding = read_csv_with_fallback('The Ultimate Cars Dataset 2024.csv')
    print(f"\nSuccessfully read the file with {used_encoding} encoding")

    # Display the first few rows
    print("\nFirst few rows of the dataset:")
    print(df.head())

    # Display dataset info (info() prints by itself and returns None,
    # so it must not be wrapped in print()).
    print("\nDataset information:")
    df.info()

    # Check for missing values
    print("\nMissing values in each column:")
    print(df.isnull().sum())

    # Clean the data
    # Remove any leading/trailing whitespace from column names
    df.columns = df.columns.str.strip()

    # Remove any leading/trailing whitespace from string values
    df = strip_string_values(df)

    # Save the cleaned dataset
    df.to_csv('cleaned_cars_dataset.csv', index=False, encoding='utf-8')

    print("\nData cleaning completed. Cleaned dataset saved as 'cleaned_cars_dataset.csv'")

except (OSError, ValueError) as e:
    # OSError covers missing/unreadable/unwritable files; ValueError covers
    # decode failures and pandas parser errors. Anything else is a genuine
    # bug and is allowed to surface with its traceback.
    print(f"An error occurred: {str(e)}")


Successfully read the file with latin1 encoding

First few rows of the dataset:
  Company Names     Cars Names      Engines CC/Battery Capacity HorsePower  \
0       FERRARI  SF90 STRADALE           V8             3990 cc     963 hp   
1   ROLLS ROYCE        PHANTOM          V12             6749 cc     563 hp   
2          Ford            KA+  1.2L Petrol            1,200 cc   70-85 hp   
3      MERCEDES        GT 63 S           V8            3,982 cc     630 hp   
4          AUDI     AUDI R8 Gt          V10            5,204 cc     602 hp   

  Total Speed Performance(0 - 100 )KM/H      Cars Prices       Fuel Types  \
0    340 km/h                   2.5 sec      $1,100,000   plug in hyrbrid   
1    250 km/h                   5.3 sec        $460,000            Petrol   
2    165 km/h                  10.5 sec  $12,000-$15,000           Petrol   
3    250 km/h                   3.2 sec        $161,000            Petrol   
4    320 km/h                   3.6 sec        $253,290          