## Datasets: Preprocessed

In [2]:
# Install dependencies as needed:
# pip install kagglehub[pandas-datasets]
import kagglehub
from kagglehub import KaggleDatasetAdapter

# Name of the CSV file inside the Kaggle dataset to load
file_path = "Electric_Vehicle_Population_Data.csv"

# Load the latest version of the dataset file through the pandas adapter.
# `kagglehub.load_dataset` is deprecated in favour of `kagglehub.dataset_load`,
# which accepts the same arguments, so the call below uses the current name.
df = kagglehub.dataset_load(
  KaggleDatasetAdapter.PANDAS,
  "mzohaibzeeshan/electric-vehicle-population-data-messy-data",
  file_path,
  # Provide any additional arguments like
  # sql_query or pandas_kwargs. See the
  # documentation for more information:
  # https://github.com/Kaggle/kagglehub/blob/main/README.md#kaggledatasetadapterpandas
)

df.head()  # preview the first rows of Electric_Vehicle_Population_Data

  from .autonotebook import tqdm as notebook_tqdm
  df = kagglehub.load_dataset(


Unnamed: 0,VIN (1-10),County,City,State,Postal Code,Model Year,Make,Model,Electric Vehicle Type,Clean Alternative Fuel Vehicle (CAFV) Eligibility,Electric Range,Base MSRP,Legislative District,DOL Vehicle ID,Vehicle Location,Electric Utility,2020 Census Tract
0,1C4JJXP66P,Kitsap,Poulsbo,WA,98370.0,2023,JEEP,WRANGLER,Plug-in Hybrid Electric Vehicle (PHEV),Not eligible due to low battery range,21.0,0.0,23.0,258127145,POINT (-122.64681 47.73689),PUGET SOUND ENERGY INC,53035090000.0
1,1G1FX6S08K,Snohomish,Lake Stevens,WA,98258.0,2019,CHEVROLET,BOLT EV,Battery Electric Vehicle (BEV),Clean Alternative Fuel Vehicle Eligible,238.0,0.0,44.0,4735426,POINT (-122.06402 48.01497),PUGET SOUND ENERGY INC,53061050000.0
2,WBY1Z2C58F,King,Seattle,WA,98116.0,2015,BMW,I3,Battery Electric Vehicle (BEV),Clean Alternative Fuel Vehicle Eligible,81.0,0.0,34.0,272697666,POINT (-122.41067 47.57894),CITY OF SEATTLE - (WA)|CITY OF TACOMA - (WA),53033010000.0
3,5YJ3E1EBXK,King,Seattle,WA,98178.0,2019,TESLA,MODEL 3,Battery Electric Vehicle (BEV),Clean Alternative Fuel Vehicle Eligible,220.0,0.0,37.0,477309682,POINT (-122.23825 47.49461),CITY OF SEATTLE - (WA)|CITY OF TACOMA - (WA),53033010000.0
4,5YJSA1V24F,Yakima,Selah,WA,98942.0,2015,TESLA,MODEL S,Battery Electric Vehicle (BEV),Clean Alternative Fuel Vehicle Eligible,208.0,0.0,15.0,258112970,POINT (-120.53145 46.65405),PACIFICORP,53077000000.0


### About Electric Vehicle Population Dataset
This dataset shows the Battery Electric Vehicles (BEVs) and Plug-in Hybrid Electric Vehicles (PHEVs) that are currently registered through the Washington State Department of Licensing (DOL).

- Number of rows: 223,995
- Number of columns: 17
- Contains missing values

### 📊 Column Descriptions:
- VIN (1-10): First 10 characters of the Vehicle Identification Number.
- County: The county where the vehicle is registered.
- City: The city where the vehicle is registered.
- State: The state where the vehicle is registered.
- Postal Code: The ZIP code of the vehicle's registration location.
- Model Year: The manufacturing year of the vehicle.
- Make: The brand/manufacturer of the vehicle (e.g., Tesla, Nissan).
- Model: The specific model of the vehicle.
- Electric Vehicle Type: The type of EV (Battery Electric Vehicle or Plug-in Hybrid).
- Clean Alternative Fuel Vehicle (CAFV) Eligibility: Indicates if the vehicle qualifies for CAFV benefits.
- Electric Range: The maximum range the vehicle can travel on a single charge.
- Base MSRP: The Manufacturer's Suggested Retail Price of the vehicle.
- Legislative District: The legislative district where the vehicle is registered.
- DOL Vehicle ID: A unique identifier assigned by the Department of Licensing.
- Vehicle Location: A general reference to the vehicle's location.
- Electric Utility: The electric utility company serving the vehicle's area.
- 2020 Census Tract: The census tract based on 2020 data for demographic analysis.

In [3]:
# Summary statistics for the numeric columns, transposed so each column is a row
df.describe().transpose()

Unnamed: 0,count,mean,std,min,25%,50%,75%,max
Postal Code,223992.0,98176.49,2544.241,1731.0,98052.0,98126.0,98374.0,99577.0
Model Year,223995.0,2021.264,2.989676,1999.0,2020.0,2022.0,2023.0,2025.0
Electric Range,223977.0,47.73619,84.98714,0.0,0.0,0.0,39.0,337.0
Base MSRP,223977.0,829.8944,7372.509,0.0,0.0,0.0,0.0,845000.0
Legislative District,223521.0,28.87636,14.91102,1.0,17.0,32.0,42.0,49.0
DOL Vehicle ID,223995.0,232932800.0,68843290.0,4385.0,200800200.0,248299200.0,267397300.0,479254800.0
2020 Census Tract,223992.0,52979970000.0,1531491000.0,1001020000.0,53033010000.0,53033030000.0,53053070000.0,56021000000.0


In [4]:
# Count the missing values in each column
df.isna().sum()

VIN (1-10)                                             0
County                                                 3
City                                                   3
State                                                  0
Postal Code                                            3
Model Year                                             0
Make                                                   0
Model                                                  0
Electric Vehicle Type                                  0
Clean Alternative Fuel Vehicle (CAFV) Eligibility      0
Electric Range                                        18
Base MSRP                                             18
Legislative District                                 474
DOL Vehicle ID                                         0
Vehicle Location                                      10
Electric Utility                                       3
2020 Census Tract                                      3
dtype: int64

In [9]:
# List the distinct values in the City column.
# Only the last expression of a cell is displayed, so the earlier
# `df['City'].value_counts()` call was computed and then discarded; it is
# removed here. Run it in its own cell if the per-city counts are needed.
df['City'].unique()

array(['Poulsbo', 'Lake Stevens', 'Seattle', 'Selah', 'Bremerton',
       'Lacey', 'Kent', 'Yakima', 'Lynnwood', 'Olalla', 'Suquamish',
       'Issaquah', 'Oak Harbor', 'Kenmore', 'Seabeck', 'Toppenish',
       'Sammamish', 'Port Orchard', 'Silverdale', 'Yelm', 'Olympia',
       'Bothell', 'Bainbridge Island', 'Edmonds', 'Tumwater', 'Redmond',
       'Stanwood', 'Kingston', 'Snohomish', 'Everett', 'Brier',
       'Marysville', 'Freeland', 'Chewelah', 'Auburn', 'Quincy',
       'Moses Lake', 'Colville', 'Burien', 'Langley', 'Woodinville',
       'Ellensburg', 'Zillah', 'Wapato', 'Duvall', 'Cheney', 'Pullman',
       'Bow', 'Rockford', 'Hunters', 'East Wenatchee', 'Spokane',
       'Monroe', 'Mount Vernon', 'College Place', 'Anacortes', 'Cle Elum',
       'Othello', 'Wenatchee', 'Renton', 'Greenbank', 'Palouse', 'Chelan',
       'Fall City', 'Clinton', 'Mountlake Terrace', 'Walla Walla',
       'Austin', 'Concrete', 'Manson', 'Orondo', 'Kirkland', 'Bellevue',
       'Camas', 'Federal Way

### About The Car Prices Dataset
This dataset contains 10,000 entries created for the purpose of predicting car prices. Each row represents information about a car and its price. The descriptions of the columns are as follows:

### 📊 Column Descriptions:
- Brand: Specifies the brand of the car (e.g., Toyota, BMW, Ford).
- Model: Specifies the model of the car (e.g., Corolla, Focus, X5).
- Year: The production year of the car. Newer years typically indicate higher prices.
- Engine_Size: Specifies the engine size in liters (L). Larger engines generally correlate with higher prices.
- Fuel_Type: Indicates the type of fuel used by the car.
- Transmission: The type of transmission in the car.
- Mileage: The total distance the car has traveled, measured in kilometers. Lower mileage generally indicates a higher price.
- Doors: The number of doors in the car. Commonly 2, 3, 4, or 5 doors.
- Owner_Count: The number of previous owners of the car. Fewer owners generally indicate a higher price.
- Price: The estimated selling price of the car. It is calculated based on several factors such as production year, engine size, mileage, fuel type, and transmission.

In [None]:
# Install dependencies as needed:
# pip install kagglehub[pandas-datasets]
import kagglehub
from kagglehub import KaggleDatasetAdapter

# Name of the CSV file inside the Kaggle dataset to load
file_path = "car_price_dataset.csv"

# Load the latest version of the dataset file through the pandas adapter.
# `kagglehub.load_dataset` is deprecated in favour of `kagglehub.dataset_load`,
# which accepts the same arguments, so the call below uses the current name.
df2 = kagglehub.dataset_load(
  KaggleDatasetAdapter.PANDAS,
  "asinow/car-price-dataset",
  file_path,
  # Provide any additional arguments like
  # sql_query or pandas_kwargs. See the
  # documentation for more information:
  # https://github.com/Kaggle/kagglehub/blob/main/README.md#kaggledatasetadapterpandas
)

df2.head()  # preview the first rows of the car price dataset

  df2 = kagglehub.load_dataset(


Unnamed: 0,Brand,Model,Year,Engine_Size,Fuel_Type,Transmission,Mileage,Doors,Owner_Count,Price
0,Kia,Rio,2020,4.2,Diesel,Manual,289944,3,5,8501
1,Chevrolet,Malibu,2012,2.0,Hybrid,Automatic,5356,2,3,12092
2,Mercedes,GLA,2020,4.2,Diesel,Automatic,231440,4,2,11171
3,Audi,Q5,2023,2.0,Electric,Manual,160971,2,1,11780
4,Volkswagen,Golf,2003,2.6,Hybrid,Semi-Automatic,286618,3,3,2867
