In [5]:
# Step 1: Import necessary libraries
import pandas as pd
import plotly.express as px
from IPython.display import display

# Step 2: Load and Inspect the Data
print("--- Loading and Inspecting Data ---")
file_path = 'delhi_aqi_2024_2025.csv'

# Only the read itself is guarded: it is the one call expected to raise
# FileNotFoundError. Every step that needs `df` lives in the `else` branch,
# so a missing file reports the error and stops cleanly instead of falling
# through to code that would fail on an undefined `df` (or, in an
# interactive session, possibly pick up a `df` left over from an earlier run).
try:
    df = pd.read_csv(file_path)
except FileNotFoundError:
    print(f"Error: The file '{file_path}' was not found.")
else:
    print("Data loaded successfully!")

    # Display the first 5 rows
    print("\nFirst 5 rows of the dataset:")
    display(df.head())

    # Get information about the columns (df.info() prints directly)
    print("\nDataset Information:")
    df.info()

    # Step 3: Data Preparation
    print("\n--- Preparing Data ---")
    # Convert the 'Date' column to a proper datetime format so the x-axis
    # is treated as a time axis rather than as plain strings
    df['Date'] = pd.to_datetime(df['Date'])
    print("'Date' column converted to datetime format.")

    # Step 4: Visualize the Data
    print("\n--- Creating Visualization ---")
    # Create an interactive line chart to see trends
    fig = px.line(
        df,
        x='Date',
        y='PM2.5',
        title='Daily PM2.5 Air Pollution Levels in Delhi (2024-2025)',
        labels={'Date': 'Date', 'PM2.5': 'PM2.5 Concentration (µg/m³)'}
    )

    # Show the interactive chart
    fig.show()

    # Reported only when every step above actually ran
    print("\n--- Analysis Complete ---")

--- Loading and Inspecting Data ---
Data loaded successfully!

First 5 rows of the dataset:


Unnamed: 0,Date,PM2.5
0,2024-09-10,85.2
1,2024-09-11,88.1
2,2024-09-12,90.5
3,2024-09-13,86.7
4,2024-09-14,83.4



Dataset Information:
<class 'pandas.core.frame.DataFrame'>
RangeIndex: 366 entries, 0 to 365
Data columns (total 2 columns):
 #   Column  Non-Null Count  Dtype  
---  ------  --------------  -----  
 0   Date    366 non-null    object 
 1   PM2.5   366 non-null    float64
dtypes: float64(1), object(1)
memory usage: 5.8+ KB

--- Preparing Data ---
'Date' column converted to datetime format.

--- Creating Visualization ---



--- Analysis Complete ---
