# Household Energy Consumption – Week 2 Internship Project
AICTE Edunet Foundation Internship | Theme: Sustainable Energy & Efficiency

In [None]:
import pandas as pd
import matplotlib.pyplot as plt

# Load the raw semicolon-separated readings. low_memory=False makes pandas
# infer each column's dtype from the whole file instead of chunk by chunk,
# which avoids mixed-dtype warnings on columns holding non-numeric markers.
data = pd.read_csv(
    '../data/household_power_consumption.csv',
    sep=';',
    low_memory=False,
)

# Merge the Date and Time columns into a single timestamp column.
# dayfirst=True keeps ambiguous dates such as 02/01/2007 from being read
# month-first. Values that cannot be parsed become NaT (errors='coerce').
# NOTE(review): assumes dates are stored as dd/mm/yyyy - confirm against the CSV.
data['DateTime'] = pd.to_datetime(
    data['Date'] + ' ' + data['Time'],
    dayfirst=True,
    errors='coerce',
)

# Measurement columns that must be numeric for the aggregations below.
numeric_columns = [
    'Global_active_power',
    'Global_reactive_power',
    'Voltage',
    'Global_intensity',
    'Sub_metering_1',
    'Sub_metering_2',
    'Sub_metering_3',
]
# Entries that cannot be converted to a number become NaN (errors='coerce').
for col in numeric_columns:
    data[col] = pd.to_numeric(data[col], errors='coerce')

# DataFrame.info() prints its report itself and returns None, so wrapping it
# in print() would emit an extra "None" line.
data.info()
print(data.head())

In [None]:
# Show the number of missing values per column, then keep only the rows
# that have a value in every column.
missing_per_column = data.isna().sum()
print(missing_per_column)
data = data.dropna(axis=0, how='any')

In [None]:
# Global_active_power is a power reading, so adding up the raw samples does
# not give energy. Each sample is scaled by the fraction of an hour it covers
# so that the daily total is expressed in kWh, matching the axis label.
# NOTE(review): assumes one reading per minute, in kilowatts - confirm against
# the dataset description.
SAMPLES_PER_HOUR = 60
daily_power_sum = data.groupby(data['DateTime'].dt.date)['Global_active_power'].sum()
daily_energy = daily_power_sum / SAMPLES_PER_HOUR

# Line chart of the total energy used on each calendar day.
plt.figure(figsize=(12,5))
plt.plot(daily_energy.index, daily_energy.values, marker='o')
plt.title('Daily Household Energy Consumption')
plt.xlabel('Date')
plt.ylabel('Global Active Power (kWh)')
plt.xticks(rotation=45)  # slanted tick labels so the dates do not overlap
plt.grid(True)
plt.show()

In [None]:
# Histogram showing how the daily totals are distributed across 20 bins.
fig, ax = plt.subplots(figsize=(8, 5))
ax.hist(daily_energy.values, bins=20, edgecolor='black')
ax.set_title('Distribution of Daily Household Energy Consumption')
ax.set_xlabel('Global Active Power (kWh)')
ax.set_ylabel('Frequency')
plt.show()

In [None]:
# Average Global_active_power reading for each hour of the day (0-23),
# taken over every day in the data set.
hour_of_day = data['DateTime'].dt.hour
hourly_energy = data.groupby(hour_of_day)['Global_active_power'].mean()

# Line chart of the average reading against the hour of the day.
fig, ax = plt.subplots(figsize=(8, 5))
ax.plot(hourly_energy.index, hourly_energy.values, marker='o', color='green')
ax.set_title('Average Hourly Energy Consumption')
ax.set_xlabel('Hour of Day')
ax.set_ylabel('Global Active Power (kWh)')
ax.grid(True)
plt.show()

### 🔹 Observations
- Household energy consumption varies from day to day.
- Evening hours show peak usage.
- Consumption is lowest at night.
- Most daily consumption totals fall within a limited, predictable range, as the histogram shows.