# Graphs to show different aspects of the data
1. values across a single day
2. average daily values across a year

In [None]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt

from utils.create_graph import draw_graph

# Load the pre-processed dataset that the cells below slice and plot.
# The path is relative, so it is resolved against the current working directory.
df: pd.DataFrame = pd.read_parquet(
    path="../data/processed/processed_data.parquet",
)

## Values across day of 17/12/2006

In [None]:
# Pick out the rows recorded on one calendar day.
specific_day = pd.Timestamp("2006-12-17")

# Compare calendar dates only, so every time of day on that date matches.
target_date = specific_day.date()
df_day = df.loc[df["Datetime"].dt.date == target_date]

# Shared x-axis (timestamps) for the single-day plots.
x_day = df_day["Datetime"]

### Global active power

In [None]:
# Plot global active power for the selected day with the shared project helper.
# The last two arguments are presumably the plot title and the y-axis label --
# confirm against utils.create_graph.draw_graph.
draw_graph(
    df_day,
    "Global_active_power",
    "Feature Values Across Day",
    "Kilowatts (kW)",
)

### Average Voltage

In [None]:
# Voltage over the selected day, drawn on an explicit Axes object.
fig, ax = plt.subplots(figsize=(20, 5))
ax.plot(x_day, df_day["Voltage"], color="orange", label="Voltage")
ax.set(
    xlabel="Time of Day",
    ylabel="Volts (v)",
    title="Feature Values Across Day",
)
ax.grid(True)
ax.legend()
plt.show()

### Household Global intensity (Amps)

In [None]:
# Global intensity (current) over the selected day.
fig, ax = plt.subplots(figsize=(20, 5))
ax.plot(x_day, df_day["Global_intensity"], label="Global_intensity Amps")
ax.set(
    xlabel="Time of Day",
    ylabel="Amps (A)",
    title="Feature Values Across Day",
)
ax.grid(True)
ax.legend()
plt.show()

### Sub meter readings (Watt hours)

In [None]:
# The three sub-meter readings over the selected day, overlaid on one figure.
plt.figure(figsize=(20, 5))

# Each line is labelled with its own column name, so one loop covers all three.
for meter_column in ("Sub_metering_1", "Sub_metering_2", "Sub_metering_3"):
    plt.plot(x_day, df_day[meter_column], label=meter_column)

plt.title("Feature Values Across Day")
plt.xlabel("Time of Day")
plt.ylabel("Watt Hours (Wh)")
plt.grid(True)

plt.legend()
plt.show()

## Average daily values across year of 2007

In [None]:
# Restrict the data to one calendar year, then average every column per day.
year = 2007

df_year: pd.DataFrame = df[df["Datetime"].dt.year == year]

# Group by calendar date: the result has one row per day, indexed by that date.
df_year_mean = df_year.groupby(df_year["Datetime"].dt.date).mean()

# Use the group keys (the dates in the index) as the x-axis. Reading
# df_year_mean["Datetime"] instead only works when .mean() keeps an averaged
# Datetime column, which depends on the pandas version's numeric_only default.
x_year = df_year_mean.index

In [None]:
# Daily mean of global active power across the selected year.
plt.figure(figsize=(20, 5))
plt.plot(x_year, df_year_mean["Global_active_power"], label="Global Power")

plt.xlabel("Day of Year")
# Global active power is labelled in kW on the single-day plot of the same
# column; use the same unit here instead of watt-hours.
plt.ylabel("Kilowatts (kW)")
# One point per day over a whole year, so title it like the yearly voltage plot.
plt.title("Average Feature Values Across Year")
plt.grid(True)

plt.legend()
plt.show()

### Average Voltage

In [None]:
# Daily mean voltage across the selected year, drawn on an explicit Axes object.
fig, ax = plt.subplots(figsize=(20, 5))
ax.plot(x_year, df_year_mean["Voltage"], color="orange", label="Voltage")
ax.set(
    xlabel="Day of Year",
    ylabel="Volts (v)",
    title="Average Feature Values Across Year",
)
ax.grid(True)
ax.legend()
plt.show()