In [5]:
import pandas as pd
import matplotlib.pyplot as plt

In [6]:
# Load the data
# Read the CSV with `date_time` parsed as datetimes, then promote that column
# to the index so later cells can use datetime accessors on `df.index`.
df = pd.read_csv(
    'sample_ecb_operation_data.csv',
    parse_dates=['date_time'],
).set_index('date_time')

In [None]:
# 1. Basic data exploration
# Print the summary statistics first, then the per-column dtypes.
for overview in (df.describe(), df.dtypes):
    print(overview)

In [None]:
# 2. Analyze cooling operation
# A row counts as "cooling active" when its `compCool1` value is strictly
# positive; the flag is stored on the frame as a boolean column.
df['Cooling_active'] = df['compCool1'].gt(0)

# Share of flagged rows among all rows, expressed as a percentage.
active_rows, total_rows = df['Cooling_active'].sum(), len(df)
cooling_time = active_rows / total_rows * 100
print(f"\nPercentage of time cooling was active: {cooling_time:.2f}%")

In [None]:
# 3. Analyze fan operation
# Bucket the raw `fan` reading into three bands: [0, 100], (100, 200], (200, 300].
# include_lowest=True closes the first band on the left: with pd.cut's default
# (right-closed bins, lowest edge excluded) a reading of exactly 0 fell outside
# every bin, became NaN, and was silently left out of the distribution below.
# NOTE(review): readings of 0 are therefore counted as 'Low' - confirm that this
# is the intended category for them.
# Readings below 0 or above 300 still map to NaN and are excluded by value_counts().
df['Fan_speed'] = pd.cut(
    df['fan'],
    bins=[0, 100, 200, 300],
    labels=['Low', 'Medium', 'High'],
    include_lowest=True,
)

# Count rows per band (NaN excluded) and show each band's share as a pie chart.
fan_distribution = df['Fan_speed'].value_counts()
fan_distribution.plot(kind='pie', autopct='%1.1f%%', title='Fan Speed Distribution')
plt.show()

In [None]:
# 4. Correlations between variables
# Pairwise correlation (DataFrame.corr default method) of the four selected columns.
correlation_matrix = df[['Temperature_ctrl', 'Humidity', 'compCool1', 'fan']].corr()
labels = correlation_matrix.columns
n_vars = len(labels)

plt.figure(figsize=(10, 8))
# Pin the colour scale to the full correlation range [-1, 1]. Without
# vmin/vmax, imshow scales to the min/max present in the data, so the neutral
# midpoint of the diverging 'coolwarm' map would not correspond to zero
# correlation and colours would not be comparable between runs.
im = plt.imshow(correlation_matrix, cmap='coolwarm', vmin=-1, vmax=1)
plt.colorbar(im)
plt.xticks(range(n_vars), labels, rotation=45)
plt.yticks(range(n_vars), labels)
plt.title('Correlation Heatmap of HVAC Variables')

# Annotate every cell with its coefficient; imshow puts column j on the x axis
# and row i on the y axis, hence the (j, i) coordinate order.
for i in range(n_vars):
    for j in range(n_vars):
        plt.text(j, i, f"{correlation_matrix.iloc[i, j]:.2f}",
                 ha="center", va="center", color="black")
plt.tight_layout()
plt.show()

In [None]:
# 5. Analyze energy consumption patterns
# Tag each row with the hour taken from the datetime index, then average the
# `compCool1` and `fan` columns within each hour.
df['Hour'] = df.index.hour
hourly_energy = df.groupby('Hour')[['compCool1', 'fan']].mean()

# Grouped bar chart, one pair of bars per hour; the legend entries replace the
# raw column names in column order.
energy_ax = hourly_energy.plot.bar(figsize=(12, 6))
energy_ax.set_title('Average Hourly Energy Consumption')
energy_ax.set_xlabel('Hour of Day')
energy_ax.set_ylabel('Energy Consumption')
energy_ax.legend(['Cooling', 'Fan'])
plt.tight_layout()
plt.show()