# Monday, July 18 2022 Data Analysis of Window Opening and Closing Experiment (First Run)
Data collected from July 10 - July 15 2022

In [None]:
# plot temp, rh data, highlight window openings and closings 
# try to get data from outside weather station
# see if there is significant divergence for window closed periods? 

In [16]:
import pandas as pd
import plotly.graph_objects as go
from plotly.subplots import make_subplots

# 422 A (Windows Always Open)

In [3]:
# Location of the logger CSV export for room 422A.
trh_422a_csv = (
    "/Users/julietnwagwuume-ezeoke/My Drive/UIL/windows/hobo_temprh/"
    "TRH_4_422A_071522.csv"
)

In [4]:
# Read the 422A export. The first file line is consumed as the header (and
# replaced by the short names below), the second file line is skipped, and only
# the columns at positions 1-3 (timestamp, temperature, humidity) are kept.
trh_422a = pd.read_csv(
    trh_422a_csv,
    header=0,
    names=["DateTime", "Temp C", "RH %"],
    usecols=[1, 2, 3],
    skiprows=[1],
)
trh_422a

Unnamed: 0,DateTime,Temp C,RH %
0,07/10/22 09:45:00 PM,26.579,52.870
1,07/10/22 09:45:30 PM,26.579,53.060
2,07/10/22 09:46:00 PM,26.554,53.089
3,07/10/22 09:46:30 PM,26.505,53.177
4,07/10/22 09:47:00 PM,26.481,53.205
...,...,...,...
13318,07/15/22 12:44:00 PM,25.070,49.646
13319,07/15/22 12:44:30 PM,25.167,49.914
13320,07/15/22 12:45:00 PM,25.336,51.304
13321,07/15/22 12:45:01 PM,,


In [11]:
# Convert the string timestamps to datetime64.
# The export writes every timestamp as "MM/DD/YY hh:mm:ss AM/PM" (see the table
# displayed above), so the format is given explicitly instead of being inferred:
# parsing is then deterministic and a malformed row fails loudly.
# Re-running this cell is safe: a column that is already datetime64 is returned
# unchanged.
trh_422a["DateTime"] = pd.to_datetime(
    trh_422a["DateTime"], format="%m/%d/%y %I:%M:%S %p"
)

In [19]:
# 422A overview: temperature on the primary (left) y axis and relative humidity
# on the secondary (right) y axis, sharing one time axis.
fig = make_subplots(specs=[[{"secondary_y": True}]])

temp_trace_422a = go.Scatter(
    x=trh_422a["DateTime"],
    y=trh_422a["Temp C"],
    mode="lines",
    name="422A Temperature ºC",
)
rh_trace_422a = go.Scatter(
    x=trh_422a["DateTime"],
    y=trh_422a["RH %"],
    mode="lines",
    name="422A Rel. Humidity %",
)
fig.add_trace(temp_trace_422a, secondary_y=False)
fig.add_trace(rh_trace_422a, secondary_y=True)

# One axis title per y axis so the two scales can be told apart.
fig.update_yaxes(title_text="Temperature ºC", secondary_y=False)
fig.update_yaxes(title_text="Relative Humidity %", secondary_y=True)

fig.update_layout(title_text="422A Temperature and RH")

fig.show()

# 422 B (Windows Sometimes Open)

In [21]:
# Location of the logger CSV export for room 422B.
trh_422b_csv = (
    "/Users/julietnwagwuume-ezeoke/My Drive/UIL/windows/hobo_temprh/"
    "TRH_2_422B_071522.csv"
)

# Same loading recipe as for 422A: keep the timestamp / temperature / humidity
# columns under short names, then turn the timestamp strings into datetimes.
trh_422b = pd.read_csv(
    trh_422b_csv,
    header=0,
    names=["DateTime", "Temp C", "RH %"],
    usecols=[1, 2, 3],
    skiprows=[1],
).assign(DateTime=lambda frame: pd.to_datetime(frame["DateTime"]))
trh_422b

Unnamed: 0,DateTime,Temp C,RH %
0,2022-07-10 21:45:00,27.142,52.248
1,2022-07-10 21:45:30,27.093,52.305
2,2022-07-10 21:46:00,27.044,52.171
3,2022-07-10 21:46:30,26.970,52.448
4,2022-07-10 21:47:00,26.921,52.632
...,...,...,...
13321,2022-07-15 12:44:42,,
13322,2022-07-15 12:44:49,,
13323,2022-07-15 12:44:52,,
13324,2022-07-15 12:44:53,,


In [22]:
# 422B overview: temperature on the primary (left) y axis and relative humidity
# on the secondary (right) y axis, sharing one time axis.
fig = make_subplots(specs=[[{"secondary_y": True}]])

temp_trace_422b = go.Scatter(
    x=trh_422b["DateTime"],
    y=trh_422b["Temp C"],
    mode="lines",
    name="422B Temperature ºC",
)
rh_trace_422b = go.Scatter(
    x=trh_422b["DateTime"],
    y=trh_422b["RH %"],
    mode="lines",
    name="422B Rel. Humidity %",
)
fig.add_trace(temp_trace_422b, secondary_y=False)
fig.add_trace(rh_trace_422b, secondary_y=True)

# One axis title per y axis so the two scales can be told apart.
fig.update_yaxes(title_text="Temperature ºC", secondary_y=False)
fig.update_yaxes(title_text="Relative Humidity %", secondary_y=True)

fig.update_layout(title_text="422B Temperature and RH")

fig.show()

# Comparison of Data Sets 

In [None]:
# align data sets
# cut off both times at 12:30pm on 7/15
# then have data ranging from sunday 7/10, 9:45pm to fri 7/15 12:30pm 

In [32]:
# Trim both series to a common end so they can be compared directly.
# The bound is 12:30:30 and the comparison is strict, so the 12:30:00 sample on
# July 15 is the last one that can be kept.
endtime = pd.Timestamp(year=2022, month=7, day=15, hour=12, minute=30, second=30)

before_end_422a = trh_422a["DateTime"].lt(endtime)
before_end_422b = trh_422b["DateTime"].lt(endtime)

trh_422a_cutoff = trh_422a.loc[before_end_422a]
trh_422b_cutoff = trh_422b.loc[before_end_422b]

In [34]:

# Overlay the trimmed temperature series of both rooms on a single y axis.
fig = make_subplots()

temp_trace_a = go.Scatter(
    x=trh_422a_cutoff["DateTime"],
    y=trh_422a_cutoff["Temp C"],
    mode="lines",
    name="422A Temperature ºC",
)
temp_trace_b = go.Scatter(
    x=trh_422b_cutoff["DateTime"],
    y=trh_422b_cutoff["Temp C"],
    mode="lines",
    name="422B Temperature ºC",
)
fig.add_trace(temp_trace_a)
fig.add_trace(temp_trace_b)

fig.update_yaxes(title_text="Temperature ºC", secondary_y=False)

fig.update_layout(title_text="422A vs 422B Temperature")

fig.show()

In [40]:
# Window-closed periods, recorded as start/end timestamps so they can be
# highlighted on the plots.

# closed period 0: Monday 7/11, 3:36pm -> 11:40pm
c0_start = pd.Timestamp(year=2022, month=7, day=11, hour=15, minute=36)
c0_end = pd.Timestamp(year=2022, month=7, day=11, hour=23, minute=40)

# closed period 1: Tuesday 7/12, 8:00am -> 6:40pm
c1_start = pd.Timestamp(year=2022, month=7, day=12, hour=8, minute=0)
c1_end = pd.Timestamp(year=2022, month=7, day=12, hour=18, minute=40)

# closed period 2: Thursday 7/14, 10:50am -> 8:28pm
c2_start = pd.Timestamp(year=2022, month=7, day=14, hour=10, minute=50)
c2_end = pd.Timestamp(year=2022, month=7, day=14, hour=20, minute=28)

In [41]:
# Bottom and top edges of the shaded rectangles, in y-axis units.
y0 = 21
y1 = 28

# One light-gray rectangle per window-closed period, drawn beneath the traces.
# Every rectangle shares the same styling; only the start/end times differ.
fig.update_layout(
    shapes=[
        dict(
            type="rect",
            xref="x",
            yref="y",
            x0=period_start,
            y0=y0,
            x1=period_end,
            y1=y1,
            fillcolor="lightgray",
            opacity=0.4,
            line_width=0,
            layer="below",
        )
        for period_start, period_end in (
            (c0_start, c0_end),
            (c1_start, c1_end),
            (c2_start, c2_end),
        )
    ]
)

fig.show()

Grey shading indicates the periods when the windows in 422B were closed.

In [None]:
# todo 
# calculate statistics, mean, std dev of t and rh, time lag...
# what could be causing the  in the relative humidity? bc they are not all at noon... could it be measurement error? 
# compare to stanford temp data... 
# analyze temperature diff in window closed period vs other times...