# Houston, TX Regressions
Multiple linear regressions comparing EnergyPlus (E+) v9.2 and v9.5 outputs.

In [1]:
# Dependencies
import pandas as pd
from matplotlib import pyplot as plt
from sklearn import linear_model
import numpy as np
import statsmodels.api as sm

---

## Annual Data

In [2]:
# Load the annual results for the "95" case
# (suffix presumably denotes E+ v9.5, per the notebook title -- confirm).
hou_annual95 = pd.read_csv("data/hou_annual95_data.csv")

In [3]:
# Load the annual results for the "92" case
# (suffix presumably denotes E+ v9.2, per the notebook title -- confirm).
hou_annual92 = pd.read_csv("data/hou_annual92_data.csv")

## Merge df with performance attributes

In [4]:
# Window performance parameters (U and SHGC values) from the parameter file.
performance = pd.read_csv("data/para_values.csv")

In [5]:
# Attach the window performance attributes to the "95" annual results.
# Join key is "Scenario"; the pandas default is an inner join, so only
# scenarios present in both frames are kept.
hou_annual95_all = hou_annual95.merge(performance, on="Scenario")

In [6]:
# Attach the window performance attributes to the "92" annual results.
# Join key is "Scenario"; the pandas default is an inner join, so only
# scenarios present in both frames are kept.
hou_annual92_all = hou_annual92.merge(performance, on="Scenario")

## Get the energy data

In [7]:
# Keep only the scenario label, the two annual energy columns and the
# window properties (U-factor, SHGC). The index is left untouched.
hou_annual95_energy = hou_annual95_all[
    [
        "Scenario",
        "AnnualEnergy(kBtu)",
        "AnnualEnergy(kBtu/sf)",
        "U-factor",
        "SHGC",
    ]
]

In [8]:
# Same column selection as for the "95" frame: scenario label, the two
# annual energy columns and the window properties. Index is left untouched.
hou_annual92_energy = hou_annual92_all[
    [
        "Scenario",
        "AnnualEnergy(kBtu)",
        "AnnualEnergy(kBtu/sf)",
        "U-factor",
        "SHGC",
    ]
]

## Get the cost data

In [9]:
# Keep only the scenario label, the two annual cost columns and the
# window properties (U-factor, SHGC). The index is left untouched.
hou_annual95_cost = hou_annual95_all[
    [
        "Scenario",
        "AnnualCost($)",
        "AnnualCost($/sf)",
        "U-factor",
        "SHGC",
    ]
]

In [10]:
# Same column selection as for the "95" frame: scenario label, the two
# annual cost columns and the window properties. Index is left untouched.
hou_annual92_cost = hou_annual92_all[
    [
        "Scenario",
        "AnnualCost($)",
        "AnnualCost($/sf)",
        "U-factor",
        "SHGC",
    ]
]

## Regression Info
Reference for the approach used below (multiple linear regression in Python): <https://datatofish.com/multiple-linear-regression-python/>

------

## Regression for Annual Energy (kBtu)

In [18]:
# Section-specific names for the energy frames. These are aliases of the
# same DataFrame objects, not copies.
hou_annual95_EUI, hou_annual92_EUI = hou_annual95_energy, hou_annual92_energy

In [19]:
# Response: total annual energy column; predictors: U-factor and SHGC ("95" frame).
y = hou_annual95_EUI["AnnualEnergy(kBtu)"]
X = hou_annual95_EUI[["U-factor", "SHGC"]]

# Least-squares fit with scikit-learn; fit() returns the fitted estimator.
regr = linear_model.LinearRegression().fit(X, y)

# Coefficients are reported in the column order of X: U-factor, then SHGC.
print("Intercept: \n", regr.intercept_)
print("Coefficients: \n", regr.coef_)

Intercept: 
 41705.718775510206
Coefficients: 
 [14900.51938776 13372.11071429]


In [20]:
# Response: total annual energy column; predictors: U-factor and SHGC ("92" frame).
y = hou_annual92_EUI["AnnualEnergy(kBtu)"]
X = hou_annual92_EUI[["U-factor", "SHGC"]]

# Least-squares fit with scikit-learn; fit() returns the fitted estimator.
regr = linear_model.LinearRegression().fit(X, y)

# Coefficients are reported in the column order of X: U-factor, then SHGC.
print("Intercept: \n", regr.intercept_)
print("Coefficients: \n", regr.coef_)

Intercept: 
 41161.51428571428
Coefficients: 
 [15526.80714286 12465.36071429]


## Regression for Annual EUI (kBtu/sf)

In [23]:
# Section-specific names for the energy frames. These are aliases of the
# same DataFrame objects, not copies.
hou_annual95_EUIsf, hou_annual92_EUIsf = hou_annual95_energy, hou_annual92_energy

In [26]:
# Response: per-square-foot annual energy column; predictors: U-factor and SHGC ("95" frame).
y = hou_annual95_EUIsf["AnnualEnergy(kBtu/sf)"]
X = hou_annual95_EUIsf[["U-factor", "SHGC"]]

# Least-squares fit with scikit-learn; fit() returns the fitted estimator.
regr = linear_model.LinearRegression().fit(X, y)

# Coefficients are reported in the column order of X: U-factor, then SHGC.
print("Intercept: \n", regr.intercept_)
print("Coefficients: \n", regr.coef_)

Intercept: 
 17.376122448979594
Coefficients: 
 [6.20969388 5.57397959]


In [27]:
# Response: per-square-foot annual energy column; predictors: U-factor and SHGC ("92" frame).
y = hou_annual92_EUIsf["AnnualEnergy(kBtu/sf)"]
X = hou_annual92_EUIsf[["U-factor", "SHGC"]]

# Least-squares fit with scikit-learn; fit() returns the fitted estimator.
regr = linear_model.LinearRegression().fit(X, y)

# Coefficients are reported in the column order of X: U-factor, then SHGC.
print("Intercept: \n", regr.intercept_)
print("Coefficients: \n", regr.coef_)

Intercept: 
 17.153469387755102
Coefficients: 
 [6.46683673 5.19030612]


------

## Regression for Annual Cost ($)

In [28]:
# Section-specific names for the cost frames. These are aliases of the
# same DataFrame objects, not copies.
hou_annual95_EUIcost, hou_annual92_EUIcost = hou_annual95_cost, hou_annual92_cost

In [30]:
# Response: total annual cost column; predictors: U-factor and SHGC ("95" frame).
y = hou_annual95_EUIcost["AnnualCost($)"]
X = hou_annual95_EUIcost[["U-factor", "SHGC"]]

# Least-squares fit with scikit-learn; fit() returns the fitted estimator.
regr = linear_model.LinearRegression().fit(X, y)

# Coefficients are reported in the column order of X: U-factor, then SHGC.
print("Intercept: \n", regr.intercept_)
print("Coefficients: \n", regr.coef_)

Intercept: 
 974.4314285714286
Coefficients: 
 [180.44132653 619.40204082]


In [31]:
# Response: total annual cost column; predictors: U-factor and SHGC ("92" frame).
y = hou_annual92_EUIcost["AnnualCost($)"]
X = hou_annual92_EUIcost[["U-factor", "SHGC"]]

# Least-squares fit with scikit-learn; fit() returns the fitted estimator.
regr = linear_model.LinearRegression().fit(X, y)

# Coefficients are reported in the column order of X: U-factor, then SHGC.
print("Intercept: \n", regr.intercept_)
print("Coefficients: \n", regr.coef_)

Intercept: 
 948.2997959183672
Coefficients: 
 [202.84336735 592.04336735]


## Regression for Annual Cost ($/sf)

In [32]:
# Rename df for multiple regressions
# Section-specific names for the cost frames. These are aliases of the
# same DataFrame objects, not copies.
hou_annual95_EUIcostsf, hou_annual92_EUIcostsf = hou_annual95_cost, hou_annual92_cost

In [33]:
# Response: per-square-foot annual cost column; predictors: U-factor and SHGC ("95" frame).
y = hou_annual95_EUIcostsf["AnnualCost($/sf)"]
X = hou_annual95_EUIcostsf[["U-factor", "SHGC"]]

# Least-squares fit with scikit-learn; fit() returns the fitted estimator.
regr = linear_model.LinearRegression().fit(X, y)

# Coefficients are reported in the column order of X: U-factor, then SHGC.
print("Intercept: \n", regr.intercept_)
print("Coefficients: \n", regr.coef_)

Intercept: 
 0.40591836734693876
Coefficients: 
 [0.07397959 0.25867347]


In [34]:
# Response: per-square-foot annual cost column; predictors: U-factor and SHGC ("92" frame).
y = hou_annual92_EUIcostsf["AnnualCost($/sf)"]
X = hou_annual92_EUIcostsf[["U-factor", "SHGC"]]

# Least-squares fit with scikit-learn; fit() returns the fitted estimator.
regr = linear_model.LinearRegression().fit(X, y)

# Coefficients are reported in the column order of X: U-factor, then SHGC.
print("Intercept: \n", regr.intercept_)
print("Coefficients: \n", regr.coef_)

Intercept: 
 0.3961224489795918
Coefficients: 
 [0.08571429 0.24234694]
