# Combined EDA - High Frequency and Low Frequency Features

This notebook combines the high-frequency (HF) and low-frequency (LF) features into a single DataFrame. It then explores the relationships among the features and wraps up the data preparation step, so that the data is ready for machine learning.

In [1]:
# Standard Library Modules
from pathlib import Path

# Pip Modules
import pandas as pd
import matplotlib.pyplot as plt

# Custom Modules
from src.utilities import new_logger


# Pandas display configuration: remove the column and row display caps so
# that frames are rendered in full rather than elided.
pd.options.display.max_columns = None
pd.options.display.max_rows = None

In [2]:
# Start the logging object
# new_logger is a project helper imported from src.utilities; the arguments are
# presumably the logger name and the directory for log output — TODO confirm
# against its definition.
logger = new_logger("eda.comb_series", 'logs/eda')

In [3]:
# Locations of the work-in-progress feature tables.
# NOTE(review): file names suggest monthly ("mseries") and quarterly ("qseries")
# inputs — confirm against the notebooks that write them.
hf_path = Path('data/wip/mseries.wip.parquet')
lf_path = Path('data/wip/qseries.wip.parquet')

# Read each table into its own DataFrame.
hf_features = pd.read_parquet(hf_path)
lf_features = pd.read_parquet(lf_path)

In [4]:
# Combine the HF and LF features column-wise. pd.concat(axis=1) matches rows on
# index label, and join='outer' keeps every label found in either frame,
# filling the other frame's columns with NaN where a label is missing.
comb_features = pd.concat([hf_features, lf_features], axis=1, join='outer')

# Fail fast instead of carrying silently misaligned data into later steps:
# - extra rows mean the two indexes did not line up and were NaN-padded;
# - a repeated column name makes comb_features[name] return a DataFrame
#   instead of a Series.
assert len(comb_features) == len(hf_features) == len(lf_features), (
    "HF/LF indexes are misaligned: "
    f"hf={len(hf_features)}, lf={len(lf_features)}, combined={len(comb_features)}"
)
assert comb_features.columns.is_unique, (
    "duplicate column names after concat: "
    f"{comb_features.columns[comb_features.columns.duplicated()].tolist()}"
)

In [7]:
# Structural check of the combined frame: index type, column dtypes, and
# non-null counts per column.
comb_features.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 96 entries, 0 to 95
Data columns (total 46 columns):
 #   Column            Non-Null Count  Dtype  
---  ------            --------------  -----  
 0   HSN1FNSA          96 non-null     float64
 1   PERMIT1NSA        96 non-null     float64
 2   HOUST1FNSA        96 non-null     float64
 3   UNDCON1UNSA       96 non-null     float64
 4   COMPU1UNSA        96 non-null     float64
 5   ACTLISCOUUS       96 non-null     float64
 6   NEWLISCOUUS       96 non-null     float64
 7   MEDDAYONMARUS     96 non-null     float64
 8   MNMFS             96 non-null     float64
 9   MSACSRNSA         96 non-null     float64
 10  PRRESCON          96 non-null     float64
 11  WPU80             96 non-null     float64
 12  PPIACO            96 non-null     float64
 13  WPU101            96 non-null     float64
 14  WPU102            96 non-null     float64
 15  WPU081            96 non-null     float64
 16  WPU139902094      96 non-null     float64
 17 

In [8]:
# Summary statistics (count, mean, std, min, quartiles, max) for each column.
comb_features.describe()

Unnamed: 0,HSN1FNSA,PERMIT1NSA,HOUST1FNSA,UNDCON1UNSA,COMPU1UNSA,ACTLISCOUUS,NEWLISCOUUS,MEDDAYONMARUS,MNMFS,MSACSRNSA,PRRESCON,WPU80,PPIACO,WPU101,WPU102,WPU081,WPU139902094,FMNHSHPSIUS,UNRATE,ADPMINDCONNERNSA,ADPMNUSNERNSA,CSUSHPINSA,UMCSENT,CUUR0000SEHA,MORTGAGE30US,MORTGAGE15US,OBMMIVA30YF,OBMMIJUMBO30YF,OBMMIFHA30YF,OBMMIC30YF,OBMMIUSDA30YF,OBMMIC30YFNA,OBMMIC15YF,MSPUS,ASPUS,RCMFLOACT,RCMFLOLTVPCT50,RCMFLOLTVPCT75,RCMFLOLTVPCT90,DRSFRMACBN,RRVRUSQ156N,RHORUSQ156N,MEHOINUSA646N,MEPAINUSA646N,SPPOPGROWUSA,POPTOTUSA647NWDB
count,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0,96.0
mean,57.260417,78.208333,80.160417,611.739583,77.701042,869643.8,422925.0,56.020833,3.111458,6.60625,60414.09375,136.649354,223.976844,282.461292,289.080042,263.613865,137.031135,77.797917,4.586458,7414542.0,126367400.0,251.354687,80.892708,354.882333,4.692708,4.044792,4.532073,4.841531,4.81801,4.84076,4.760229,4.677948,4.16075,369693.75,439437.5,289069.5625,76.34375,83.3125,93.9375,2.470625,6.528125,65.275,71341.25,37857.5,0.592982,332497100.0
std,9.911445,13.261124,13.10229,111.847299,9.943308,291824.9,85923.632947,12.910199,0.714639,1.89358,15355.481606,20.402664,29.16311,71.436037,46.902823,59.939845,16.581452,10.275202,1.921711,433378.6,4776302.0,49.233089,15.063181,37.137937,1.489707,1.443266,1.404221,1.478837,1.32707,1.429598,1.370809,1.414088,1.414617,49189.427218,61327.672555,138690.680992,3.914422,2.769429,1.896326,0.670194,0.495177,0.963874,7446.145912,4184.104507,0.236866,4136002.0
min,38.0,50.9,52.6,424.4,52.7,346514.0,215940.0,30.0,1.5,3.4,34714.0,111.8,185.5,200.4,220.4,203.1,112.0,56.7,3.4,6580000.0,116266000.0,184.633,50.0,303.467,2.67,2.1,2.347,2.822,2.71,2.77,2.634,2.69,2.241,313000.0,371100.0,79061.0,68.0,80.0,90.0,1.68,5.6,63.6,61140.0,31960.0,0.157317,326608600.0
25%,50.0,68.85,72.475,516.975,71.225,616235.8,368866.0,47.75,2.6,5.175,48634.75,120.3,198.55,214.05,244.425,216.7,119.55,70.375,3.675,7144750.0,123182500.0,205.33175,68.125,325.4015,3.54,2.9875,3.43275,3.7295,3.8565,3.74275,3.74775,3.56425,3.0585,322725.0,381625.0,129737.0,74.5,80.0,93.75,1.8075,6.275,64.375,66802.5,35315.0,0.488438,329802100.0
50%,56.0,79.2,80.9,594.65,78.8,855739.0,426440.0,55.0,3.15,6.25,59100.5,125.25,204.7,248.75,283.15,249.672,134.75,77.0,3.95,7344000.0,126189500.0,235.364,79.2,344.6065,4.195,3.63,4.299,4.3975,4.5985,4.4855,4.437,4.3295,3.805,346800.0,409000.0,313623.5,78.5,84.5,95.0,2.395,6.6,65.45,69740.0,36750.0,0.581089,331838700.0
75%,62.0,85.85,89.55,690.3,84.45,1151889.0,493544.0,64.0,3.525,7.7,73744.75,162.5845,254.1265,333.252,331.95175,278.1005,151.02725,87.025,4.4,7762250.0,130554000.0,302.05725,96.825,386.32975,6.3675,5.59,6.06625,6.44275,6.36175,6.41025,6.249,6.2,5.78025,418700.0,502400.0,360420.0,79.25,85.0,95.0,2.8625,6.9,65.8,76087.5,40915.0,0.727553,334714500.0
max,85.0,111.3,111.6,839.0,100.6,1325376.0,584354.0,88.0,5.1,11.4,88297.0,166.682,280.251,433.525,376.168,462.0,163.808,93.8,14.8,8309000.0,134890000.0,325.67,101.4,428.151,7.79,7.03,7.399,7.942,7.437,7.777,7.525,7.621,6.999,442600.0,525100.0,513695.0,80.0,88.0,95.0,3.9,7.5,67.9,83730.0,45140.0,0.976422,340111000.0


In [5]:
# Preview the first 12 rows of the combined frame.
comb_features.head(12)

Unnamed: 0,HSN1FNSA,PERMIT1NSA,HOUST1FNSA,UNDCON1UNSA,COMPU1UNSA,ACTLISCOUUS,NEWLISCOUUS,MEDDAYONMARUS,MNMFS,MSACSRNSA,PRRESCON,WPU80,PPIACO,WPU101,WPU102,WPU081,WPU139902094,FMNHSHPSIUS,UNRATE,ADPMINDCONNERNSA,ADPMNUSNERNSA,CSUSHPINSA,UMCSENT,CUUR0000SEHA,MORTGAGE30US,MORTGAGE15US,OBMMIVA30YF,OBMMIJUMBO30YF,OBMMIFHA30YF,OBMMIC30YF,OBMMIUSDA30YF,OBMMIC30YFNA,OBMMIC15YF,MSPUS,ASPUS,RCMFLOACT,RCMFLOLTVPCT50,RCMFLOLTVPCT75,RCMFLOLTVPCT90,DRSFRMACBN,RRVRUSQ156N,RHORUSQ156N,MEHOINUSA646N,MEPAINUSA646N,SPPOPGROWUSA,POPTOTUSA647NWDB
0,45.0,53.7,53.1,424.4,55.0,1154139.0,387202.0,88.0,3.2,5.8,34714.0,111.8,190.7,204.8,220.4,203.1,112.0,82.7,4.7,6580000.0,120579000.0,184.633,98.5,303.467,4.19,3.4,4.045,4.349,4.275,4.422,4.384,4.309,3.56,313100.0,374800.0,300010.0,75.0,80.0,95.0,3.9,7.0,63.6,61140.0,31960.0,0.692906,326608609.0
1,51.0,57.8,58.8,430.4,52.7,1151139.0,437754.0,82.0,3.4,5.1,36399.0,111.8,191.6,207.3,225.8,210.1,112.0,88.3,4.6,6592000.0,120009000.0,185.001,96.3,304.211,4.16,3.37,4.012,4.294,4.215,4.364,4.14,4.224,3.535,313100.0,374800.0,300010.0,75.0,80.0,95.0,3.9,7.0,63.6,61140.0,31960.0,0.692906,326608609.0
2,61.0,77.1,69.5,435.0,62.4,1172731.0,509098.0,62.0,3.6,4.3,42366.0,111.9,191.5,213.3,225.2,211.8,112.0,84.5,4.4,6608000.0,120172000.0,186.51,96.9,304.868,4.14,3.39,4.091,4.312,4.313,4.413,4.184,4.325,3.557,313100.0,374800.0,300010.0,75.0,80.0,95.0,3.9,7.0,63.6,61140.0,31960.0,0.692906,326608609.0
3,56.0,69.3,76.9,450.9,60.1,1198445.0,555252.0,58.0,3.7,4.6,44596.0,112.4,193.0,212.0,227.4,215.9,112.2,86.7,4.4,6638000.0,120687000.0,188.524,97.0,305.477,4.03,3.27,3.972,4.202,4.231,4.295,4.181,4.137,3.471,318200.0,376900.0,329025.0,80.0,85.0,95.0,3.6,7.3,63.7,61140.0,31960.0,0.692906,326608609.0
4,57.0,78.4,76.9,461.4,66.9,1253871.0,566590.0,55.0,3.1,4.7,46910.0,112.5,192.8,213.7,226.0,218.3,112.2,86.2,4.4,6708000.0,121436000.0,190.519,97.1,306.379,3.95,3.19,3.924,4.068,4.159,4.223,4.104,4.07,3.402,318200.0,376900.0,329025.0,80.0,85.0,95.0,3.6,7.3,63.7,61140.0,31960.0,0.692906,326608609.0
5,56.0,81.8,83.8,473.5,71.3,1292389.0,539118.0,56.0,2.9,4.9,49085.0,112.6,193.6,213.9,226.6,216.1,113.9,88.3,4.3,6829000.0,123272000.0,192.243,95.0,307.314,3.88,3.17,4.049,4.17,4.252,4.264,4.162,4.108,3.412,318200.0,376900.0,329025.0,80.0,85.0,95.0,3.6,7.3,63.7,61140.0,31960.0,0.692906,326608609.0
6,48.0,69.2,79.4,482.8,69.4,1322676.0,533556.0,59.0,2.8,5.8,50273.0,113.9,193.5,215.9,227.6,216.9,113.9,86.8,4.3,6915000.0,124412000.0,193.487,93.4,308.173,3.92,3.2,3.975,4.093,4.233,4.235,4.1,4.086,3.401,320500.0,373200.0,355397.0,80.0,85.0,95.0,3.62,7.5,63.9,61140.0,31960.0,0.692906,326608609.0
7,45.0,76.6,78.1,493.8,65.6,1325376.0,500084.0,61.0,3.1,6.4,49957.0,113.9,193.8,214.1,233.6,222.1,113.9,88.0,4.4,6952000.0,124592000.0,194.32,96.8,309.479,3.82,3.12,3.917,4.056,4.167,4.138,4.032,3.983,3.331,320500.0,373200.0,355397.0,80.0,85.0,95.0,3.62,7.5,63.9,61140.0,31960.0,0.692906,326608609.0
8,50.0,66.6,72.5,498.1,68.2,1308624.0,439208.0,64.0,3.2,5.7,48694.0,113.9,194.8,215.7,240.4,220.7,113.9,88.3,4.3,6948000.0,124395000.0,194.79,95.1,310.268,3.83,3.13,3.93,4.121,4.189,4.173,4.098,4.004,3.407,320500.0,373200.0,355397.0,80.0,85.0,95.0,3.62,7.5,63.9,61140.0,31960.0,0.692906,326608609.0
9,49.0,71.0,75.7,500.0,73.3,1287341.0,428158.0,68.0,3.2,5.9,48002.0,114.5,194.9,211.5,241.5,223.6,113.9,85.2,4.2,6960000.0,124500000.0,195.055,100.7,311.501,3.94,3.25,3.979,4.235,4.247,4.216,4.147,4.061,3.49,337900.0,399700.0,339365.0,79.0,83.0,95.0,3.73,6.9,64.2,61140.0,31960.0,0.692906,326608609.0


In [6]:
# Preview the last 12 rows of the combined frame.
comb_features.tail(12)

Unnamed: 0,HSN1FNSA,PERMIT1NSA,HOUST1FNSA,UNDCON1UNSA,COMPU1UNSA,ACTLISCOUUS,NEWLISCOUUS,MEDDAYONMARUS,MNMFS,MSACSRNSA,PRRESCON,WPU80,PPIACO,WPU101,WPU102,WPU081,WPU139902094,FMNHSHPSIUS,UNRATE,ADPMINDCONNERNSA,ADPMNUSNERNSA,CSUSHPINSA,UMCSENT,CUUR0000SEHA,MORTGAGE30US,MORTGAGE15US,OBMMIVA30YF,OBMMIJUMBO30YF,OBMMIFHA30YF,OBMMIC30YF,OBMMIUSDA30YF,OBMMIC30YFNA,OBMMIC15YF,MSPUS,ASPUS,RCMFLOACT,RCMFLOLTVPCT50,RCMFLOLTVPCT75,RCMFLOLTVPCT90,DRSFRMACBN,RRVRUSQ156N,RHORUSQ156N,MEHOINUSA646N,MEPAINUSA646N,SPPOPGROWUSA,POPTOTUSA647NWDB
84,58.0,77.2,70.3,664.6,61.8,665603.0,295190.0,69.0,2.7,7.9,62796.0,163.998,251.306,338.362,321.658,246.536,159.199,70.7,3.7,7877000.0,131172000.0,310.809,79.0,412.019,6.69,5.96,6.091,6.973,6.37,6.528,6.36,6.377,5.861,426800.0,519700.0,79061.0,76.0,84.0,95.0,1.73,6.6,65.6,83730.0,45140.0,0.976422,340110988.0
85,58.0,80.5,82.2,664.2,81.6,664745.0,339380.0,61.0,2.5,7.8,63898.0,163.963,254.926,344.739,322.158,248.576,158.408,72.8,3.9,7867000.0,130546000.0,312.735,76.9,413.695,6.94,6.26,6.5,7.347,6.655,6.885,6.766,6.752,6.344,426800.0,519700.0,79061.0,76.0,84.0,95.0,1.73,6.6,65.6,83730.0,45140.0,0.976422,340110988.0
86,65.0,86.0,88.8,673.4,78.9,694844.0,395536.0,50.0,2.8,7.0,73435.0,164.201,255.095,321.137,327.703,251.805,157.704,71.9,3.9,7890000.0,130578000.0,316.919,79.4,415.219,6.79,6.11,6.312,6.931,6.455,6.731,6.45,6.61,6.004,426800.0,519700.0,79061.0,76.0,84.0,95.0,1.73,6.6,65.6,83730.0,45140.0,0.976422,340110988.0
87,65.0,94.3,96.1,673.0,91.0,734324.0,432032.0,47.0,2.3,7.0,79721.0,164.816,256.978,314.128,336.562,254.976,161.653,71.9,3.9,7942000.0,131024000.0,320.848,77.2,416.386,7.17,6.44,6.798,7.396,6.909,7.242,6.825,7.12,6.632,414500.0,502200.0,108278.0,79.0,86.0,95.0,1.68,6.6,65.6,83730.0,45140.0,0.976422,340110988.0
88,61.0,94.4,91.6,676.6,86.2,787726.0,433906.0,45.0,2.4,7.6,85582.0,164.841,255.313,314.168,351.2,250.461,162.584,69.4,4.0,8048000.0,131666000.0,323.795,69.1,417.772,7.03,6.36,6.582,7.156,6.749,7.02,6.801,6.895,6.346,414500.0,502200.0,108278.0,79.0,86.0,95.0,1.68,6.6,65.6,83730.0,45140.0,0.976422,340110988.0
89,58.0,83.8,93.3,671.3,93.1,839960.0,426092.0,48.0,2.1,8.1,87280.0,165.347,255.914,308.611,351.993,250.044,161.738,72.6,4.1,8168000.0,133217000.0,325.348,68.2,418.82,6.86,6.16,6.462,7.182,6.665,6.938,6.711,6.749,6.379,414500.0,502200.0,108278.0,79.0,86.0,95.0,1.68,6.6,65.6,83730.0,45140.0,0.976422,340110988.0
90,61.0,85.7,80.9,658.6,91.3,883905.0,405404.0,51.0,2.2,7.7,87211.0,166.518,257.321,301.282,351.282,247.533,162.229,71.5,4.2,8274000.0,134401000.0,325.67,66.4,420.577,6.78,6.07,6.146,6.979,6.532,6.674,6.466,6.513,5.926,415300.0,498700.0,115373.0,78.0,85.0,95.0,1.7,6.9,65.6,83730.0,45140.0,0.976422,340110988.0
91,56.0,85.8,89.5,657.0,89.3,908944.0,383552.0,53.0,2.2,8.5,87396.0,166.513,255.463,295.464,342.036,251.601,161.64,72.1,4.2,8309000.0,134503000.0,325.113,67.9,422.223,6.35,5.51,5.786,6.639,6.13,6.368,6.212,6.192,5.677,415300.0,498700.0,115373.0,78.0,85.0,95.0,1.7,6.9,65.6,83730.0,45140.0,0.976422,340110988.0
92,58.0,76.4,89.4,661.2,84.6,940291.0,399754.0,55.0,2.5,8.2,81506.0,166.682,252.682,291.516,345.676,255.227,161.946,73.9,4.1,8298000.0,134280000.0,324.744,70.1,423.821,6.08,5.16,5.631,6.416,5.883,6.138,5.977,5.99,5.364,415300.0,498700.0,115373.0,78.0,85.0,95.0,1.7,6.9,65.6,83730.0,45140.0,0.976422,340110988.0
93,46.0,83.9,79.6,651.5,85.8,954201.0,365692.0,58.0,2.4,10.6,79615.0,166.36,253.081,294.235,353.984,258.077,162.647,74.6,4.1,8308000.0,134581000.0,324.065,70.5,425.381,6.72,5.99,6.359,6.823,6.425,6.786,6.601,6.639,6.056,419300.0,510900.0,120851.0,75.0,83.0,95.0,1.81,6.9,65.7,83730.0,45140.0,0.976422,340110988.0
