## UK HPI - Sourced Data Clean


### This script contains the following:
1. Importing libraries and data
2. Cleaning data set
3. Saving cleaned data set

In [1]:
# Import Libraries

import pandas as pd
import numpy as np
import os
import matplotlib.pyplot as plt
import seaborn as sns
import scipy


In [2]:
# Project root folder. Set the UK_HPI_PROJECT_DIR environment variable to run
# this notebook on another machine; when it is unset the original location is used.
path = os.environ.get(
    'UK_HPI_PROJECT_DIR',
    r'/Users/andrew/Documents/Data Analyst Course/Data Immersion/Achievement 6/UK HPI Project/',
)

In [3]:
# Load the original UK HPI extract from <path>/Data/Original Data/
raw_csv = os.path.join(path, 'Data', 'Original Data', 'UK_HPI.csv')
df = pd.read_csv(raw_csv)

In [4]:
# Preview the first rows of the raw data
df.head()

Unnamed: 0,Date,RegionName,AreaCode,AveragePrice,Index,IndexSA,1m%Change,12m%Change,AveragePriceSA,SalesVolume,...,NewIndex,New1m%Change,New12m%Change,NewSalesVolume,OldPrice,OldIndex,Old1m%Change,Old12m%Change,OldSalesVolume,Official Interest Rate
0,1/4/1968,East Midlands,E12000004,3025.670615,1.968954,,0.0,,,,...,,,,,,,,,,
1,1/4/1968,England,E92000001,3408.108064,1.680067,,0.0,,,,...,,,,,,,,,,
2,1/4/1968,London,E12000007,4418.489911,1.096815,,0.0,,,,...,,,,,,,,,,
3,1/4/1968,Northern Ireland,N92000001,3661.4855,3.30042,,0.0,,,,...,,,,,,,,,,
4,1/4/1968,Scotland,S92000003,2844.980688,2.108087,,0.0,,,,...,,,,,,,,,,


In [5]:
# Column names, non-null counts and dtypes
df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 134211 entries, 0 to 134210
Data columns (total 55 columns):
 #   Column                  Non-Null Count   Dtype  
---  ------                  --------------   -----  
 0   Date                    134211 non-null  object 
 1   RegionName              134211 non-null  object 
 2   AreaCode                134211 non-null  object 
 3   AveragePrice            134211 non-null  float64
 4   Index                   134211 non-null  float64
 5   IndexSA                 4434 non-null    float64
 6   1m%Change               133760 non-null  float64
 7   12m%Change              129075 non-null  float64
 8   AveragePriceSA          4434 non-null    float64
 9   SalesVolume             129700 non-null  float64
 10  DetachedPrice           128052 non-null  float64
 11  DetachedIndex           128052 non-null  float64
 12  Detached1m%Change       127635 non-null  float64
 13  Detached12m%Change      123072 non-null  float64
 14  SemiDetachedPrice   

In [6]:
# Check shape of df as (rows, columns)
df.shape

(134211, 55)

In [7]:
# Check the data type of each column
df.dtypes

Date                       object
RegionName                 object
AreaCode                   object
AveragePrice              float64
Index                     float64
IndexSA                   float64
1m%Change                 float64
12m%Change                float64
AveragePriceSA            float64
SalesVolume               float64
DetachedPrice             float64
DetachedIndex             float64
Detached1m%Change         float64
Detached12m%Change        float64
SemiDetachedPrice         float64
SemiDetachedIndex         float64
SemiDetached1m%Change     float64
SemiDetached12m%Change    float64
TerracedPrice             float64
TerracedIndex             float64
Terraced1m%Change         float64
Terraced12m%Change        float64
FlatPrice                 float64
FlatIndex                 float64
Flat1m%Change             float64
Flat12m%Change            float64
CashPrice                 float64
CashIndex                 float64
Cash1m%Change             float64
Cash12m%Change

In [8]:
# Show every column when displaying a frame instead of truncating with "..."
pd.set_option('display.max_columns', None)

In [9]:
# Preview again now that all columns are displayed
df.head()

Unnamed: 0,Date,RegionName,AreaCode,AveragePrice,Index,IndexSA,1m%Change,12m%Change,AveragePriceSA,SalesVolume,DetachedPrice,DetachedIndex,Detached1m%Change,Detached12m%Change,SemiDetachedPrice,SemiDetachedIndex,SemiDetached1m%Change,SemiDetached12m%Change,TerracedPrice,TerracedIndex,Terraced1m%Change,Terraced12m%Change,FlatPrice,FlatIndex,Flat1m%Change,Flat12m%Change,CashPrice,CashIndex,Cash1m%Change,Cash12m%Change,CashSalesVolume,MortgagePrice,MortgageIndex,Mortgage1m%Change,Mortgage12m%Change,MortgageSalesVolume,FTBPrice,FTBIndex,FTB1m%Change,FTB12m%Change,FOOPrice,FOOIndex,FOO1m%Change,FOO12m%Change,NewPrice,NewIndex,New1m%Change,New12m%Change,NewSalesVolume,OldPrice,OldIndex,Old1m%Change,Old12m%Change,OldSalesVolume,Official Interest Rate
0,1/4/1968,East Midlands,E12000004,3025.670615,1.968954,,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
1,1/4/1968,England,E92000001,3408.108064,1.680067,,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
2,1/4/1968,London,E12000007,4418.489911,1.096815,,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
3,1/4/1968,Northern Ireland,N92000001,3661.4855,3.30042,,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
4,1/4/1968,Scotland,S92000003,2844.980688,2.108087,,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,


In [10]:
# Collect rows that exactly repeat an earlier row across every column
dup_mask = df.duplicated()
df_dups = df.loc[dup_mask]

In [11]:
# Display the duplicated rows (an empty frame means there are none)
df_dups

Unnamed: 0,Date,RegionName,AreaCode,AveragePrice,Index,IndexSA,1m%Change,12m%Change,AveragePriceSA,SalesVolume,DetachedPrice,DetachedIndex,Detached1m%Change,Detached12m%Change,SemiDetachedPrice,SemiDetachedIndex,SemiDetached1m%Change,SemiDetached12m%Change,TerracedPrice,TerracedIndex,Terraced1m%Change,Terraced12m%Change,FlatPrice,FlatIndex,Flat1m%Change,Flat12m%Change,CashPrice,CashIndex,Cash1m%Change,Cash12m%Change,CashSalesVolume,MortgagePrice,MortgageIndex,Mortgage1m%Change,Mortgage12m%Change,MortgageSalesVolume,FTBPrice,FTBIndex,FTB1m%Change,FTB12m%Change,FOOPrice,FOOIndex,FOO1m%Change,FOO12m%Change,NewPrice,NewIndex,New1m%Change,New12m%Change,NewSalesVolume,OldPrice,OldIndex,Old1m%Change,Old12m%Change,OldSalesVolume,Official Interest Rate


In [12]:
# No duplicate rows found

In [13]:
# Remove the AreaCode column
df = df.drop('AreaCode', axis='columns')

In [14]:
# Remove IndexSA: df.info() reports only 4,434 non-null values in 134,211 rows
df = df.drop('IndexSA', axis='columns')

In [15]:
# Remove AveragePriceSA: df.info() reports only 4,434 non-null values in 134,211 rows
df = df.drop('AveragePriceSA', axis='columns')

In [16]:
# Check the three columns (AreaCode, IndexSA, AveragePriceSA) are gone
df.head()

Unnamed: 0,Date,RegionName,AveragePrice,Index,1m%Change,12m%Change,SalesVolume,DetachedPrice,DetachedIndex,Detached1m%Change,Detached12m%Change,SemiDetachedPrice,SemiDetachedIndex,SemiDetached1m%Change,SemiDetached12m%Change,TerracedPrice,TerracedIndex,Terraced1m%Change,Terraced12m%Change,FlatPrice,FlatIndex,Flat1m%Change,Flat12m%Change,CashPrice,CashIndex,Cash1m%Change,Cash12m%Change,CashSalesVolume,MortgagePrice,MortgageIndex,Mortgage1m%Change,Mortgage12m%Change,MortgageSalesVolume,FTBPrice,FTBIndex,FTB1m%Change,FTB12m%Change,FOOPrice,FOOIndex,FOO1m%Change,FOO12m%Change,NewPrice,NewIndex,New1m%Change,New12m%Change,NewSalesVolume,OldPrice,OldIndex,Old1m%Change,Old12m%Change,OldSalesVolume,Official Interest Rate
0,1/4/1968,East Midlands,3025.670615,1.968954,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
1,1/4/1968,England,3408.108064,1.680067,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
2,1/4/1968,London,4418.489911,1.096815,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
3,1/4/1968,Northern Ireland,3661.4855,3.30042,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
4,1/4/1968,Scotland,2844.980688,2.108087,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,


In [17]:
# Fill every missing value with 0
# NOTE(review): after this step a 0 can mean "missing" as well as a real zero, so
# the 0.0 minimums for price columns in df.describe() come from this fill - confirm
# that downstream analysis treats zeros accordingly.
df = df.fillna(0)

In [18]:
# Confirm the previously missing values now show as 0.0
df.head()

Unnamed: 0,Date,RegionName,AveragePrice,Index,1m%Change,12m%Change,SalesVolume,DetachedPrice,DetachedIndex,Detached1m%Change,Detached12m%Change,SemiDetachedPrice,SemiDetachedIndex,SemiDetached1m%Change,SemiDetached12m%Change,TerracedPrice,TerracedIndex,Terraced1m%Change,Terraced12m%Change,FlatPrice,FlatIndex,Flat1m%Change,Flat12m%Change,CashPrice,CashIndex,Cash1m%Change,Cash12m%Change,CashSalesVolume,MortgagePrice,MortgageIndex,Mortgage1m%Change,Mortgage12m%Change,MortgageSalesVolume,FTBPrice,FTBIndex,FTB1m%Change,FTB12m%Change,FOOPrice,FOOIndex,FOO1m%Change,FOO12m%Change,NewPrice,NewIndex,New1m%Change,New12m%Change,NewSalesVolume,OldPrice,OldIndex,Old1m%Change,Old12m%Change,OldSalesVolume,Official Interest Rate
0,1/4/1968,East Midlands,3025.670615,1.968954,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
1,1/4/1968,England,3408.108064,1.680067,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
2,1/4/1968,London,4418.489911,1.096815,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
3,1/4/1968,Northern Ireland,3661.4855,3.30042,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
4,1/4/1968,Scotland,2844.980688,2.108087,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [19]:
# Summary statistics for the numeric columns
df.describe()

Unnamed: 0,AveragePrice,Index,1m%Change,12m%Change,SalesVolume,DetachedPrice,DetachedIndex,Detached1m%Change,Detached12m%Change,SemiDetachedPrice,SemiDetachedIndex,SemiDetached1m%Change,SemiDetached12m%Change,TerracedPrice,TerracedIndex,Terraced1m%Change,Terraced12m%Change,FlatPrice,FlatIndex,Flat1m%Change,Flat12m%Change,CashPrice,CashIndex,Cash1m%Change,Cash12m%Change,CashSalesVolume,MortgagePrice,MortgageIndex,Mortgage1m%Change,Mortgage12m%Change,MortgageSalesVolume,FTBPrice,FTBIndex,FTB1m%Change,FTB12m%Change,FOOPrice,FOOIndex,FOO1m%Change,FOO12m%Change,NewPrice,NewIndex,New1m%Change,New12m%Change,NewSalesVolume,OldPrice,OldIndex,Old1m%Change,Old12m%Change,OldSalesVolume,Official Interest Rate
count,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0,134211.0
mean,163427.4,79.255567,0.564992,6.264851,1157.696466,273770.2,76.880681,0.481296,5.848656,175090.5,76.380743,0.494443,6.006006,139050.7,75.793135,0.500217,6.094223,107796.5,79.334253,0.439878,5.417949,79109.26,38.227582,0.131417,1.382196,108.953215,82631.46,38.311919,0.136655,1.433418,242.505897,68519.9,38.509102,0.133282,1.385322,92187.62,38.338664,0.136555,1.439291,185428.6,76.848678,0.512866,6.02566,121.082075,156718.8,75.877106,0.478966,5.857645,1030.102957,3.037701
std,109334.0,33.828848,2.000833,8.940264,7374.891913,247854.2,35.270341,1.720731,8.019927,187899.3,35.886357,1.710257,8.459564,138705.5,36.154295,1.743957,8.800032,87320.9,35.215872,1.786325,9.180978,131766.9,52.628027,0.896041,3.319236,1169.381979,135310.0,52.775205,0.89457,3.35721,2584.114181,113093.5,52.684248,0.908627,3.355979,151778.7,52.814931,0.89601,3.353963,118196.1,36.497303,1.778515,8.284237,794.074005,111659.9,35.655336,1.745179,8.588847,6594.366115,2.736837
min,2712.016,1.096815,-30.297781,-35.786566,0.0,0.0,0.0,-19.628465,-30.193434,0.0,0.0,-19.668017,-29.358801,0.0,0.0,-19.960934,-29.446217,0.0,0.0,-30.295111,-28.841733,0.0,0.0,-19.179237,-27.416238,0.0,0.0,0.0,-19.090431,-27.917896,0.0,0.0,0.0,-19.083397,-28.292518,0.0,0.0,-19.133937,-27.435825,0.0,0.0,-29.816368,-28.851244,0.0,0.0,0.0,-30.587732,-30.341125,0.0,0.0
25%,91593.47,45.444697,-0.440224,0.800547,131.0,142945.4,44.845547,-0.399038,0.266908,87594.89,42.129922,-0.371709,0.254597,68051.2,40.104934,-0.395144,0.087125,57455.26,45.305394,-0.479876,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,99741.62,42.855799,-0.394824,0.340064,8.0,82871.07,41.717318,-0.392053,0.0,114.0,0.5
50%,144337.1,87.686225,0.518197,5.114394,206.0,225670.3,85.447358,0.410076,4.822487,141330.6,85.711544,0.422674,4.790006,113489.6,86.069521,0.426008,4.771888,93864.54,90.810242,0.354238,3.783462,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,175080.3,85.611239,0.436566,4.914291,19.0,140082.5,85.945399,0.39974,4.580468,182.0,3.5
75%,205503.9,104.108997,1.513763,10.433046,356.0,326322.9,102.072216,1.416553,9.95233,207354.8,102.583902,1.402442,9.987919,168959.3,103.101615,1.438311,10.26298,132941.8,106.769503,1.380445,9.689537,147652.1,99.291575,0.0,0.785533,40.0,156615.8,99.306142,0.0,1.00135,89.0,131515.8,99.421528,0.0,0.849049,172953.6,99.296917,0.0,1.017131,239089.8,102.518696,1.477428,10.256043,42.0,201332.8,102.519661,1.39778,9.965059,319.0,5.25
max,1463378.0,221.485238,35.286646,98.43794,146470.0,3755824.0,197.988967,34.812357,92.630423,3768069.0,191.991575,35.295354,101.591679,2589000.0,217.656918,36.277412,106.853691,1287157.0,205.906634,36.067605,102.677794,1461413.0,161.927419,21.105819,52.385088,51356.0,1465566.0,164.159602,21.48771,51.176273,84491.0,1278535.0,162.001177,24.250435,50.819283,1656861.0,164.566228,21.329996,51.963758,1264384.0,185.158633,34.946588,96.170727,21097.33333,1479584.0,207.47874,35.552952,98.648458,136069.0,17.0


In [20]:
# Shape after dropping the three columns
df.shape

(134211, 52)

In [21]:
# Plain-text rendering of the same summary statistics
print(df.describe())

       AveragePrice          Index      1m%Change     12m%Change  \
count  1.342110e+05  134211.000000  134211.000000  134211.000000   
mean   1.634274e+05      79.255567       0.564992       6.264851   
std    1.093340e+05      33.828848       2.000833       8.940264   
min    2.712016e+03       1.096815     -30.297781     -35.786566   
25%    9.159347e+04      45.444697      -0.440224       0.800547   
50%    1.443371e+05      87.686225       0.518197       5.114394   
75%    2.055039e+05     104.108997       1.513763      10.433046   
max    1.463378e+06     221.485238      35.286646      98.437940   

         SalesVolume  DetachedPrice  DetachedIndex  Detached1m%Change  \
count  134211.000000   1.342110e+05  134211.000000      134211.000000   
mean     1157.696466   2.737702e+05      76.880681           0.481296   
std      7374.891913   2.478542e+05      35.270341           1.720731   
min         0.000000   0.000000e+00       0.000000         -19.628465   
25%       131.000000  

In [None]:
# Properties for England and Wales only begin to be added from 01/01/1995, so all data before that date will be removed

In [22]:
# Use the Date column as the row index; df itself is left unchanged
df_2 = df.set_index(keys='Date', drop=True)

In [23]:
# Filter out dates before 1st Jan 1995
# The index holds date *strings*, so a label slice such as .loc['1/1/1995':] only
# cuts the frame positionally at the first matching row: it depends on the file
# being in chronological order and raises KeyError if the matching rows are not
# contiguous. Comparing parsed dates removes that dependency on row order.
# Assumes the strings are day/month/year (e.g. '1/4/1968') - TODO confirm against the source file.
cutoff = pd.Timestamp(year=1995, month=1, day=1)
row_dates = pd.to_datetime(df_2.index, format='%d/%m/%Y')
# The index itself stays as the original strings so the saved CSV keeps its date format.
df_2 = df_2.loc[row_dates >= cutoff]

In [24]:
# Check the filtered frame now starts at 1/1/1995
df_2.head()

Unnamed: 0_level_0,RegionName,AveragePrice,Index,1m%Change,12m%Change,SalesVolume,DetachedPrice,DetachedIndex,Detached1m%Change,Detached12m%Change,SemiDetachedPrice,SemiDetachedIndex,SemiDetached1m%Change,SemiDetached12m%Change,TerracedPrice,TerracedIndex,Terraced1m%Change,Terraced12m%Change,FlatPrice,FlatIndex,Flat1m%Change,Flat12m%Change,CashPrice,CashIndex,Cash1m%Change,Cash12m%Change,CashSalesVolume,MortgagePrice,MortgageIndex,Mortgage1m%Change,Mortgage12m%Change,MortgageSalesVolume,FTBPrice,FTBIndex,FTB1m%Change,FTB12m%Change,FOOPrice,FOOIndex,FOO1m%Change,FOO12m%Change,NewPrice,NewIndex,New1m%Change,New12m%Change,NewSalesVolume,OldPrice,OldIndex,Old1m%Change,Old12m%Change,OldSalesVolume,Official Interest Rate
Date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1
1/1/1995,Adur,54516.42545,21.83662,0.0,0.0,79.0,85482.01252,22.699081,0.0,0.0,59598.67451,21.526612,0.0,0.0,48955.96381,20.454703,0.0,0.0,38126.03274,23.79074,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,59255.49943,22.378461,0.0,0.0,11.0,54372.37389,21.788639,0.0,0.0,68.0,6.13
1/1/1995,Allerdale,44464.03724,32.815689,0.0,0.0,70.0,67547.91981,34.139554,0.0,0.0,42776.09928,32.499311,0.0,0.0,35513.54992,31.944308,0.0,0.0,32808.34708,35.8636,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,60041.84226,33.876423,0.0,0.0,9.0,43138.66035,32.908903,0.0,0.0,61.0,6.13
1/1/1995,Amber Valley,45424.80814,31.551992,0.0,0.0,114.0,66983.19796,32.574116,0.0,0.0,40407.89905,31.274357,0.0,0.0,33439.34928,30.722479,0.0,0.0,30527.41852,33.568263,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,63207.94539,31.262341,0.0,0.0,16.0,44721.87801,31.570205,0.0,0.0,98.0,6.13
1/1/1995,Arun,59473.60257,25.259505,0.0,0.0,222.0,95785.74537,25.677194,0.0,0.0,59760.25847,24.785972,0.0,0.0,47531.8149,23.787813,0.0,0.0,39097.34709,27.485736,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,67718.47861,24.467387,0.0,0.0,21.0,58827.71158,25.301688,0.0,0.0,201.0,6.13
1/1/1995,Ashfield,38911.87777,33.50047,0.0,0.0,97.0,56968.65464,35.040323,0.0,0.0,35332.04192,33.051218,0.0,0.0,28723.84563,32.349616,0.0,0.0,25217.73531,37.376892,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,48136.98634,32.748969,0.0,0.0,23.0,38664.77907,34.044514,0.0,0.0,74.0,6.13


In [25]:
# Write the 1995-onwards frame to the prepared-data folder
cleaned_csv = os.path.join(path, 'Data','Prepared Data', 'UK_HPI_CLEANED_1995.csv')
df_2.to_csv(cleaned_csv)