# Iteration 1 - Melbourne Pedestrian Counting System
This Jupyter Notebook prepares the 'Melbourne Pedestrian Counting System' CSV files for use in the Mo-Buddy website solution.
1. Read Raw Data
2. Clean Raw Data
3. Export Clean Data

In [27]:
# Import Packages
import pandas as pd

In [28]:
# Show every column when a dataframe is displayed (None removes the column limit)
pd.options.display.max_columns = None

## 1. Read in Raw Data from a CSV file

In [29]:
# Helper that loads one raw CSV file into a dataframe
def read_in_data(file_path):
    """
    Load a raw CSV file into a pandas dataframe.
    Inputs:
        - file_path, type: string, desc: Path of the CSV file to read
    Outputs:
        - type: dataframe, desc: File contents as parsed by pd.read_csv
          with its default settings (no cleaning is applied here)
    """
    return pd.read_csv(file_path)

In [30]:
# Months currently available to be read (note: May is not in this list)
months = ['January', 'February', 'March', 'April', 'June', 'July']

# Read every monthly file first and concatenate once at the end; growing a
# dataframe with pd.concat inside the loop copies all previous rows each time.
monthly_frames = []
for month in months:
    # A forward slash is accepted on Windows and POSIX alike, and avoids the
    # invalid '\P' escape sequence that the backslash form produced.
    filepath_raw_data = 'DataBases/Pedestrian_' + month + '_2021.csv'
    df_raw_data = read_in_data(filepath_raw_data)
    monthly_frames.append(df_raw_data)

# ignore_index=True (a real boolean) renumbers the rows 0..n-1 across all months
df_raw_full = pd.concat(monthly_frames, ignore_index=True)

In [31]:
# Display the combined dataframe to check that the monthly files were
# concatenated into a single frame (the bare last expression is rendered
# by the notebook as the cell output).
df_raw_full

Unnamed: 0,Date,Hour,Bourke Street Mall (North),Bourke Street Mall (South),Melbourne Central,Town Hall (West),Princes Bridge,Flinders Street Station Underpass,Birrarung Marr,Webb Bridge,Southern Cross Station,Victoria Point,Waterfront City,New Quay,Flagstaff Station,Sandridge Bridge,State Library,Collins St (North),Collins Place (South),Collins Place (North),Chinatown-Swanston St (North),Chinatown-Lt Bourke St (South),Bourke St-Russell St (West),Flinders St-Elizabeth St (East),Spencer St-Collins St (South),Spencer St-Collins St (North),Melbourne Convention Exhibition Centre,QV Market-Elizabeth St (West),QV Market-Peel St,The Arts Centre,St Kilda Rd-Alexandra Gardens,Lonsdale St (South),Lygon St (West),City Square,Flinders St-Spring St (West),Flinders St-Spark La,Southbank,Queen St (West),Lygon St (East),Flinders St-Swanston St (West),Alfred Place,Lonsdale St-Spring St (West),Grattan St-Swanston St (West),Monash Rd-Swanston St (West),Tin Alley-Swanston St (West),Little Collins St-Swanston St (East),Flinders La-Swanston St (West),Pelham St (South),Melbourne Central-Elizabeth St (East),QVM-Queen St (East),QVM-Therry St (South),Faraday St-Lygon St (West),QVM-Franklin St (North),Elizabeth St-Lonsdale St (South),Lincoln-Swanston (W),Elizabeth St-La Trobe St (East),Lonsdale St - Elizabeth St (North),Bourke St Bridge,Bourke St - Spencer St (North),RMIT Bld 80 - 445 Swanston Street,Flinders La-Swanston St (West) Temporary,RMIT Building 14,380 Elizabeth St,La Trobe St (North),231 Bourke St,Royal Pde - Grattan St,Swanston St - City Square,State Library - New,Flinders Ln - Degraves St (South),Flinders Ln - Degraves St (North),Flinders Ln - Degraves St (Crossing),Errol Street (East),Westwood Place,Flinders St - ACMI,Bourke St - Spencer St (South),Spring St - Flinders St (West),Macaulay Rd - Bellair St,Harbour Esplanade - Pedestrian Path,Harbour Esplanade - Bike Path
0,1/1/21,0,349,236,708,1461,3834,1678,250,270,62,60,308,988,-1,998,-1,196,79,33,413,500,575,1608,264,356,1093,171,50,753,9,446,119,undefined,-1,79,3579,201,107,undefined,14,86,9,3,5,638,2556,8,588,65,75,67,54,438,12,undefined,153,95,213,84,-1,183,769,95,424,15,747,697,-1,-1,-1,-1,12,742,124,-1,undefined,undefined,undefined
1,1/1/21,1,246,174,482,860,2123,1215,1027,112,34,56,72,349,-1,612,-1,159,51,30,341,302,506,1281,235,287,856,229,51,325,25,500,90,undefined,-1,47,1651,138,70,undefined,9,54,14,13,9,421,1716,14,494,78,112,49,73,401,15,undefined,151,116,298,62,-1,175,680,115,374,7,407,404,-1,-1,-1,-1,5,234,130,6,undefined,undefined,undefined
2,1/1/21,2,173,122,418,597,1057,862,58,71,35,31,24,178,-1,395,-1,122,62,26,224,130,331,993,159,267,292,192,35,235,22,325,40,undefined,-1,20,758,129,38,undefined,11,43,10,5,6,358,1160,7,390,50,64,30,46,307,13,undefined,155,59,152,65,-1,88,517,144,250,14,370,336,-1,-1,-1,13,8,133,116,-1,undefined,undefined,undefined
3,1/1/21,3,134,75,323,393,607,495,44,59,27,32,15,63,-1,310,-1,53,21,5,119,128,339,765,87,169,214,222,35,171,4,296,24,undefined,-1,10,246,57,4,undefined,11,23,12,6,3,277,1027,2,358,51,91,11,28,266,27,undefined,151,27,120,68,-1,96,439,92,211,13,204,165,-1,-1,-1,-1,3,55,108,-1,undefined,undefined,undefined
4,1/1/21,4,106,82,240,242,337,321,30,14,12,9,5,37,-1,230,-1,39,10,7,88,102,162,424,78,117,210,138,22,71,3,198,8,undefined,-1,5,167,74,15,undefined,-1,5,12,5,3,90,499,7,222,29,62,6,20,127,12,undefined,64,10,60,40,-1,35,308,65,123,6,57,98,-1,-1,-1,-1,5,44,30,-1,undefined,undefined,undefined
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
4339,31/7/21,19,889,253,277,1017,634,854,11,21,15,-1,8,23,-1,114,-1,166,113,17,1775,678,771,946,51,405,299,110,106,218,49,807,487,undefined,-1,2,694,100,609,undefined,28,153,32,18,8,383,1214,18,513,128,59,559,97,346,66,undefined,374,58,46,77,-1,137,1010,172,352,15,100,735,162,2,7,232,32,141,-1,-1,18,16,2
4340,31/7/21,20,305,138,317,654,347,477,7,166,15,-1,3,13,-1,67,-1,110,92,12,1291,517,665,751,51,403,136,35,47,141,18,829,463,undefined,-1,4,489,124,524,undefined,19,159,23,17,10,279,848,11,414,103,33,531,34,260,48,undefined,231,44,28,53,-1,122,582,135,312,7,69,580,123,3,5,156,1,153,-1,-1,7,10,4
4341,31/7/21,21,283,78,414,480,282,354,5,10,15,-1,5,22,-1,49,-1,79,69,16,1093,436,588,583,66,274,225,44,52,91,25,917,425,undefined,-1,1,68,194,399,undefined,8,108,19,18,8,277,642,23,281,65,39,253,54,266,48,undefined,183,17,29,48,-1,79,597,93,208,9,103,446,103,5,8,195,9,89,-1,-1,18,4,6
4342,31/7/21,22,175,107,390,344,217,404,2,9,10,-1,3,17,-1,81,-1,98,65,6,843,473,614,641,51,320,226,18,45,115,14,620,373,undefined,-1,6,68,118,304,undefined,16,114,18,29,8,248,645,3,238,80,31,267,40,181,23,undefined,112,23,30,40,-1,80,510,136,277,4,72,417,43,2,1,73,9,108,-1,-1,1,15,4


There are values less than 0 (negative), which would mean a negative pedestrian count. One solution is to set those entries to 0; another is to delete them. Because of the solution that has to be provided to the web page, the selected option is to impute those values with 0. Similarly, there are undefined values. In this case, the solution is to first impute a negative value (-1) and then proceed as in the previous case (negative value). For example:
- Flagstaff Station --> -1
- State Library --> -1
- City Square --> undefined
- Flinders St-Spring St (West) --> -1
- Flinders St-Swanston St (West) --> undefined
- Elizabeth St-La Trobe St (East) --> undefined
- Flinders La-Swanston St (West) Temporary --> -1

## 2. Clean up Raw Data
1. Exploratory Data Analysis
2. Check Missing Data 
 - Check Undefined -> change from 'undefined' to '-1'
 - Check Negative Values -> change from '-1' to 0
3. Split Date --> Day - Month - Year

In [32]:
# Street (sensor) column labels: everything after the first two columns.
# This is positional, so it must run before the Day/Month/Year columns are
# inserted further down, otherwise the slice would no longer start at the
# first street column.
all_streets = df_raw_full.columns[2:]

### 2.1. Missing Data

In [33]:
# Replace the 'undefined' marker with -1 in every street column and cast the
# column to integer, so that undefined readings can be handled together with
# the negative readings in the next step.
for street in all_streets:
    street_values = df_raw_full[street]
    df_raw_full[street] = street_values.mask(street_values == 'undefined', -1).astype('int')

In [34]:
# Check whether the imputation is done: summary statistics for every column.
# include='all' also summarises the non-numeric Date column
# (count / unique / top / freq) alongside the numeric ones.
df_raw_full.describe(include='all')

Unnamed: 0,Date,Hour,Bourke Street Mall (North),Bourke Street Mall (South),Melbourne Central,Town Hall (West),Princes Bridge,Flinders Street Station Underpass,Birrarung Marr,Webb Bridge,Southern Cross Station,Victoria Point,Waterfront City,New Quay,Flagstaff Station,Sandridge Bridge,State Library,Collins St (North),Collins Place (South),Collins Place (North),Chinatown-Swanston St (North),Chinatown-Lt Bourke St (South),Bourke St-Russell St (West),Flinders St-Elizabeth St (East),Spencer St-Collins St (South),Spencer St-Collins St (North),Melbourne Convention Exhibition Centre,QV Market-Elizabeth St (West),QV Market-Peel St,The Arts Centre,St Kilda Rd-Alexandra Gardens,Lonsdale St (South),Lygon St (West),City Square,Flinders St-Spring St (West),Flinders St-Spark La,Southbank,Queen St (West),Lygon St (East),Flinders St-Swanston St (West),Alfred Place,Lonsdale St-Spring St (West),Grattan St-Swanston St (West),Monash Rd-Swanston St (West),Tin Alley-Swanston St (West),Little Collins St-Swanston St (East),Flinders La-Swanston St (West),Pelham St (South),Melbourne Central-Elizabeth St (East),QVM-Queen St (East),QVM-Therry St (South),Faraday St-Lygon St (West),QVM-Franklin St (North),Elizabeth St-Lonsdale St (South),Lincoln-Swanston (W),Elizabeth St-La Trobe St (East),Lonsdale St - Elizabeth St (North),Bourke St Bridge,Bourke St - Spencer St (North),RMIT Bld 80 - 445 Swanston Street,Flinders La-Swanston St (West) Temporary,RMIT Building 14,380 Elizabeth St,La Trobe St (North),231 Bourke St,Royal Pde - Grattan St,Swanston St - City Square,State Library - New,Flinders Ln - Degraves St (South),Flinders Ln - Degraves St (North),Flinders Ln - Degraves St (Crossing),Errol Street (East),Westwood Place,Flinders St - ACMI,Bourke St - Spencer St (South),Spring St - Flinders St (West),Macaulay Rd - Bellair St,Harbour Esplanade - Pedestrian Path,Harbour Esplanade - Bike Path
count,4344,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0
unique,181,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
top,2/6/21,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
freq,24,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
mean,,11.5,621.180939,366.581722,287.129144,761.585175,800.877532,575.428867,144.064917,126.593923,143.270028,48.274171,42.418278,159.264273,-1.0,210.657459,-1.0,324.645718,195.999309,102.64802,295.636971,174.003453,307.972145,823.697284,145.156768,444.361648,489.546271,302.200967,81.843002,552.84047,106.121087,259.382827,154.234346,-1.0,-1.0,46.858656,267.718232,131.790516,104.437155,-1.0,59.395718,117.658379,80.577578,75.470994,33.708794,367.479742,1053.666897,31.513122,490.023481,133.560773,92.316989,187.614411,84.633287,187.262201,46.837477,-1.0,167.801565,231.985727,306.904696,255.77279,-1.0,190.225599,587.743324,103.798112,234.364871,85.265654,265.050645,451.948895,247.007597,121.387431,92.05732,105.315608,27.216851,189.766344,51.31837,34.472836,41.008517,74.082413,15.481123
std,,6.922983,739.895795,443.851973,327.491371,750.791072,782.454474,483.095128,247.646802,116.69179,230.169132,46.053039,43.426264,162.012221,0.0,171.998359,0.0,364.900815,219.51099,139.146496,307.079371,207.602337,278.893551,636.2528,145.967392,410.263168,455.934635,272.844115,78.614893,604.002189,207.429109,240.060705,168.021579,0.0,0.0,51.476709,393.873665,136.390528,112.014074,0.0,78.168228,115.153848,97.290722,103.042764,39.478808,367.195288,929.242819,35.177741,441.682904,142.558226,78.112904,176.040075,65.77904,165.763085,47.653213,0.0,143.331119,602.560459,287.256114,272.59108,0.0,171.922182,440.931072,76.095027,234.379623,112.65981,269.950465,517.534659,262.151856,151.207653,116.836286,116.126889,32.27844,213.913283,88.838042,38.991432,53.878926,130.117935,34.844725
min,,0.0,-1.0,-1.0,-1.0,1.0,6.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,7.0,-1.0,5.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,1.0,-1.0,4.0,-1.0,1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,9.0,1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0,-1.0
25%,,5.75,42.0,33.0,21.0,106.0,128.0,138.0,17.0,13.0,18.0,8.0,7.0,26.0,-1.0,57.75,-1.0,34.0,30.0,5.0,37.0,22.0,62.0,218.25,32.0,104.75,101.0,83.0,15.0,69.75,8.0,58.75,25.0,-1.0,-1.0,9.0,-1.0,22.0,15.0,-1.0,7.0,18.0,13.0,7.0,4.0,52.0,215.0,5.0,96.0,24.0,43.0,14.0,23.0,30.0,10.0,-1.0,34.0,3.75,69.0,33.0,-1.0,35.75,169.0,37.0,23.0,4.0,41.0,23.0,5.0,0.0,1.0,3.0,4.0,27.0,-1.0,6.0,-1.0,-1.0,-1.0
50%,,11.5,249.5,146.0,132.0,469.0,560.0,489.0,97.0,104.0,56.0,40.0,33.0,131.0,-1.0,182.0,-1.0,153.0,125.0,42.0,159.5,90.0,222.5,755.5,104.0,351.0,378.0,229.0,66.5,306.5,35.0,189.0,102.0,-1.0,-1.0,35.0,41.0,86.0,80.0,-1.0,31.0,87.0,47.0,36.0,19.0,244.5,776.0,21.0,345.5,100.0,75.0,145.0,79.0,147.5,31.0,-1.0,132.0,71.0,214.0,159.0,-1.0,149.0,530.0,95.0,178.0,39.0,184.0,205.5,147.0,33.0,29.0,51.0,15.0,115.0,2.0,29.0,5.0,-1.0,-1.0
75%,,17.25,1130.0,637.5,528.25,1339.0,1264.5,894.0,180.25,213.0,160.0,71.0,62.0,231.0,-1.0,322.0,-1.0,572.0,287.0,152.0,495.25,252.0,496.0,1311.0,204.0,658.0,736.0,417.25,121.0,874.0,123.0,399.0,222.0,-1.0,-1.0,72.0,427.25,211.0,157.0,-1.0,83.0,187.0,103.0,99.0,50.0,591.25,1754.0,45.0,825.0,188.25,112.0,327.0,128.25,319.0,71.0,-1.0,288.25,229.0,482.25,419.0,-1.0,300.0,959.0,155.0,394.0,127.0,412.0,813.0,468.0,238.0,180.0,196.0,39.0,273.0,75.0,54.0,88.0,124.0,9.25


In [35]:
# Impute 0 wherever a street column holds a negative count
street_counts = df_raw_full[all_streets]
df_raw_full[all_streets] = street_counts.mask(street_counts < 0, 0)

In [36]:
# Check whether the imputation is done: after replacing negatives with 0,
# the 'min' row of every street column should be 0 or greater.
df_raw_full.describe(include='all')

Unnamed: 0,Date,Hour,Bourke Street Mall (North),Bourke Street Mall (South),Melbourne Central,Town Hall (West),Princes Bridge,Flinders Street Station Underpass,Birrarung Marr,Webb Bridge,Southern Cross Station,Victoria Point,Waterfront City,New Quay,Flagstaff Station,Sandridge Bridge,State Library,Collins St (North),Collins Place (South),Collins Place (North),Chinatown-Swanston St (North),Chinatown-Lt Bourke St (South),Bourke St-Russell St (West),Flinders St-Elizabeth St (East),Spencer St-Collins St (South),Spencer St-Collins St (North),Melbourne Convention Exhibition Centre,QV Market-Elizabeth St (West),QV Market-Peel St,The Arts Centre,St Kilda Rd-Alexandra Gardens,Lonsdale St (South),Lygon St (West),City Square,Flinders St-Spring St (West),Flinders St-Spark La,Southbank,Queen St (West),Lygon St (East),Flinders St-Swanston St (West),Alfred Place,Lonsdale St-Spring St (West),Grattan St-Swanston St (West),Monash Rd-Swanston St (West),Tin Alley-Swanston St (West),Little Collins St-Swanston St (East),Flinders La-Swanston St (West),Pelham St (South),Melbourne Central-Elizabeth St (East),QVM-Queen St (East),QVM-Therry St (South),Faraday St-Lygon St (West),QVM-Franklin St (North),Elizabeth St-Lonsdale St (South),Lincoln-Swanston (W),Elizabeth St-La Trobe St (East),Lonsdale St - Elizabeth St (North),Bourke St Bridge,Bourke St - Spencer St (North),RMIT Bld 80 - 445 Swanston Street,Flinders La-Swanston St (West) Temporary,RMIT Building 14,380 Elizabeth St,La Trobe St (North),231 Bourke St,Royal Pde - Grattan St,Swanston St - City Square,State Library - New,Flinders Ln - Degraves St (South),Flinders Ln - Degraves St (North),Flinders Ln - Degraves St (Crossing),Errol Street (East),Westwood Place,Flinders St - ACMI,Bourke St - Spencer St (South),Spring St - Flinders St (West),Macaulay Rd - Bellair St,Harbour Esplanade - Pedestrian Path,Harbour Esplanade - Bike Path
count,4344,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0,4344.0
unique,181,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
top,2/6/21,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
freq,24,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
mean,,11.5,621.228821,366.582182,287.315608,761.585175,800.877532,575.429098,144.094383,126.643186,143.287063,48.321133,42.474217,159.268416,0.0,210.662523,0.0,324.648711,196.001611,102.757827,295.639963,174.009438,307.981814,823.70511,145.159761,444.36326,489.561924,302.200967,81.851289,552.84047,106.194291,259.383517,154.243785,0.0,0.0,46.907228,268.087017,131.816068,104.452578,0.0,59.478821,117.678867,80.594843,75.533149,33.81814,367.480203,1053.666897,31.584254,490.023481,133.562615,92.316989,187.629144,84.634899,187.264273,46.856354,0.0,167.808011,232.191759,306.904926,255.774401,0.0,190.226289,587.743324,103.798112,234.49977,85.421961,265.054558,452.100599,247.206262,121.586096,92.255985,105.505064,27.288444,189.793738,51.815378,34.584254,41.38582,74.583564,16.10267
std,,6.922983,739.855552,443.851592,327.327471,750.791072,782.454474,483.094854,247.629595,116.6381,230.158488,46.003241,43.370895,162.008133,0.0,171.99214,0.0,364.898148,219.508929,139.065011,307.076485,207.597304,278.882854,636.242658,145.964405,410.26142,455.917806,272.844115,78.60621,604.002189,207.391456,240.059957,168.012885,0.0,0.0,51.431969,393.622221,136.365733,111.99962,0.0,78.104466,115.132817,97.276328,102.9969,39.38377,367.194826,929.242819,35.112861,441.682904,142.556494,78.112904,176.024327,65.776954,165.760738,47.63445,0.0,143.323548,602.480907,287.255868,272.589565,0.0,171.921416,440.931072,76.095027,234.244336,112.540618,269.946615,517.401964,261.964104,151.047258,116.678592,115.953932,32.216812,213.888908,88.546206,38.891186,53.586067,129.829329,34.552826
min,,0.0,0.0,0.0,0.0,1.0,6.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,7.0,0.0,5.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,4.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,9.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
25%,,5.75,42.0,33.0,21.0,106.0,128.0,138.0,17.0,13.0,18.0,8.0,7.0,26.0,0.0,57.75,0.0,34.0,30.0,5.0,37.0,22.0,62.0,218.25,32.0,104.75,101.0,83.0,15.0,69.75,8.0,58.75,25.0,0.0,0.0,9.0,0.0,22.0,15.0,0.0,7.0,18.0,13.0,7.0,4.0,52.0,215.0,5.0,96.0,24.0,43.0,14.0,23.0,30.0,10.0,0.0,34.0,3.75,69.0,33.0,0.0,35.75,169.0,37.0,23.0,4.0,41.0,23.0,5.0,0.0,1.0,3.0,4.0,27.0,0.0,6.0,0.0,0.0,0.0
50%,,11.5,249.5,146.0,132.0,469.0,560.0,489.0,97.0,104.0,56.0,40.0,33.0,131.0,0.0,182.0,0.0,153.0,125.0,42.0,159.5,90.0,222.5,755.5,104.0,351.0,378.0,229.0,66.5,306.5,35.0,189.0,102.0,0.0,0.0,35.0,41.0,86.0,80.0,0.0,31.0,87.0,47.0,36.0,19.0,244.5,776.0,21.0,345.5,100.0,75.0,145.0,79.0,147.5,31.0,0.0,132.0,71.0,214.0,159.0,0.0,149.0,530.0,95.0,178.0,39.0,184.0,205.5,147.0,33.0,29.0,51.0,15.0,115.0,2.0,29.0,5.0,0.0,0.0
75%,,17.25,1130.0,637.5,528.25,1339.0,1264.5,894.0,180.25,213.0,160.0,71.0,62.0,231.0,0.0,322.0,0.0,572.0,287.0,152.0,495.25,252.0,496.0,1311.0,204.0,658.0,736.0,417.25,121.0,874.0,123.0,399.0,222.0,0.0,0.0,72.0,427.25,211.0,157.0,0.0,83.0,187.0,103.0,99.0,50.0,591.25,1754.0,45.0,825.0,188.25,112.0,327.0,128.25,319.0,71.0,0.0,288.25,229.0,482.25,419.0,0.0,300.0,959.0,155.0,394.0,127.0,412.0,813.0,468.0,238.0,180.0,196.0,39.0,273.0,75.0,54.0,88.0,124.0,9.25


### 2.2. Split Date

In [37]:
# Break the 'Date' text (split on '/') into its parts and add them as new
# columns right after 'Date', at positions 1, 2 and 3.
# Day and Month are kept as the split strings; Year is the constant integer 2021.
# NOTE: DataFrame.insert refuses to add a column that already exists, so this
# cell is expected to fail if it is executed a second time on the same frame.
date_split = df_raw_full['Date'].str.split('/')
new_date_columns = [
    ('Day', date_split.str[0]),
    ('Month', date_split.str[1]),
    ('Year', 2021),
]
for position, (label, values) in enumerate(new_date_columns, start=1):
    df_raw_full.insert(position, label, values)

In [38]:
# Display the dataframe to confirm that the Day, Month and Year columns
# were inserted after Date.
df_raw_full

Unnamed: 0,Date,Day,Month,Year,Hour,Bourke Street Mall (North),Bourke Street Mall (South),Melbourne Central,Town Hall (West),Princes Bridge,Flinders Street Station Underpass,Birrarung Marr,Webb Bridge,Southern Cross Station,Victoria Point,Waterfront City,New Quay,Flagstaff Station,Sandridge Bridge,State Library,Collins St (North),Collins Place (South),Collins Place (North),Chinatown-Swanston St (North),Chinatown-Lt Bourke St (South),Bourke St-Russell St (West),Flinders St-Elizabeth St (East),Spencer St-Collins St (South),Spencer St-Collins St (North),Melbourne Convention Exhibition Centre,QV Market-Elizabeth St (West),QV Market-Peel St,The Arts Centre,St Kilda Rd-Alexandra Gardens,Lonsdale St (South),Lygon St (West),City Square,Flinders St-Spring St (West),Flinders St-Spark La,Southbank,Queen St (West),Lygon St (East),Flinders St-Swanston St (West),Alfred Place,Lonsdale St-Spring St (West),Grattan St-Swanston St (West),Monash Rd-Swanston St (West),Tin Alley-Swanston St (West),Little Collins St-Swanston St (East),Flinders La-Swanston St (West),Pelham St (South),Melbourne Central-Elizabeth St (East),QVM-Queen St (East),QVM-Therry St (South),Faraday St-Lygon St (West),QVM-Franklin St (North),Elizabeth St-Lonsdale St (South),Lincoln-Swanston (W),Elizabeth St-La Trobe St (East),Lonsdale St - Elizabeth St (North),Bourke St Bridge,Bourke St - Spencer St (North),RMIT Bld 80 - 445 Swanston Street,Flinders La-Swanston St (West) Temporary,RMIT Building 14,380 Elizabeth St,La Trobe St (North),231 Bourke St,Royal Pde - Grattan St,Swanston St - City Square,State Library - New,Flinders Ln - Degraves St (South),Flinders Ln - Degraves St (North),Flinders Ln - Degraves St (Crossing),Errol Street (East),Westwood Place,Flinders St - ACMI,Bourke St - Spencer St (South),Spring St - Flinders St (West),Macaulay Rd - Bellair St,Harbour Esplanade - Pedestrian Path,Harbour Esplanade - Bike Path
0,1/1/21,1,1,2021,0,349,236,708,1461,3834,1678,250,270,62,60,308,988,0,998,0,196,79,33,413,500,575,1608,264,356,1093,171,50,753,9,446,119,0,0,79,3579,201,107,0,14,86,9,3,5,638,2556,8,588,65,75,67,54,438,12,0,153,95,213,84,0,183,769,95,424,15,747,697,0,0,0,0,12,742,124,0,0,0,0
1,1/1/21,1,1,2021,1,246,174,482,860,2123,1215,1027,112,34,56,72,349,0,612,0,159,51,30,341,302,506,1281,235,287,856,229,51,325,25,500,90,0,0,47,1651,138,70,0,9,54,14,13,9,421,1716,14,494,78,112,49,73,401,15,0,151,116,298,62,0,175,680,115,374,7,407,404,0,0,0,0,5,234,130,6,0,0,0
2,1/1/21,1,1,2021,2,173,122,418,597,1057,862,58,71,35,31,24,178,0,395,0,122,62,26,224,130,331,993,159,267,292,192,35,235,22,325,40,0,0,20,758,129,38,0,11,43,10,5,6,358,1160,7,390,50,64,30,46,307,13,0,155,59,152,65,0,88,517,144,250,14,370,336,0,0,0,13,8,133,116,0,0,0,0
3,1/1/21,1,1,2021,3,134,75,323,393,607,495,44,59,27,32,15,63,0,310,0,53,21,5,119,128,339,765,87,169,214,222,35,171,4,296,24,0,0,10,246,57,4,0,11,23,12,6,3,277,1027,2,358,51,91,11,28,266,27,0,151,27,120,68,0,96,439,92,211,13,204,165,0,0,0,0,3,55,108,0,0,0,0
4,1/1/21,1,1,2021,4,106,82,240,242,337,321,30,14,12,9,5,37,0,230,0,39,10,7,88,102,162,424,78,117,210,138,22,71,3,198,8,0,0,5,167,74,15,0,0,5,12,5,3,90,499,7,222,29,62,6,20,127,12,0,64,10,60,40,0,35,308,65,123,6,57,98,0,0,0,0,5,44,30,0,0,0,0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
4339,31/7/21,31,7,2021,19,889,253,277,1017,634,854,11,21,15,0,8,23,0,114,0,166,113,17,1775,678,771,946,51,405,299,110,106,218,49,807,487,0,0,2,694,100,609,0,28,153,32,18,8,383,1214,18,513,128,59,559,97,346,66,0,374,58,46,77,0,137,1010,172,352,15,100,735,162,2,7,232,32,141,0,0,18,16,2
4340,31/7/21,31,7,2021,20,305,138,317,654,347,477,7,166,15,0,3,13,0,67,0,110,92,12,1291,517,665,751,51,403,136,35,47,141,18,829,463,0,0,4,489,124,524,0,19,159,23,17,10,279,848,11,414,103,33,531,34,260,48,0,231,44,28,53,0,122,582,135,312,7,69,580,123,3,5,156,1,153,0,0,7,10,4
4341,31/7/21,31,7,2021,21,283,78,414,480,282,354,5,10,15,0,5,22,0,49,0,79,69,16,1093,436,588,583,66,274,225,44,52,91,25,917,425,0,0,1,68,194,399,0,8,108,19,18,8,277,642,23,281,65,39,253,54,266,48,0,183,17,29,48,0,79,597,93,208,9,103,446,103,5,8,195,9,89,0,0,18,4,6
4342,31/7/21,31,7,2021,22,175,107,390,344,217,404,2,9,10,0,3,17,0,81,0,98,65,6,843,473,614,641,51,320,226,18,45,115,14,620,373,0,0,6,68,118,304,0,16,114,18,29,8,248,645,3,238,80,31,267,40,181,23,0,112,23,30,40,0,80,510,136,277,4,72,417,43,2,1,73,9,108,0,0,1,15,4


## 3. Export Clean Data to a CSV file

In [39]:
# Write the cleaned dataframe to a CSV file in the current working directory.
# to_csv is called with its defaults, so the row index is written too
# (as the first, unnamed column).
df_raw_full.to_csv(path_or_buf='OK_Pedestrian_Melbourne_01_to_07_V1.csv')