# 1.2 Scaling Weather Dataset

#### Contents:

1. Installing Libraries
2. Importing Libraries
3. Importing Datasets
4. Scaling Data
5. Export Dataset

## 1. Installing Libraries

In [38]:
pip install pyarrow

Defaulting to user installation because normal site-packages is not writeable
Looking in links: /usr/share/pip-wheels
Note: you may need to restart the kernel to use updated packages.


## 2. Importing Libraries

In [36]:
import pandas as pd
import numpy as np
import seaborn as sns
import matplotlib
import matplotlib.pyplot as plt
import os
import sklearn
from sklearn.preprocessing import StandardScaler

## 3. Importing Datasets

In [3]:
# Project root folder. The original location is kept as the default; set the
# CLIMATEWINS_PATH environment variable to run the notebook from another
# machine or folder without editing this cell.
path = os.environ.get('CLIMATEWINS_PATH', r'/home/0668a905-109d-4403-be59-0a04abf51dd9/ClimateWins Analysis')

In [6]:
# Load the processed weather dataset from the project's original-data folder.
# index_col=False tells pandas not to use the first CSV column as the row index.
df = pd.read_csv(
    os.path.join(path, '01 Datasets', '01 Original Data', 'Dataset-weather-prediction-dataset-processed.csv'),
    index_col=False,
)

In [8]:
# Remove the column display limit so wide frames are shown in full.
pd.options.display.max_columns = None

In [10]:
# Remove the row display limit so long outputs (e.g. per-column summaries) are not truncated.
pd.options.display.max_rows = None

## 4. Scaling Data

### 4.1 Select Columns to Scale

In [12]:
# Preview the first three rows to see which columns the dataset contains.
df.head(3)

Unnamed: 0,DATE,MONTH,BASEL_cloud_cover,BASEL_wind_speed,BASEL_humidity,BASEL_pressure,BASEL_global_radiation,BASEL_precipitation,BASEL_snow_depth,BASEL_sunshine,BASEL_temp_mean,BASEL_temp_min,BASEL_temp_max,BELGRADE_cloud_cover,BELGRADE_humidity,BELGRADE_pressure,BELGRADE_global_radiation,BELGRADE_precipitation,BELGRADE_sunshine,BELGRADE_temp_mean,BELGRADE_temp_min,BELGRADE_temp_max,BUDAPEST_cloud_cover,BUDAPEST_humidity,BUDAPEST_pressure,BUDAPEST_global_radiation,BUDAPEST_precipitation,BUDAPEST_sunshine,BUDAPEST_temp_mean,BUDAPEST_temp_min,BUDAPEST_temp_max,DEBILT_cloud_cover,DEBILT_wind_speed,DEBILT_humidity,DEBILT_pressure,DEBILT_global_radiation,DEBILT_precipitation,DEBILT_sunshine,DEBILT_temp_mean,DEBILT_temp_min,DEBILT_temp_max,DUSSELDORF_cloud_cover,DUSSELDORF_wind_speed,DUSSELDORF_humidity,DUSSELDORF_pressure,DUSSELDORF_global_radiation,DUSSELDORF_precipitation,DUSSELDORF_snow_depth,DUSSELDORF_sunshine,DUSSELDORF_temp_mean,DUSSELDORF_temp_min,DUSSELDORF_temp_max,GDANSK_cloud_cover,GDANSK_humidity,GDANSK_precipitation,GDANSK_snow_depth,GDANSK_temp_mean,GDANSK_temp_min,GDANSK_temp_max,HEATHROW_cloud_cover,HEATHROW_humidity,HEATHROW_pressure,HEATHROW_global_radiation,HEATHROW_precipitation,HEATHROW_snow_depth,HEATHROW_sunshine,HEATHROW_temp_mean,HEATHROW_temp_min,HEATHROW_temp_max,KASSEL_wind_speed,KASSEL_humidity,KASSEL_pressure,KASSEL_global_radiation,KASSEL_precipitation,KASSEL_sunshine,KASSEL_temp_mean,KASSEL_temp_min,KASSEL_temp_max,LJUBLJANA_cloud_cover,LJUBLJANA_wind_speed,LJUBLJANA_humidity,LJUBLJANA_pressure,LJUBLJANA_global_radiation,LJUBLJANA_precipitation,LJUBLJANA_sunshine,LJUBLJANA_temp_mean,LJUBLJANA_temp_min,LJUBLJANA_temp_max,MAASTRICHT_cloud_cover,MAASTRICHT_wind_speed,MAASTRICHT_humidity,MAASTRICHT_pressure,MAASTRICHT_global_radiation,MAASTRICHT_precipitation,MAASTRICHT_sunshine,MAASTRICHT_temp_mean,MAASTRICHT_temp_min,MAASTRICHT_temp_max,MADRID_cloud_cover,MADRID_wind_speed,MADRID_humidity,MADRID_pressure,MADRID_global_radiation,MADRID_prec
ipitation,MADRID_sunshine,MADRID_temp_mean,MADRID_temp_min,MADRID_temp_max,MUNCHENB_cloud_cover,MUNCHENB_humidity,MUNCHENB_global_radiation,MUNCHENB_precipitation,MUNCHENB_snow_depth,MUNCHENB_sunshine,MUNCHENB_temp_mean,MUNCHENB_temp_min,MUNCHENB_temp_max,OSLO_cloud_cover,OSLO_wind_speed,OSLO_humidity,OSLO_pressure,OSLO_global_radiation,OSLO_precipitation,OSLO_snow_depth,OSLO_sunshine,OSLO_temp_mean,OSLO_temp_min,OSLO_temp_max,ROMA_cloud_cover,ROMA_wind_speed,ROMA_humidity,ROMA_pressure,ROMA_sunshine,ROMA_temp_mean,SONNBLICK_cloud_cover,SONNBLICK_wind_speed,SONNBLICK_humidity,SONNBLICK_pressure,SONNBLICK_global_radiation,SONNBLICK_precipitation,SONNBLICK_sunshine,SONNBLICK_temp_mean,SONNBLICK_temp_min,SONNBLICK_temp_max,STOCKHOLM_cloud_cover,STOCKHOLM_pressure,STOCKHOLM_global_radiation,STOCKHOLM_precipitation,STOCKHOLM_sunshine,STOCKHOLM_temp_mean,STOCKHOLM_temp_min,STOCKHOLM_temp_max,TOURS_wind_speed,TOURS_humidity,TOURS_pressure,TOURS_global_radiation,TOURS_precipitation,TOURS_temp_mean,TOURS_temp_min,TOURS_temp_max,VALENTIA_cloud_cover,VALENTIA_humidity,VALENTIA_pressure,VALENTIA_global_radiation,VALENTIA_precipitation,VALENTIA_snow_depth,VALENTIA_sunshine,VALENTIA_temp_mean,VALENTIA_temp_min,VALENTIA_temp_max
0,19600101,1,7,2.1,0.85,1.018,0.32,0.09,0,0.7,6.5,0.8,10.9,1,0.81,1.0195,0.88,0.0,7.0,3.7,-0.9,7.9,4,0.67,1.017,0.44,0.01,2.3,2.4,-0.4,5.1,7,7.7,0.85,1.0032,0.07,0.25,0.0,9.3,7.4,11.0,8,5.4,0.83,1.0161,0.12,0.08,0,0.0,10.0,7.0,11.5,8,0.91,0.0,0,0.8,-0.3,1.6,7,0.91,1.001,0.13,0.22,0,0.0,10.6,9.4,8.3,2.9,0.82,1.0094,0.28,0.48,1.6,7.9,3.9,9.4,8,1.4,1.0,1.0173,0.2,0.0,0.0,-0.6,-1.9,0.5,7,8.7,0.83,1.0063,0.22,0.32,1.0,9.5,8.5,11.1,6,0.0,0.92,1.026,0.53,0.0,1.4,7.6,4.4,10.8,5,0.67,0.2,0.1,0,0.0,6.9,1.1,10.4,8,4.0,0.98,0.9978,0.04,1.14,0,0.0,4.9,3.8,5.9,3,2.6,0.73,1.0152,7.1,7.8,4,4.5,0.73,1.0304,0.48,0.01,2.3,-5.9,-8.5,-3.2,5,1.0114,0.05,0.32,0.0,4.2,2.2,4.9,3.8,0.76,1.0169,1.54,0.44,10.0,7.8,12.2,5,0.88,1.0003,0.45,0.34,0,4.7,8.5,6.0,10.9
1,19600102,1,6,2.1,0.84,1.018,0.36,1.05,0,1.1,6.1,3.3,10.1,6,0.84,1.0172,0.25,0.0,0.0,2.9,2.2,4.4,4,0.67,1.017,0.18,0.31,0.0,2.3,1.4,3.1,8,4.1,0.9,1.0056,0.14,0.06,0.1,7.7,6.4,8.3,8,3.6,0.89,1.0161,0.18,0.66,0,0.5,8.2,7.4,11.0,8,0.93,0.08,0,1.6,0.9,2.2,7,0.98,1.0051,0.13,0.23,0,0.0,6.1,3.9,10.6,1.9,0.86,1.0086,0.12,0.27,0.0,7.7,6.8,9.1,6,1.4,0.94,1.0173,0.56,0.13,3.2,2.1,-1.3,5.5,8,5.7,0.92,1.0062,0.17,1.34,0.4,8.6,7.5,9.9,7,0.8,0.86,1.0254,0.46,0.0,0.9,9.8,7.4,12.2,6,0.72,0.61,0.3,0,5.1,6.2,4.2,10.2,8,5.1,0.62,1.0139,0.04,0.0,0,0.0,3.4,2.8,4.9,3,2.6,0.73,1.0152,7.1,12.2,6,6.7,0.97,1.0292,0.21,0.61,0.0,-9.5,-10.5,-8.5,5,1.0114,0.05,0.06,0.0,4.0,3.0,5.0,3.8,0.76,1.0169,1.54,0.71,9.5,7.0,12.0,7,0.91,1.0007,0.25,0.84,0,0.7,8.9,5.6,12.1
2,19600103,1,8,2.1,0.9,1.018,0.18,0.3,0,0.0,8.5,5.1,9.9,6,0.77,1.0179,0.67,0.0,3.5,3.1,-0.5,6.4,4,0.67,1.017,0.3,0.0,0.6,2.7,1.7,5.3,6,3.1,0.92,1.0165,0.28,0.01,3.0,6.8,4.6,9.9,7,3.1,0.95,1.0161,0.12,0.07,0,0.0,7.1,6.9,9.1,8,0.94,0.15,0,0.7,0.4,1.7,8,0.96,1.0166,0.15,0.07,0,0.1,8.4,6.1,12.2,1.3,0.91,1.0129,0.12,0.6,0.0,6.5,6.0,8.0,8,1.4,0.96,1.0173,0.2,0.12,0.0,4.6,0.9,6.3,7,3.6,0.97,1.0167,0.12,0.46,0.0,6.9,5.5,9.9,5,1.9,0.9,1.0287,0.63,0.0,2.3,8.6,6.4,10.8,6,0.91,0.2,0.3,0,0.0,5.8,4.0,8.0,8,2.3,0.69,1.0234,0.04,0.08,0,0.0,1.9,0.6,3.1,3,2.6,0.73,1.0152,7.1,10.2,8,7.5,0.93,1.032,0.21,3.2,0.0,-9.5,-10.0,-8.9,5,1.0114,0.05,0.02,0.0,2.4,1.3,4.1,3.8,0.76,1.0169,1.54,0.1,10.3,9.0,11.6,7,0.91,1.0096,0.17,0.08,0,0.1,10.5,8.1,12.9


In [14]:
# List the dtype of every column before deciding what to scale.
df.dtypes

DATE                             int64
MONTH                            int64
BASEL_cloud_cover                int64
BASEL_wind_speed               float64
BASEL_humidity                 float64
BASEL_pressure                 float64
BASEL_global_radiation         float64
BASEL_precipitation            float64
BASEL_snow_depth                 int64
BASEL_sunshine                 float64
BASEL_temp_mean                float64
BASEL_temp_min                 float64
BASEL_temp_max                 float64
BELGRADE_cloud_cover             int64
BELGRADE_humidity              float64
BELGRADE_pressure              float64
BELGRADE_global_radiation      float64
BELGRADE_precipitation         float64
BELGRADE_sunshine              float64
BELGRADE_temp_mean             float64
BELGRADE_temp_min              float64
BELGRADE_temp_max              float64
BUDAPEST_cloud_cover             int64
BUDAPEST_humidity              float64
BUDAPEST_pressure              float64
BUDAPEST_global_radiation

In [42]:
# Remember the column order of the loaded frame as a plain list of names.
original_order = list(df.columns)

In [44]:
# Columns that are excluded from scaling; keep them aside as their own frame
# so they can be re-attached after scaling.
cols_to_drop = ['DATE', 'MONTH']
dropped_cols = df.loc[:, cols_to_drop]
dropped_cols.head(1)

Unnamed: 0,DATE,MONTH
0,19600101,1


In [46]:
# Build the frame that will be scaled: every column except those in cols_to_drop.
df_scaled = df.drop(cols_to_drop, axis='columns')

### 4.2 Checking for Missing Data

In [49]:
# Count missing values per column (the displayed counts are all zero).
df_scaled.isna().sum()

BASEL_cloud_cover              0
BASEL_wind_speed               0
BASEL_humidity                 0
BASEL_pressure                 0
BASEL_global_radiation         0
BASEL_precipitation            0
BASEL_snow_depth               0
BASEL_sunshine                 0
BASEL_temp_mean                0
BASEL_temp_min                 0
BASEL_temp_max                 0
BELGRADE_cloud_cover           0
BELGRADE_humidity              0
BELGRADE_pressure              0
BELGRADE_global_radiation      0
BELGRADE_precipitation         0
BELGRADE_sunshine              0
BELGRADE_temp_mean             0
BELGRADE_temp_min              0
BELGRADE_temp_max              0
BUDAPEST_cloud_cover           0
BUDAPEST_humidity              0
BUDAPEST_pressure              0
BUDAPEST_global_radiation      0
BUDAPEST_precipitation         0
BUDAPEST_sunshine              0
BUDAPEST_temp_mean             0
BUDAPEST_temp_min              0
BUDAPEST_temp_max              0
DEBILT_cloud_cover             0
DEBILT_win

### 4.3 Scaling

In [52]:
# Create the scaler object using StandardScaler from sklearn.preprocessing.
# With its default settings it standardizes each column to zero mean and unit variance.

scaler = StandardScaler()

In [54]:
# Fit the scaler on the selected columns and wrap the resulting array in a
# DataFrame that keeps the same column labels and row index.
df_scaled = pd.DataFrame(
    scaler.fit_transform(df_scaled),
    index=df_scaled.index,
    columns=df_scaled.columns,
)
df_scaled.head()

Unnamed: 0,BASEL_cloud_cover,BASEL_wind_speed,BASEL_humidity,BASEL_pressure,BASEL_global_radiation,BASEL_precipitation,BASEL_snow_depth,BASEL_sunshine,BASEL_temp_mean,BASEL_temp_min,BASEL_temp_max,BELGRADE_cloud_cover,BELGRADE_humidity,BELGRADE_pressure,BELGRADE_global_radiation,BELGRADE_precipitation,BELGRADE_sunshine,BELGRADE_temp_mean,BELGRADE_temp_min,BELGRADE_temp_max,BUDAPEST_cloud_cover,BUDAPEST_humidity,BUDAPEST_pressure,BUDAPEST_global_radiation,BUDAPEST_precipitation,BUDAPEST_sunshine,BUDAPEST_temp_mean,BUDAPEST_temp_min,BUDAPEST_temp_max,DEBILT_cloud_cover,DEBILT_wind_speed,DEBILT_humidity,DEBILT_pressure,DEBILT_global_radiation,DEBILT_precipitation,DEBILT_sunshine,DEBILT_temp_mean,DEBILT_temp_min,DEBILT_temp_max,DUSSELDORF_cloud_cover,DUSSELDORF_wind_speed,DUSSELDORF_humidity,DUSSELDORF_pressure,DUSSELDORF_global_radiation,DUSSELDORF_precipitation,DUSSELDORF_snow_depth,DUSSELDORF_sunshine,DUSSELDORF_temp_mean,DUSSELDORF_temp_min,DUSSELDORF_temp_max,GDANSK_cloud_cover,GDANSK_humidity,GDANSK_precipitation,GDANSK_snow_depth,GDANSK_temp_mean,GDANSK_temp_min,GDANSK_temp_max,HEATHROW_cloud_cover,HEATHROW_humidity,HEATHROW_pressure,HEATHROW_global_radiation,HEATHROW_precipitation,HEATHROW_snow_depth,HEATHROW_sunshine,HEATHROW_temp_mean,HEATHROW_temp_min,HEATHROW_temp_max,KASSEL_wind_speed,KASSEL_humidity,KASSEL_pressure,KASSEL_global_radiation,KASSEL_precipitation,KASSEL_sunshine,KASSEL_temp_mean,KASSEL_temp_min,KASSEL_temp_max,LJUBLJANA_cloud_cover,LJUBLJANA_wind_speed,LJUBLJANA_humidity,LJUBLJANA_pressure,LJUBLJANA_global_radiation,LJUBLJANA_precipitation,LJUBLJANA_sunshine,LJUBLJANA_temp_mean,LJUBLJANA_temp_min,LJUBLJANA_temp_max,MAASTRICHT_cloud_cover,MAASTRICHT_wind_speed,MAASTRICHT_humidity,MAASTRICHT_pressure,MAASTRICHT_global_radiation,MAASTRICHT_precipitation,MAASTRICHT_sunshine,MAASTRICHT_temp_mean,MAASTRICHT_temp_min,MAASTRICHT_temp_max,MADRID_cloud_cover,MADRID_wind_speed,MADRID_humidity,MADRID_pressure,MADRID_global_radiation,MADRID_precipitation,M
ADRID_sunshine,MADRID_temp_mean,MADRID_temp_min,MADRID_temp_max,MUNCHENB_cloud_cover,MUNCHENB_humidity,MUNCHENB_global_radiation,MUNCHENB_precipitation,MUNCHENB_snow_depth,MUNCHENB_sunshine,MUNCHENB_temp_mean,MUNCHENB_temp_min,MUNCHENB_temp_max,OSLO_cloud_cover,OSLO_wind_speed,OSLO_humidity,OSLO_pressure,OSLO_global_radiation,OSLO_precipitation,OSLO_snow_depth,OSLO_sunshine,OSLO_temp_mean,OSLO_temp_min,OSLO_temp_max,ROMA_cloud_cover,ROMA_wind_speed,ROMA_humidity,ROMA_pressure,ROMA_sunshine,ROMA_temp_mean,SONNBLICK_cloud_cover,SONNBLICK_wind_speed,SONNBLICK_humidity,SONNBLICK_pressure,SONNBLICK_global_radiation,SONNBLICK_precipitation,SONNBLICK_sunshine,SONNBLICK_temp_mean,SONNBLICK_temp_min,SONNBLICK_temp_max,STOCKHOLM_cloud_cover,STOCKHOLM_pressure,STOCKHOLM_global_radiation,STOCKHOLM_precipitation,STOCKHOLM_sunshine,STOCKHOLM_temp_mean,STOCKHOLM_temp_min,STOCKHOLM_temp_max,TOURS_wind_speed,TOURS_humidity,TOURS_pressure,TOURS_global_radiation,TOURS_precipitation,TOURS_temp_mean,TOURS_temp_min,TOURS_temp_max,VALENTIA_cloud_cover,VALENTIA_humidity,VALENTIA_pressure,VALENTIA_global_radiation,VALENTIA_precipitation,VALENTIA_snow_depth,VALENTIA_sunshine,VALENTIA_temp_mean,VALENTIA_temp_min,VALENTIA_temp_max
0,0.660514,-0.02793,0.826097,-0.001949,-1.101066,-0.265148,-0.179228,-0.902918,-0.528623,-0.845652,-0.478356,-1.206433,0.90527,0.321771,-0.743149,-0.371315,0.283983,-1.016876,-1.22021,-0.949203,-0.25524,-0.010098,-0.005876,-1.118537,-0.321868,-0.773378,-1.099163,-1.119431,-1.136839,0.713782,2.78134,0.357839,-1.232471,-1.197013,0.049619,-1.077312,-0.114356,0.263326,-0.411047,1.232526,0.815394,0.625746,-0.005606,-1.157575,-0.305938,-0.131344,-1.014908,-0.105836,0.060555,-0.410423,1.317965,0.660721,-0.348893,-0.268791,-0.927601,-0.667864,-1.158624,0.833387,1.332572,-1.376592,-1.18737,0.141032,-0.073841,-1.064721,-0.106469,0.39347,-1.038492,0.420616,0.449867,-0.801741,-1.06969,0.747355,-0.647708,-0.182904,-0.251893,-0.466503,1.205492,-0.02373,1.864672,-0.008724,-1.203514,-0.40643,-1.149211,-1.370824,-1.12511,-1.578385,0.703568,2.336053,0.267752,-1.043873,-1.052433,0.252496,-0.810834,-0.097084,0.382899,-0.387967,0.855172,-1.419038,1.887115,1.149046,-1.423735,-0.315682,-1.521762,-0.98828,-0.877723,-1.044732,-0.093824,-0.746542,-1.244144,-0.282933,-0.30647,-1.098059,-0.265742,-0.505735,-0.350849,1.111743,0.816809,1.544023,-1.1424,-1.06787,1.925426,-0.470091,-1.018677,-0.186575,0.094958,-0.474865,-0.096926,-0.01198,-0.023247,-0.00114,-0.00636,-1.28045,-0.428835,-0.663322,-0.62943,0.095234,-1.24444,-0.649856,-0.550327,-0.124331,-0.170125,-0.063322,-0.060102,-0.003465,-1.079126,0.479131,-1.013295,-0.391072,-0.290439,-0.639538,-0.029802,-0.029569,-0.000607,-0.003383,0.619704,-0.257321,0.085361,-0.495396,-0.443701,0.761754,-1.299744,-0.806427,-0.088407,-0.024706,0.372147,-0.668215,-0.519743,-0.752237
1,0.244897,-0.02793,0.73576,-0.001949,-1.058108,1.65876,-0.179228,-0.810126,-0.582946,-0.46245,-0.569988,0.652846,1.119118,0.016838,-1.418387,-0.371315,-1.333204,-1.107669,-0.818702,-1.298119,-0.25524,-0.010098,-0.005876,-1.415938,0.371622,-1.344065,-1.110927,-0.878727,-1.341204,1.17606,0.44607,0.866945,-0.987868,-1.118559,-0.367169,-1.05282,-0.367511,0.090631,-0.781002,1.232526,-0.174978,1.143615,-0.005606,-1.089208,1.084926,-0.131344,-0.893696,-0.370915,0.125463,-0.473486,1.317965,0.726127,-0.133555,-0.268791,-0.825294,-0.506386,-1.089557,0.833387,2.00487,-0.984359,-1.18737,0.167279,-0.073841,-1.064721,-0.892676,-0.639866,-0.687774,-0.420953,0.818506,-0.897454,-1.267817,0.199693,-1.074723,-0.212437,0.231491,-0.504162,0.371461,-0.02373,1.399628,-0.008724,-0.828505,-0.266591,-0.420517,-1.043881,-1.043446,-1.056415,1.146094,0.779536,1.072259,-1.054624,-1.107754,2.569483,-0.958969,-0.232112,0.216034,-0.542607,1.22561,-0.910841,1.548493,1.06807,-1.496755,-0.315682,-1.642337,-0.69174,-0.411866,-0.882444,0.318678,-0.344471,-0.809683,0.065552,-0.30647,0.043394,-0.353714,-0.076441,-0.372683,1.111743,1.526267,-0.712374,0.190182,-1.06787,-0.455841,-0.470091,-1.018677,-0.368598,-0.033545,-0.582847,-0.096926,-0.01198,-0.023247,-0.00114,-0.00636,-0.539569,0.350125,-0.108112,0.727065,0.067319,-1.55317,0.186476,-1.073269,-0.650834,-0.456455,-0.839563,-0.060102,-0.003465,-1.079126,-0.251691,-1.013295,-0.415953,-0.18361,-0.62855,-0.029802,-0.029569,-0.000607,-0.003383,1.27722,-0.335759,-0.05668,-0.521727,0.783085,1.18358,-1.262455,-1.042055,0.503361,-0.024706,-0.829285,-0.548046,-0.629054,-0.407141
2,1.07613,-0.02793,1.277781,-0.001949,-1.25142,0.155707,-0.179228,-1.065304,-0.25701,-0.186545,-0.592896,0.652846,0.620141,0.109644,-0.968228,-0.371315,-0.524611,-1.084971,-1.168403,-1.098738,-0.25524,-0.010098,-0.005876,-1.278676,-0.344984,-1.19519,-1.063873,-0.83861,-1.116403,0.251504,-0.202616,1.070588,0.123041,-0.96165,-0.47685,-0.342557,-0.509912,-0.220221,-0.56177,0.78567,-0.450081,1.661484,-0.005606,-1.157575,-0.329918,-0.131344,-1.014908,-0.532908,0.044328,-0.713127,1.317965,0.75883,0.054865,-0.268791,-0.940389,-0.573669,-1.147113,1.324799,1.812785,0.115808,-1.164817,-0.252671,-0.073841,-1.039671,-0.490837,-0.226532,-0.443796,-0.925895,1.279304,-0.382997,-1.267817,1.060304,-1.074723,-0.389635,0.098144,-0.642248,1.205492,-0.02373,1.554643,-0.008724,-1.203514,-0.277348,-1.149211,-0.741156,-0.744013,-0.9729,0.703568,-0.310026,1.519207,0.074279,-1.163075,0.570514,-1.057726,-0.487164,-0.117697,-0.542607,0.484733,-0.21207,1.774241,1.513435,-1.31942,-0.315682,-1.304726,-0.85349,-0.567152,-1.044732,0.318678,1.183399,-1.244144,0.065552,-0.30647,-1.098059,-0.403983,-0.104138,-0.612852,1.111743,-0.279627,-0.27363,0.976489,-1.06787,-0.288735,-0.470091,-1.018677,-0.55062,-0.316251,-0.777215,-0.096926,-0.01198,-0.023247,-0.00114,-0.00636,-0.876333,1.129085,0.093782,0.500982,0.132454,-1.55317,3.796642,-1.073269,-0.650834,-0.384873,-0.898147,-0.060102,-0.003465,-1.079126,-0.364125,-1.013295,-0.615003,-0.410621,-0.727444,-0.029802,-0.029569,-0.000607,-0.003383,-0.208279,-0.210258,0.298424,-0.57439,0.783085,1.18358,-0.432779,-1.136306,-0.396127,-0.024706,-1.0095,-0.067372,0.054135,-0.177078
3,-1.001953,-0.02793,1.458455,-0.001949,-0.821838,-0.445514,-0.179228,-0.114186,-0.555784,-0.38581,-0.512718,1.396557,1.760659,1.289601,-1.418387,-0.371315,-1.333204,-1.209812,-1.362681,-1.437685,-0.25524,-0.010098,-0.005876,-1.404499,-0.344984,-1.344065,-1.146217,-1.012452,-1.208367,1.17606,1.483968,1.376051,1.142224,-1.185805,-0.301361,-1.077312,-0.525734,-0.392916,-0.534366,1.232526,-0.670163,0.88468,-0.005606,-1.157575,-0.44982,-0.131344,-1.014908,-0.577088,-0.49116,-0.851866,0.906985,0.660721,-0.348893,-0.268791,-1.042696,-0.748602,-1.112579,1.324799,2.00487,0.728074,-1.18737,-0.4364,-0.073841,-1.064721,-0.316124,-0.113804,-0.947,-0.841738,0.910666,1.543227,-1.267817,-0.504443,-1.074723,-0.493001,-0.035203,-0.830547,0.371461,-0.02373,1.399628,-0.008724,-0.901423,-0.40643,-0.648234,-0.910682,-0.730403,-0.899824,0.703568,0.468232,0.80409,1.256939,-1.118818,-0.474402,-0.983659,-0.472161,-0.534861,-0.52972,-1.367458,-0.720267,0.927685,1.43246,-0.766551,-0.315682,0.238641,-0.624345,-0.862194,-0.430357,0.318678,1.102985,-1.244144,-0.439751,-0.30647,-1.098059,-0.642763,-0.214923,-0.896689,1.111743,0.752313,1.544023,1.059258,-1.06787,0.27525,-0.470091,-1.018677,-0.417137,-0.341951,-0.582847,-0.096926,-0.01198,-0.023247,-0.00114,-0.00636,-0.775304,-0.039355,0.093782,0.500982,0.418586,-1.541736,0.86948,-1.073269,-0.943336,-0.800052,-1.059254,-0.060102,-0.003465,-1.079126,-0.420342,-1.013295,-0.76429,-0.530804,-0.925231,-0.029802,-0.029569,-0.000607,-0.003383,-0.208279,-0.069069,0.45822,-0.442733,0.783085,0.480538,0.387574,-1.183432,0.669056,-0.024706,-1.039536,-0.998679,-0.164486,-0.838511
4,0.244897,-0.02793,1.729466,-0.001949,-0.746661,-0.164944,-0.179228,0.187388,-1.003946,-1.075573,-1.039603,1.396557,2.188353,1.528244,-1.418387,-0.253655,-1.333204,-1.209812,-1.01298,-1.457623,-0.25524,-0.010098,-0.005876,-1.404499,-0.344984,-1.344065,-1.0874,-0.918844,-1.116403,0.251504,2.132654,0.866945,0.918004,-1.230636,0.356726,-1.077312,-0.320045,-0.60015,-0.383643,0.78567,0.320208,1.40255,-0.005606,-1.157575,0.989004,-0.131344,-1.014908,-0.444548,-0.06926,-0.473486,0.906985,0.75883,0.1087,-0.268791,-0.978754,-0.856254,-1.170135,-0.149436,0.660275,1.158574,-0.995669,-0.4364,-0.073841,-0.538678,-0.403481,0.29953,-1.206227,0.420616,0.818506,1.208231,-1.255434,1.347174,-1.074723,-0.552067,-0.28523,-0.893313,0.788477,-0.02373,1.399628,-0.008724,-1.203514,-0.40643,-1.149211,-0.862246,-0.812066,-1.129491,0.703568,1.038955,1.072259,1.063413,-1.163075,0.797669,-1.057726,-0.307127,-0.618294,-0.387967,-0.626581,-0.720267,0.306877,1.270509,-0.82914,-0.315682,0.021605,-0.381721,-0.287638,-0.441949,-0.093824,0.700914,-0.767297,1.215552,-0.30647,0.155301,-0.906678,-1.073511,-0.831188,1.111743,-0.795597,1.418668,-0.198832,-1.057482,0.087255,-0.470091,-1.018677,-0.332193,-0.020694,-0.582847,-0.096926,-0.01198,-0.023247,-0.00114,-0.00636,-0.926848,-1.207796,0.775175,-0.516389,0.388345,-0.970013,-0.649856,0.313663,-0.621584,-0.671203,-0.546642,-0.060102,-0.003465,-1.079126,3.289982,-1.013295,-0.503037,-0.477389,-0.705467,-0.029802,-0.029569,-0.000607,-0.003383,-0.451803,-0.037694,0.600262,-0.521727,-1.670486,-0.363113,1.72997,-0.794645,-0.49081,-0.024706,0.672505,-1.509396,-1.339569,-1.471186


### 4.4 Check Distribution

In [57]:
# Summary statistics of the scaled columns; after standardization the means
# should be ~0 and the standard deviations ~1.
# Left as the cell's last expression so the notebook renders it as a table
# instead of wrapped plain text from print().
df_scaled.describe()

       BASEL_cloud_cover  BASEL_wind_speed  BASEL_humidity  BASEL_pressure  \
count       2.295000e+04      2.295000e+04    2.295000e+04    2.295000e+04   
mean       -1.975278e-16     -8.817541e-16    6.935145e-16   -1.690442e-15   
std         1.000022e+00      1.000022e+00    1.000022e+00    1.000022e+00   
min        -2.248803e+00     -2.894398e+00   -3.690749e+00   -6.619945e+00   
25%        -5.863365e-01     -2.793014e-02   -7.096309e-01   -3.381979e-01   
50%         2.448969e-01     -2.793014e-02    1.034013e-01   -1.948634e-03   
75%         6.605137e-01     -2.793014e-02    7.357597e-01    3.190165e-01   
max         1.076130e+00      1.935485e+01    2.181150e+00    4.155315e+00   

       BASEL_global_radiation  BASEL_precipitation  BASEL_snow_depth  \
count            2.295000e+04         2.295000e+04      2.295000e+04   
mean            -2.179617e-16        -6.997066e-17     -4.953675e-18   
std              1.000022e+00         1.000022e+00      1.000022e+00   
min      

### 4.5 Concat with Date Columns

In [60]:
# Re-attach the unscaled DATE/MONTH columns to the scaled columns (aligned on
# the shared row index), then apply the column order saved in original_order.
# Selecting by the saved list makes the order explicit and raises a KeyError
# if any original column went missing along the way.
df_final = pd.concat([dropped_cols, df_scaled], axis = 1)[original_order]
df_final.head(3)

Unnamed: 0,DATE,MONTH,BASEL_cloud_cover,BASEL_wind_speed,BASEL_humidity,BASEL_pressure,BASEL_global_radiation,BASEL_precipitation,BASEL_snow_depth,BASEL_sunshine,BASEL_temp_mean,BASEL_temp_min,BASEL_temp_max,BELGRADE_cloud_cover,BELGRADE_humidity,BELGRADE_pressure,BELGRADE_global_radiation,BELGRADE_precipitation,BELGRADE_sunshine,BELGRADE_temp_mean,BELGRADE_temp_min,BELGRADE_temp_max,BUDAPEST_cloud_cover,BUDAPEST_humidity,BUDAPEST_pressure,BUDAPEST_global_radiation,BUDAPEST_precipitation,BUDAPEST_sunshine,BUDAPEST_temp_mean,BUDAPEST_temp_min,BUDAPEST_temp_max,DEBILT_cloud_cover,DEBILT_wind_speed,DEBILT_humidity,DEBILT_pressure,DEBILT_global_radiation,DEBILT_precipitation,DEBILT_sunshine,DEBILT_temp_mean,DEBILT_temp_min,DEBILT_temp_max,DUSSELDORF_cloud_cover,DUSSELDORF_wind_speed,DUSSELDORF_humidity,DUSSELDORF_pressure,DUSSELDORF_global_radiation,DUSSELDORF_precipitation,DUSSELDORF_snow_depth,DUSSELDORF_sunshine,DUSSELDORF_temp_mean,DUSSELDORF_temp_min,DUSSELDORF_temp_max,GDANSK_cloud_cover,GDANSK_humidity,GDANSK_precipitation,GDANSK_snow_depth,GDANSK_temp_mean,GDANSK_temp_min,GDANSK_temp_max,HEATHROW_cloud_cover,HEATHROW_humidity,HEATHROW_pressure,HEATHROW_global_radiation,HEATHROW_precipitation,HEATHROW_snow_depth,HEATHROW_sunshine,HEATHROW_temp_mean,HEATHROW_temp_min,HEATHROW_temp_max,KASSEL_wind_speed,KASSEL_humidity,KASSEL_pressure,KASSEL_global_radiation,KASSEL_precipitation,KASSEL_sunshine,KASSEL_temp_mean,KASSEL_temp_min,KASSEL_temp_max,LJUBLJANA_cloud_cover,LJUBLJANA_wind_speed,LJUBLJANA_humidity,LJUBLJANA_pressure,LJUBLJANA_global_radiation,LJUBLJANA_precipitation,LJUBLJANA_sunshine,LJUBLJANA_temp_mean,LJUBLJANA_temp_min,LJUBLJANA_temp_max,MAASTRICHT_cloud_cover,MAASTRICHT_wind_speed,MAASTRICHT_humidity,MAASTRICHT_pressure,MAASTRICHT_global_radiation,MAASTRICHT_precipitation,MAASTRICHT_sunshine,MAASTRICHT_temp_mean,MAASTRICHT_temp_min,MAASTRICHT_temp_max,MADRID_cloud_cover,MADRID_wind_speed,MADRID_humidity,MADRID_pressure,MADRID_global_radiation,MADRID_prec
ipitation,MADRID_sunshine,MADRID_temp_mean,MADRID_temp_min,MADRID_temp_max,MUNCHENB_cloud_cover,MUNCHENB_humidity,MUNCHENB_global_radiation,MUNCHENB_precipitation,MUNCHENB_snow_depth,MUNCHENB_sunshine,MUNCHENB_temp_mean,MUNCHENB_temp_min,MUNCHENB_temp_max,OSLO_cloud_cover,OSLO_wind_speed,OSLO_humidity,OSLO_pressure,OSLO_global_radiation,OSLO_precipitation,OSLO_snow_depth,OSLO_sunshine,OSLO_temp_mean,OSLO_temp_min,OSLO_temp_max,ROMA_cloud_cover,ROMA_wind_speed,ROMA_humidity,ROMA_pressure,ROMA_sunshine,ROMA_temp_mean,SONNBLICK_cloud_cover,SONNBLICK_wind_speed,SONNBLICK_humidity,SONNBLICK_pressure,SONNBLICK_global_radiation,SONNBLICK_precipitation,SONNBLICK_sunshine,SONNBLICK_temp_mean,SONNBLICK_temp_min,SONNBLICK_temp_max,STOCKHOLM_cloud_cover,STOCKHOLM_pressure,STOCKHOLM_global_radiation,STOCKHOLM_precipitation,STOCKHOLM_sunshine,STOCKHOLM_temp_mean,STOCKHOLM_temp_min,STOCKHOLM_temp_max,TOURS_wind_speed,TOURS_humidity,TOURS_pressure,TOURS_global_radiation,TOURS_precipitation,TOURS_temp_mean,TOURS_temp_min,TOURS_temp_max,VALENTIA_cloud_cover,VALENTIA_humidity,VALENTIA_pressure,VALENTIA_global_radiation,VALENTIA_precipitation,VALENTIA_snow_depth,VALENTIA_sunshine,VALENTIA_temp_mean,VALENTIA_temp_min,VALENTIA_temp_max
0,19600101,1,0.660514,-0.02793,0.826097,-0.001949,-1.101066,-0.265148,-0.179228,-0.902918,-0.528623,-0.845652,-0.478356,-1.206433,0.90527,0.321771,-0.743149,-0.371315,0.283983,-1.016876,-1.22021,-0.949203,-0.25524,-0.010098,-0.005876,-1.118537,-0.321868,-0.773378,-1.099163,-1.119431,-1.136839,0.713782,2.78134,0.357839,-1.232471,-1.197013,0.049619,-1.077312,-0.114356,0.263326,-0.411047,1.232526,0.815394,0.625746,-0.005606,-1.157575,-0.305938,-0.131344,-1.014908,-0.105836,0.060555,-0.410423,1.317965,0.660721,-0.348893,-0.268791,-0.927601,-0.667864,-1.158624,0.833387,1.332572,-1.376592,-1.18737,0.141032,-0.073841,-1.064721,-0.106469,0.39347,-1.038492,0.420616,0.449867,-0.801741,-1.06969,0.747355,-0.647708,-0.182904,-0.251893,-0.466503,1.205492,-0.02373,1.864672,-0.008724,-1.203514,-0.40643,-1.149211,-1.370824,-1.12511,-1.578385,0.703568,2.336053,0.267752,-1.043873,-1.052433,0.252496,-0.810834,-0.097084,0.382899,-0.387967,0.855172,-1.419038,1.887115,1.149046,-1.423735,-0.315682,-1.521762,-0.98828,-0.877723,-1.044732,-0.093824,-0.746542,-1.244144,-0.282933,-0.30647,-1.098059,-0.265742,-0.505735,-0.350849,1.111743,0.816809,1.544023,-1.1424,-1.06787,1.925426,-0.470091,-1.018677,-0.186575,0.094958,-0.474865,-0.096926,-0.01198,-0.023247,-0.00114,-0.00636,-1.28045,-0.428835,-0.663322,-0.62943,0.095234,-1.24444,-0.649856,-0.550327,-0.124331,-0.170125,-0.063322,-0.060102,-0.003465,-1.079126,0.479131,-1.013295,-0.391072,-0.290439,-0.639538,-0.029802,-0.029569,-0.000607,-0.003383,0.619704,-0.257321,0.085361,-0.495396,-0.443701,0.761754,-1.299744,-0.806427,-0.088407,-0.024706,0.372147,-0.668215,-0.519743,-0.752237
1,19600102,1,0.244897,-0.02793,0.73576,-0.001949,-1.058108,1.65876,-0.179228,-0.810126,-0.582946,-0.46245,-0.569988,0.652846,1.119118,0.016838,-1.418387,-0.371315,-1.333204,-1.107669,-0.818702,-1.298119,-0.25524,-0.010098,-0.005876,-1.415938,0.371622,-1.344065,-1.110927,-0.878727,-1.341204,1.17606,0.44607,0.866945,-0.987868,-1.118559,-0.367169,-1.05282,-0.367511,0.090631,-0.781002,1.232526,-0.174978,1.143615,-0.005606,-1.089208,1.084926,-0.131344,-0.893696,-0.370915,0.125463,-0.473486,1.317965,0.726127,-0.133555,-0.268791,-0.825294,-0.506386,-1.089557,0.833387,2.00487,-0.984359,-1.18737,0.167279,-0.073841,-1.064721,-0.892676,-0.639866,-0.687774,-0.420953,0.818506,-0.897454,-1.267817,0.199693,-1.074723,-0.212437,0.231491,-0.504162,0.371461,-0.02373,1.399628,-0.008724,-0.828505,-0.266591,-0.420517,-1.043881,-1.043446,-1.056415,1.146094,0.779536,1.072259,-1.054624,-1.107754,2.569483,-0.958969,-0.232112,0.216034,-0.542607,1.22561,-0.910841,1.548493,1.06807,-1.496755,-0.315682,-1.642337,-0.69174,-0.411866,-0.882444,0.318678,-0.344471,-0.809683,0.065552,-0.30647,0.043394,-0.353714,-0.076441,-0.372683,1.111743,1.526267,-0.712374,0.190182,-1.06787,-0.455841,-0.470091,-1.018677,-0.368598,-0.033545,-0.582847,-0.096926,-0.01198,-0.023247,-0.00114,-0.00636,-0.539569,0.350125,-0.108112,0.727065,0.067319,-1.55317,0.186476,-1.073269,-0.650834,-0.456455,-0.839563,-0.060102,-0.003465,-1.079126,-0.251691,-1.013295,-0.415953,-0.18361,-0.62855,-0.029802,-0.029569,-0.000607,-0.003383,1.27722,-0.335759,-0.05668,-0.521727,0.783085,1.18358,-1.262455,-1.042055,0.503361,-0.024706,-0.829285,-0.548046,-0.629054,-0.407141
2,19600103,1,1.07613,-0.02793,1.277781,-0.001949,-1.25142,0.155707,-0.179228,-1.065304,-0.25701,-0.186545,-0.592896,0.652846,0.620141,0.109644,-0.968228,-0.371315,-0.524611,-1.084971,-1.168403,-1.098738,-0.25524,-0.010098,-0.005876,-1.278676,-0.344984,-1.19519,-1.063873,-0.83861,-1.116403,0.251504,-0.202616,1.070588,0.123041,-0.96165,-0.47685,-0.342557,-0.509912,-0.220221,-0.56177,0.78567,-0.450081,1.661484,-0.005606,-1.157575,-0.329918,-0.131344,-1.014908,-0.532908,0.044328,-0.713127,1.317965,0.75883,0.054865,-0.268791,-0.940389,-0.573669,-1.147113,1.324799,1.812785,0.115808,-1.164817,-0.252671,-0.073841,-1.039671,-0.490837,-0.226532,-0.443796,-0.925895,1.279304,-0.382997,-1.267817,1.060304,-1.074723,-0.389635,0.098144,-0.642248,1.205492,-0.02373,1.554643,-0.008724,-1.203514,-0.277348,-1.149211,-0.741156,-0.744013,-0.9729,0.703568,-0.310026,1.519207,0.074279,-1.163075,0.570514,-1.057726,-0.487164,-0.117697,-0.542607,0.484733,-0.21207,1.774241,1.513435,-1.31942,-0.315682,-1.304726,-0.85349,-0.567152,-1.044732,0.318678,1.183399,-1.244144,0.065552,-0.30647,-1.098059,-0.403983,-0.104138,-0.612852,1.111743,-0.279627,-0.27363,0.976489,-1.06787,-0.288735,-0.470091,-1.018677,-0.55062,-0.316251,-0.777215,-0.096926,-0.01198,-0.023247,-0.00114,-0.00636,-0.876333,1.129085,0.093782,0.500982,0.132454,-1.55317,3.796642,-1.073269,-0.650834,-0.384873,-0.898147,-0.060102,-0.003465,-1.079126,-0.364125,-1.013295,-0.615003,-0.410621,-0.727444,-0.029802,-0.029569,-0.000607,-0.003383,-0.208279,-0.210258,0.298424,-0.57439,0.783085,1.18358,-0.432779,-1.136306,-0.396127,-0.024706,-1.0095,-0.067372,0.054135,-0.177078


## 5. Export Dataset

In [44]:
# Export the final dataset as a pickle file.
prepared_dir = os.path.join(path, '01 Datasets', '02 Prepared Data')
os.makedirs(prepared_dir, exist_ok=True)  # create the output folder if it is missing
df_final.to_pickle(os.path.join(prepared_dir, 'weather_scaled.pkl'))

In [63]:
# Export the final dataset as a snappy-compressed Parquet file.
prepared_dir = os.path.join(path, '01 Datasets', '02 Prepared Data')
os.makedirs(prepared_dir, exist_ok=True)  # create the output folder if it is missing
df_final.to_parquet(os.path.join(prepared_dir, 'weather_scaled.parquet'), compression='snappy')