## Imports

In [2]:
import numpy as np
import pandas as pd
import seaborn as sns
import scipy.stats as st
import matplotlib.pyplot as plt

## Data

In [11]:
# Read the training set directly from the zip archive; the 'date' column is
# parsed as datetimes and becomes the row index.
df = pd.read_csv(
    'icl_train.zip',
    index_col='date',
    parse_dates=['date'],
    sep=',',
    compression='zip',
)
df.head()

Unnamed: 0_level_0,zone,Вызов специальной бригады,Перевозка плановая,Перевозка экстренная,авария ( сбило машиной) постр.,аллергия( задыхается),аллергия( отекло лицо),аллергия( сыпь),аритмия,без сознания,...,травма позвоночника,травма ребер( задыхается),травма ребер( не задыхается),травма руки,травма руки( кровотечение),тяж.ст.опьянения,укусила собака,умер?,умер?( хронический больной),умирает
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
2019-01-01 07:00:00,П/станция 1,0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
2019-01-01 08:00:00,П/станция 1,0,0,0,0,0,0,0,0,0,...,0,0,0,1,0,0,0,0,0,1
2019-01-01 09:00:00,П/станция 1,0,0,0,0,0,0,0,0,1,...,0,0,0,0,0,0,0,0,0,1
2019-01-01 10:00:00,П/станция 1,0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
2019-01-01 11:00:00,П/станция 1,1,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0


#### Погода

In [23]:
# Weather features from a cp1251-encoded CSV; the first (unnamed) column holds
# the timestamps and is used as a datetime index.
weather_df = pd.read_csv(
    'weather_prepared_interpolated.csv',
    index_col=0,
    parse_dates=[0],
    encoding='cp1251',
)
weather_df.head()

Unnamed: 0,weather,temp,w_spid,p
2019-01-01 03:00:00,пасмурно,-8.0,3.0,765.0
2019-01-01 04:00:00,пасмурно,-8.333333,2.666667,765.0
2019-01-01 05:00:00,пасмурно,-8.666667,2.333333,765.0
2019-01-01 06:00:00,пасмурно,-9.0,2.0,765.0
2019-01-01 07:00:00,пасмурно,-9.333333,2.0,765.0


#### Лунные фазы

In [24]:
# Moon-phase indicator columns from a cp1251-encoded CSV; the first (unnamed)
# column holds the timestamps and is used as a datetime index.
moon_df = pd.read_csv(
    'moon_prepared_interpolated.csv',
    index_col=0,
    parse_dates=[0],
    encoding='cp1251',
)
moon_df.head()

Unnamed: 0,новая луна,первая четверь,полнолуние,третья четверть
2019-01-01 00:00:00,1.0,0.0,0.0,0.0
2019-01-01 01:00:00,1.0,0.0,0.0,0.0
2019-01-01 02:00:00,1.0,0.0,0.0,0.0
2019-01-01 03:00:00,1.0,0.0,0.0,0.0
2019-01-01 04:00:00,1.0,0.0,0.0,0.0


#### Динамика по ковиду

In [43]:
# COVID case-count series from a cp1251-encoded CSV; the first (unnamed)
# column holds the timestamps and is used as a datetime index.
covid_df = pd.read_csv(
    'covid_interpolated.csv',
    index_col=0,
    parse_dates=[0],
    encoding='cp1251',
)
covid_df.head()

Unnamed: 0,Заражений за день
2019-01-01 00:00:00,0.0
2019-01-01 01:00:00,0.0
2019-01-01 02:00:00,0.0
2019-01-01 03:00:00,0.0
2019-01-01 04:00:00,0.0


### Объединяем данные (присоединяем погоду, лунные фазы и ковид по времени)

In [44]:
# Work on a copy so the raw call data in `df` stays untouched.
df_new = df.copy()

# Attach each external feature table in turn: look up the feature rows for the
# timestamps in df's index and store them under the feature table's own column
# names. Order matters only for column placement: weather, then moon, then covid.
for _features in (weather_df, moon_df, covid_df):
    df_new[_features.columns] = _features.loc[df.index]

In [45]:
# Preview the first rows to confirm the feature columns were appended.
df_new.head(n=5)

Unnamed: 0_level_0,zone,Вызов специальной бригады,Перевозка плановая,Перевозка экстренная,авария ( сбило машиной) постр.,аллергия( задыхается),аллергия( отекло лицо),аллергия( сыпь),аритмия,без сознания,...,умирает,weather,temp,w_spid,p,новая луна,первая четверь,полнолуние,третья четверть,Заражений за день
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
2019-01-01 07:00:00,П/станция 1,0,0,0,0,0,0,0,0,0,...,0,пасмурно,-9.333333,2.0,765.0,1.0,0.0,0.0,0.0,0.0
2019-01-01 08:00:00,П/станция 1,0,0,0,0,0,0,0,0,0,...,1,пасмурно,-9.666667,2.0,765.0,1.0,0.0,0.0,0.0,0.0
2019-01-01 09:00:00,П/станция 1,0,0,0,0,0,0,0,0,1,...,1,малооблачно,-10.0,2.0,765.0,1.0,0.0,0.0,0.0,0.0
2019-01-01 10:00:00,П/станция 1,0,0,0,0,0,0,0,0,0,...,0,малооблачно,-9.666667,2.006102,764.666667,1.0,0.0,0.0,0.0,0.0
2019-01-01 11:00:00,П/станция 1,1,0,0,0,0,0,0,0,0,...,0,малооблачно,-9.333333,2.012205,764.333333,1.0,0.0,0.0,0.0,0.0


## Pipeline