In [10]:
#Imports
import csv
import pandas as pd
import numpy as np
from sklearn.model_selection import train_test_split, GridSearchCV
from sklearn.linear_model import LinearRegression,LogisticRegression
from sklearn.svm import SVC,LinearSVC
from sklearn.tree import DecisionTreeClassifier
from sklearn.preprocessing import LabelEncoder, MinMaxScaler
from sklearn.metrics import accuracy_score,confusion_matrix
%matplotlib inline

#Leitura dos ficheiros
train = pd.read_csv('datasets/training_data.csv',encoding='cp1252')
test = pd.read_csv('datasets/test_data.csv',encoding='cp1252')

#Funções auxiliares
ordem = {'None':0, 'Low':1, 'Medium':2, 'High':3, 'Very_High':4}

def round_pred(pred,predictions):
    for n in pred:
        n = int(round(n))
        if n == 0: predictions.append('None')
        elif n == 1: predictions.append('Low')
        elif n == 2: predictions.append('Medium')
        elif n == 3: predictions.append('High')
        else: predictions.append('Very_High')

In [2]:
#Tratamento de dados

#Feriados e Dias da semana
feriados = ['2018-01-01', '2018-02-13', '2018-03-30', '2018-04-01', '2018-04-25', '2018-05-01', '2018-05-31', 
            '2018-06-10', '2018-08-15', '2018-10-05', '2018-11-01', '2018-12-01', '2018-12-08', '2018-12-25',
            '2019-01-01', '2019-03-05', '2019-04-19', '2019-04-21', '2019-04-25', '2019-05-01', '2019-06-10', 
            '2019-06-20', '2019-08-15', '2019-10-05', '2019-11-01', '2019-12-01', '2019-12-08', '2019-12-25']

for index,row in train.iterrows():
    data = row[1].split(' ')[0]
    dia = pd.Timestamp(data)
    train.at[index,'Dia'] = dia.day_name()
    if data in feriados: train.at[index,'Feriado'] = True
    else: train.at[index,'Feriado'] = False
        
for index,row in test.iterrows():
    data = row[1].split(' ')[0]
    dia = pd.Timestamp(data)
    test.at[index,'Dia'] = dia.day_name()
    if data in feriados: test.at[index,'Feriado'] = True
    else: test.at[index,'Feriado'] = False
        
del train['AVERAGE_PRECIPITATION']
del test['AVERAGE_PRECIPITATION']
del train['city_name']
del test['city_name']
del train['record_date']
del test['record_date']

train['AVERAGE_CLOUDINESS'].fillna(method ='pad',inplace=True)
train['AVERAGE_CLOUDINESS'].fillna(method ='bfill',inplace=True)
train['AVERAGE_RAIN'].fillna(method ='pad',inplace=True)
train['AVERAGE_RAIN'].fillna(method ='bfill',inplace=True)

In [3]:
#Substituir outliers
q = train['AVERAGE_TIME_DIFF'].quantile(0.9)
train.loc[train.AVERAGE_TIME_DIFF > q, 'AVERAGE_TIME_DIFF'] = np.nan
train.fillna(q,inplace=True)

In [4]:
#Preparação para colocar nos modelos
X = train.drop(['AVERAGE_SPEED_DIFF'],axis=1)
Y = train['AVERAGE_SPEED_DIFF'].to_frame()
Y_2 = train['AVERAGE_SPEED_DIFF'].map(ordem)
X_test = test

luminosity = LabelEncoder()
cloudiness = LabelEncoder()
rain = LabelEncoder()
feriado = LabelEncoder()
day = LabelEncoder()
luminosity_t = LabelEncoder()
cloudiness_t = LabelEncoder()
rain_t = LabelEncoder()
feriado_t = LabelEncoder()
day_t = LabelEncoder()

X['LUMINOSITY_n'] = luminosity.fit_transform(X['LUMINOSITY'])
X['AVERAGE_CLOUDINESS_n'] = cloudiness.fit_transform(X['AVERAGE_CLOUDINESS'])
X['AVERAGE_RAIN_n'] = rain.fit_transform(X['AVERAGE_RAIN'])
X['Feriado_n'] = feriado.fit_transform(X['Feriado'])
X['Dia_n'] = day.fit_transform(X['Dia'])

X_test['LUMINOSITY_n'] = luminosity_t.fit_transform(X_test['LUMINOSITY'])
X_test['AVERAGE_CLOUDINESS_n'] = cloudiness_t.fit_transform(X_test['AVERAGE_CLOUDINESS'])
X_test['AVERAGE_RAIN_n'] = rain_t.fit_transform(X_test['AVERAGE_RAIN'])
X_test['Feriado_n'] = feriado_t.fit_transform(X_test['Feriado'])
X_test['Dia_n'] = day_t.fit_transform(X_test['Dia'])

X = X.drop(['LUMINOSITY', 'AVERAGE_CLOUDINESS', 'AVERAGE_RAIN','Dia','Feriado'],axis=1)
X_test = X_test.drop(['LUMINOSITY', 'AVERAGE_CLOUDINESS', 'AVERAGE_RAIN','Dia','Feriado'],axis=1)

In [6]:
#DecisionTreeClassifier
dtc = DecisionTreeClassifier(random_state= 2021)
dtc.fit(X,Y)
predictions = dtc.predict(X_test)
predictions

array(['None', 'Medium', 'None', ..., 'None', 'Very_High', 'Low'],
      dtype=object)

In [7]:
#Linear Regression
lr = LinearRegression()
lr.fit(X,Y_2)
pred = lr.predict(X_test)
predictions = []
round_pred(pred,predictions)
predictions

['None',
 'Low',
 'None',
 'High',
 'Low',
 'Medium',
 'Low',
 'Low',
 'Low',
 'Medium',
 'None',
 'Low',
 'Medium',
 'High',
 'High',
 'High',
 'None',
 'High',
 'Low',
 'None',
 'None',
 'Low',
 'Low',
 'None',
 'Medium',
 'Medium',
 'Medium',
 'None',
 'None',
 'Very_High',
 'Low',
 'Low',
 'Very_High',
 'Low',
 'Low',
 'Low',
 'Low',
 'High',
 'Medium',
 'None',
 'Low',
 'None',
 'High',
 'Very_High',
 'High',
 'Low',
 'Low',
 'Low',
 'Low',
 'Low',
 'Low',
 'Low',
 'Very_High',
 'Medium',
 'None',
 'Medium',
 'High',
 'Very_High',
 'Very_High',
 'None',
 'None',
 'Low',
 'Low',
 'Low',
 'Very_High',
 'None',
 'Very_High',
 'Low',
 'Medium',
 'Very_High',
 'None',
 'Low',
 'Low',
 'Low',
 'Very_High',
 'High',
 'Low',
 'None',
 'Medium',
 'Medium',
 'Low',
 'Low',
 'Very_High',
 'None',
 'None',
 'Low',
 'None',
 'Medium',
 'None',
 'High',
 'Medium',
 'None',
 'None',
 'High',
 'Medium',
 'None',
 'Very_High',
 'None',
 'None',
 'Very_High',
 'Medium',
 'Low',
 'None',
 'None',
 '

In [11]:
#Logistic Regression
logr = LogisticRegression(max_iter=10000)
logr.fit(X,Y_2)
pred = logr.predict(X_test)
predictions = []
round_pred(pred,predictions)
predictions

['None',
 'Medium',
 'None',
 'Medium',
 'None',
 'Medium',
 'Low',
 'Medium',
 'None',
 'Medium',
 'None',
 'None',
 'Medium',
 'Medium',
 'High',
 'High',
 'None',
 'High',
 'Medium',
 'None',
 'None',
 'None',
 'Low',
 'None',
 'Medium',
 'Medium',
 'High',
 'None',
 'None',
 'Very_High',
 'None',
 'Low',
 'Very_High',
 'Medium',
 'None',
 'None',
 'Medium',
 'High',
 'Medium',
 'None',
 'None',
 'None',
 'High',
 'Very_High',
 'High',
 'Medium',
 'Low',
 'None',
 'Low',
 'Low',
 'Medium',
 'Medium',
 'High',
 'Medium',
 'None',
 'High',
 'High',
 'High',
 'Very_High',
 'None',
 'None',
 'Low',
 'None',
 'Medium',
 'Very_High',
 'None',
 'Very_High',
 'Low',
 'High',
 'Very_High',
 'None',
 'Medium',
 'Medium',
 'Medium',
 'Very_High',
 'High',
 'Low',
 'None',
 'Medium',
 'Medium',
 'Low',
 'Medium',
 'Very_High',
 'None',
 'None',
 'Low',
 'None',
 'Medium',
 'None',
 'High',
 'Medium',
 'None',
 'None',
 'High',
 'Medium',
 'None',
 'Very_High',
 'None',
 'None',
 'Very_High',
 '

In [16]:
#LinearSVC
model = LinearSVC(dual=False)
model.fit(X,Y)

predictions = model.predict(X_test)
predictions

  y = column_or_1d(y, warn=True)


array(['None', 'Low', 'None', ..., 'None', 'Very_High', 'Medium'],
      dtype=object)

In [14]:
#GridSearch
param_grid = {'C': [0.1,1,10,100,1000], 'gamma': [1,0.1,0.01,0.001,0.0001],'kernel': ['rbf']}
grid = GridSearchCV(SVC(random_state=2021),param_grid,refit=True,verbose=3)
grid.fit(X,Y)

predictions = grid.predict(X_test)
predictions

Fitting 5 folds for each of 25 candidates, totalling 125 fits


  y = column_or_1d(y, warn=True)


[CV 1/5] END ........C=0.1, gamma=1, kernel=rbf;, score=0.323 total time=   7.2s


  y = column_or_1d(y, warn=True)


[CV 2/5] END ........C=0.1, gamma=1, kernel=rbf;, score=0.323 total time=   5.8s


  y = column_or_1d(y, warn=True)


[CV 3/5] END ........C=0.1, gamma=1, kernel=rbf;, score=0.323 total time=   5.4s


  y = column_or_1d(y, warn=True)


[CV 4/5] END ........C=0.1, gamma=1, kernel=rbf;, score=0.323 total time=   6.1s


  y = column_or_1d(y, warn=True)


[CV 5/5] END ........C=0.1, gamma=1, kernel=rbf;, score=0.323 total time=   4.9s


  y = column_or_1d(y, warn=True)


[CV 1/5] END ......C=0.1, gamma=0.1, kernel=rbf;, score=0.323 total time=   3.4s


  y = column_or_1d(y, warn=True)


[CV 2/5] END ......C=0.1, gamma=0.1, kernel=rbf;, score=0.323 total time=   3.4s


  y = column_or_1d(y, warn=True)


[CV 3/5] END ......C=0.1, gamma=0.1, kernel=rbf;, score=0.323 total time=   3.5s


  y = column_or_1d(y, warn=True)


[CV 4/5] END ......C=0.1, gamma=0.1, kernel=rbf;, score=0.323 total time=   3.6s


  y = column_or_1d(y, warn=True)


[CV 5/5] END ......C=0.1, gamma=0.1, kernel=rbf;, score=0.323 total time=   3.3s


  y = column_or_1d(y, warn=True)


[CV 1/5] END .....C=0.1, gamma=0.01, kernel=rbf;, score=0.699 total time=   1.9s


  y = column_or_1d(y, warn=True)


[CV 2/5] END .....C=0.1, gamma=0.01, kernel=rbf;, score=0.701 total time=   1.9s


  y = column_or_1d(y, warn=True)


[CV 3/5] END .....C=0.1, gamma=0.01, kernel=rbf;, score=0.725 total time=   1.9s


  y = column_or_1d(y, warn=True)


[CV 4/5] END .....C=0.1, gamma=0.01, kernel=rbf;, score=0.714 total time=   1.9s


  y = column_or_1d(y, warn=True)


[CV 5/5] END .....C=0.1, gamma=0.01, kernel=rbf;, score=0.696 total time=   1.8s


  y = column_or_1d(y, warn=True)


[CV 1/5] END ....C=0.1, gamma=0.001, kernel=rbf;, score=0.743 total time=   1.2s


  y = column_or_1d(y, warn=True)


[CV 2/5] END ....C=0.1, gamma=0.001, kernel=rbf;, score=0.756 total time=   1.1s


  y = column_or_1d(y, warn=True)


[CV 3/5] END ....C=0.1, gamma=0.001, kernel=rbf;, score=0.775 total time=   1.2s


  y = column_or_1d(y, warn=True)


[CV 4/5] END ....C=0.1, gamma=0.001, kernel=rbf;, score=0.744 total time=   1.1s


  y = column_or_1d(y, warn=True)


[CV 5/5] END ....C=0.1, gamma=0.001, kernel=rbf;, score=0.758 total time=   1.2s


  y = column_or_1d(y, warn=True)


[CV 1/5] END ...C=0.1, gamma=0.0001, kernel=rbf;, score=0.669 total time=   1.6s


  y = column_or_1d(y, warn=True)


[CV 2/5] END ...C=0.1, gamma=0.0001, kernel=rbf;, score=0.701 total time=   1.7s


  y = column_or_1d(y, warn=True)


[CV 3/5] END ...C=0.1, gamma=0.0001, kernel=rbf;, score=0.709 total time=   1.6s


  y = column_or_1d(y, warn=True)


[CV 4/5] END ...C=0.1, gamma=0.0001, kernel=rbf;, score=0.708 total time=   1.5s


  y = column_or_1d(y, warn=True)


[CV 5/5] END ...C=0.1, gamma=0.0001, kernel=rbf;, score=0.698 total time=   1.5s


  y = column_or_1d(y, warn=True)


[CV 1/5] END ..........C=1, gamma=1, kernel=rbf;, score=0.323 total time=   5.1s


  y = column_or_1d(y, warn=True)


[CV 2/5] END ..........C=1, gamma=1, kernel=rbf;, score=0.323 total time=   4.8s


  y = column_or_1d(y, warn=True)


[CV 3/5] END ..........C=1, gamma=1, kernel=rbf;, score=0.323 total time=   5.0s


  y = column_or_1d(y, warn=True)


[CV 4/5] END ..........C=1, gamma=1, kernel=rbf;, score=0.323 total time=   4.9s


  y = column_or_1d(y, warn=True)


[CV 5/5] END ..........C=1, gamma=1, kernel=rbf;, score=0.323 total time=   4.9s


  y = column_or_1d(y, warn=True)


[CV 1/5] END ........C=1, gamma=0.1, kernel=rbf;, score=0.415 total time=   3.4s


  y = column_or_1d(y, warn=True)


[CV 2/5] END ........C=1, gamma=0.1, kernel=rbf;, score=0.405 total time=   3.6s


  y = column_or_1d(y, warn=True)


[CV 3/5] END ........C=1, gamma=0.1, kernel=rbf;, score=0.412 total time=   3.6s


  y = column_or_1d(y, warn=True)


[CV 4/5] END ........C=1, gamma=0.1, kernel=rbf;, score=0.405 total time=   3.5s


  y = column_or_1d(y, warn=True)


[CV 5/5] END ........C=1, gamma=0.1, kernel=rbf;, score=0.421 total time=   3.7s


  y = column_or_1d(y, warn=True)


[CV 1/5] END .......C=1, gamma=0.01, kernel=rbf;, score=0.759 total time=   1.7s


  y = column_or_1d(y, warn=True)


[CV 2/5] END .......C=1, gamma=0.01, kernel=rbf;, score=0.768 total time=   1.9s


  y = column_or_1d(y, warn=True)


[CV 3/5] END .......C=1, gamma=0.01, kernel=rbf;, score=0.772 total time=   1.7s


  y = column_or_1d(y, warn=True)


[CV 4/5] END .......C=1, gamma=0.01, kernel=rbf;, score=0.775 total time=   1.6s


  y = column_or_1d(y, warn=True)


[CV 5/5] END .......C=1, gamma=0.01, kernel=rbf;, score=0.767 total time=   1.5s


  y = column_or_1d(y, warn=True)


[CV 1/5] END ......C=1, gamma=0.001, kernel=rbf;, score=0.771 total time=   0.9s


  y = column_or_1d(y, warn=True)


[CV 2/5] END ......C=1, gamma=0.001, kernel=rbf;, score=0.779 total time=   0.9s


  y = column_or_1d(y, warn=True)


[CV 3/5] END ......C=1, gamma=0.001, kernel=rbf;, score=0.795 total time=   1.0s


  y = column_or_1d(y, warn=True)


[CV 4/5] END ......C=1, gamma=0.001, kernel=rbf;, score=0.761 total time=   0.9s


  y = column_or_1d(y, warn=True)


[CV 5/5] END ......C=1, gamma=0.001, kernel=rbf;, score=0.779 total time=   1.0s


  y = column_or_1d(y, warn=True)


[CV 1/5] END .....C=1, gamma=0.0001, kernel=rbf;, score=0.752 total time=   1.0s


  y = column_or_1d(y, warn=True)


[CV 2/5] END .....C=1, gamma=0.0001, kernel=rbf;, score=0.764 total time=   1.1s


  y = column_or_1d(y, warn=True)


[CV 3/5] END .....C=1, gamma=0.0001, kernel=rbf;, score=0.786 total time=   1.0s


  y = column_or_1d(y, warn=True)


[CV 4/5] END .....C=1, gamma=0.0001, kernel=rbf;, score=0.760 total time=   1.0s


  y = column_or_1d(y, warn=True)


[CV 5/5] END .....C=1, gamma=0.0001, kernel=rbf;, score=0.766 total time=   1.0s


  y = column_or_1d(y, warn=True)


[CV 1/5] END .........C=10, gamma=1, kernel=rbf;, score=0.323 total time=   5.5s


  y = column_or_1d(y, warn=True)


[CV 2/5] END .........C=10, gamma=1, kernel=rbf;, score=0.324 total time=   5.5s


  y = column_or_1d(y, warn=True)


[CV 3/5] END .........C=10, gamma=1, kernel=rbf;, score=0.323 total time=   5.7s


  y = column_or_1d(y, warn=True)


[CV 4/5] END .........C=10, gamma=1, kernel=rbf;, score=0.323 total time=   5.5s


  y = column_or_1d(y, warn=True)


[CV 5/5] END .........C=10, gamma=1, kernel=rbf;, score=0.324 total time=   5.3s


  y = column_or_1d(y, warn=True)


[CV 1/5] END .......C=10, gamma=0.1, kernel=rbf;, score=0.439 total time=   3.4s


  y = column_or_1d(y, warn=True)


[CV 2/5] END .......C=10, gamma=0.1, kernel=rbf;, score=0.428 total time=   3.6s


  y = column_or_1d(y, warn=True)


[CV 3/5] END .......C=10, gamma=0.1, kernel=rbf;, score=0.445 total time=   3.4s


  y = column_or_1d(y, warn=True)


[CV 4/5] END .......C=10, gamma=0.1, kernel=rbf;, score=0.441 total time=   3.7s


  y = column_or_1d(y, warn=True)


[CV 5/5] END .......C=10, gamma=0.1, kernel=rbf;, score=0.458 total time=   3.8s


  y = column_or_1d(y, warn=True)


[CV 1/5] END ......C=10, gamma=0.01, kernel=rbf;, score=0.726 total time=   1.7s


  y = column_or_1d(y, warn=True)


[CV 2/5] END ......C=10, gamma=0.01, kernel=rbf;, score=0.737 total time=   1.7s


  y = column_or_1d(y, warn=True)


[CV 3/5] END ......C=10, gamma=0.01, kernel=rbf;, score=0.735 total time=   2.1s


  y = column_or_1d(y, warn=True)


[CV 4/5] END ......C=10, gamma=0.01, kernel=rbf;, score=0.742 total time=   1.8s


  y = column_or_1d(y, warn=True)


[CV 5/5] END ......C=10, gamma=0.01, kernel=rbf;, score=0.738 total time=   1.7s


  y = column_or_1d(y, warn=True)


[CV 1/5] END .....C=10, gamma=0.001, kernel=rbf;, score=0.781 total time=   0.8s


  y = column_or_1d(y, warn=True)


[CV 2/5] END .....C=10, gamma=0.001, kernel=rbf;, score=0.777 total time=   0.8s


  y = column_or_1d(y, warn=True)


[CV 3/5] END .....C=10, gamma=0.001, kernel=rbf;, score=0.793 total time=   0.8s


  y = column_or_1d(y, warn=True)


[CV 4/5] END .....C=10, gamma=0.001, kernel=rbf;, score=0.778 total time=   0.9s


  y = column_or_1d(y, warn=True)


[CV 5/5] END .....C=10, gamma=0.001, kernel=rbf;, score=0.778 total time=   0.9s


  y = column_or_1d(y, warn=True)


[CV 1/5] END ....C=10, gamma=0.0001, kernel=rbf;, score=0.770 total time=   0.8s


  y = column_or_1d(y, warn=True)


[CV 2/5] END ....C=10, gamma=0.0001, kernel=rbf;, score=0.775 total time=   0.9s


  y = column_or_1d(y, warn=True)


[CV 3/5] END ....C=10, gamma=0.0001, kernel=rbf;, score=0.795 total time=   0.9s


  y = column_or_1d(y, warn=True)


[CV 4/5] END ....C=10, gamma=0.0001, kernel=rbf;, score=0.770 total time=   0.8s


  y = column_or_1d(y, warn=True)


[CV 5/5] END ....C=10, gamma=0.0001, kernel=rbf;, score=0.782 total time=   0.8s


  y = column_or_1d(y, warn=True)


[CV 1/5] END ........C=100, gamma=1, kernel=rbf;, score=0.323 total time=   5.5s


  y = column_or_1d(y, warn=True)


[CV 2/5] END ........C=100, gamma=1, kernel=rbf;, score=0.324 total time=   5.4s


  y = column_or_1d(y, warn=True)


[CV 3/5] END ........C=100, gamma=1, kernel=rbf;, score=0.323 total time=   5.2s


  y = column_or_1d(y, warn=True)


[CV 4/5] END ........C=100, gamma=1, kernel=rbf;, score=0.323 total time=   5.4s


  y = column_or_1d(y, warn=True)


[CV 5/5] END ........C=100, gamma=1, kernel=rbf;, score=0.324 total time=   5.3s


  y = column_or_1d(y, warn=True)


[CV 1/5] END ......C=100, gamma=0.1, kernel=rbf;, score=0.439 total time=   3.5s


  y = column_or_1d(y, warn=True)


[CV 2/5] END ......C=100, gamma=0.1, kernel=rbf;, score=0.428 total time=   3.5s


  y = column_or_1d(y, warn=True)


[CV 3/5] END ......C=100, gamma=0.1, kernel=rbf;, score=0.445 total time=   3.8s


  y = column_or_1d(y, warn=True)


[CV 4/5] END ......C=100, gamma=0.1, kernel=rbf;, score=0.441 total time=   3.5s


  y = column_or_1d(y, warn=True)


[CV 5/5] END ......C=100, gamma=0.1, kernel=rbf;, score=0.458 total time=   3.4s


  y = column_or_1d(y, warn=True)


[CV 1/5] END .....C=100, gamma=0.01, kernel=rbf;, score=0.712 total time=   2.0s


  y = column_or_1d(y, warn=True)


[CV 2/5] END .....C=100, gamma=0.01, kernel=rbf;, score=0.712 total time=   1.8s


  y = column_or_1d(y, warn=True)


[CV 3/5] END .....C=100, gamma=0.01, kernel=rbf;, score=0.706 total time=   1.9s


  y = column_or_1d(y, warn=True)


[CV 4/5] END .....C=100, gamma=0.01, kernel=rbf;, score=0.720 total time=   2.1s


  y = column_or_1d(y, warn=True)


[CV 5/5] END .....C=100, gamma=0.01, kernel=rbf;, score=0.728 total time=   2.2s


  y = column_or_1d(y, warn=True)


[CV 1/5] END ....C=100, gamma=0.001, kernel=rbf;, score=0.750 total time=   1.2s


  y = column_or_1d(y, warn=True)


[CV 2/5] END ....C=100, gamma=0.001, kernel=rbf;, score=0.767 total time=   1.3s


  y = column_or_1d(y, warn=True)


[CV 3/5] END ....C=100, gamma=0.001, kernel=rbf;, score=0.766 total time=   1.3s


  y = column_or_1d(y, warn=True)


[CV 4/5] END ....C=100, gamma=0.001, kernel=rbf;, score=0.771 total time=   1.5s


  y = column_or_1d(y, warn=True)


[CV 5/5] END ....C=100, gamma=0.001, kernel=rbf;, score=0.764 total time=   1.3s


  y = column_or_1d(y, warn=True)


[CV 1/5] END ...C=100, gamma=0.0001, kernel=rbf;, score=0.770 total time=   1.0s


  y = column_or_1d(y, warn=True)


[CV 2/5] END ...C=100, gamma=0.0001, kernel=rbf;, score=0.784 total time=   0.9s


  y = column_or_1d(y, warn=True)


[CV 3/5] END ...C=100, gamma=0.0001, kernel=rbf;, score=0.798 total time=   0.9s


  y = column_or_1d(y, warn=True)


[CV 4/5] END ...C=100, gamma=0.0001, kernel=rbf;, score=0.780 total time=   0.8s


  y = column_or_1d(y, warn=True)


[CV 5/5] END ...C=100, gamma=0.0001, kernel=rbf;, score=0.783 total time=   0.8s


  y = column_or_1d(y, warn=True)


[CV 1/5] END .......C=1000, gamma=1, kernel=rbf;, score=0.323 total time=   5.5s


  y = column_or_1d(y, warn=True)


[CV 2/5] END .......C=1000, gamma=1, kernel=rbf;, score=0.324 total time=   5.5s


  y = column_or_1d(y, warn=True)


[CV 3/5] END .......C=1000, gamma=1, kernel=rbf;, score=0.323 total time=   5.2s


  y = column_or_1d(y, warn=True)


[CV 4/5] END .......C=1000, gamma=1, kernel=rbf;, score=0.323 total time=   5.5s


  y = column_or_1d(y, warn=True)


[CV 5/5] END .......C=1000, gamma=1, kernel=rbf;, score=0.324 total time=   5.3s


  y = column_or_1d(y, warn=True)


[CV 1/5] END .....C=1000, gamma=0.1, kernel=rbf;, score=0.439 total time=   3.4s


  y = column_or_1d(y, warn=True)


[CV 2/5] END .....C=1000, gamma=0.1, kernel=rbf;, score=0.428 total time=   3.4s


  y = column_or_1d(y, warn=True)


[CV 3/5] END .....C=1000, gamma=0.1, kernel=rbf;, score=0.445 total time=   3.4s


  y = column_or_1d(y, warn=True)


[CV 4/5] END .....C=1000, gamma=0.1, kernel=rbf;, score=0.441 total time=   3.4s


  y = column_or_1d(y, warn=True)


[CV 5/5] END .....C=1000, gamma=0.1, kernel=rbf;, score=0.458 total time=   3.4s


  y = column_or_1d(y, warn=True)


[CV 1/5] END ....C=1000, gamma=0.01, kernel=rbf;, score=0.713 total time=   1.8s


  y = column_or_1d(y, warn=True)


[CV 2/5] END ....C=1000, gamma=0.01, kernel=rbf;, score=0.712 total time=   1.8s


  y = column_or_1d(y, warn=True)


[CV 3/5] END ....C=1000, gamma=0.01, kernel=rbf;, score=0.699 total time=   2.0s


  y = column_or_1d(y, warn=True)


[CV 4/5] END ....C=1000, gamma=0.01, kernel=rbf;, score=0.719 total time=   1.9s


  y = column_or_1d(y, warn=True)


[CV 5/5] END ....C=1000, gamma=0.01, kernel=rbf;, score=0.728 total time=   1.8s


  y = column_or_1d(y, warn=True)


[CV 1/5] END ...C=1000, gamma=0.001, kernel=rbf;, score=0.735 total time=   3.3s


  y = column_or_1d(y, warn=True)


[CV 2/5] END ...C=1000, gamma=0.001, kernel=rbf;, score=0.736 total time=   3.7s


  y = column_or_1d(y, warn=True)


[CV 3/5] END ...C=1000, gamma=0.001, kernel=rbf;, score=0.750 total time=   3.8s


  y = column_or_1d(y, warn=True)


[CV 4/5] END ...C=1000, gamma=0.001, kernel=rbf;, score=0.756 total time=   4.3s


  y = column_or_1d(y, warn=True)


[CV 5/5] END ...C=1000, gamma=0.001, kernel=rbf;, score=0.756 total time=   3.7s


  y = column_or_1d(y, warn=True)


[CV 1/5] END ..C=1000, gamma=0.0001, kernel=rbf;, score=0.773 total time=   1.4s


  y = column_or_1d(y, warn=True)


[CV 2/5] END ..C=1000, gamma=0.0001, kernel=rbf;, score=0.788 total time=   1.7s


  y = column_or_1d(y, warn=True)


[CV 3/5] END ..C=1000, gamma=0.0001, kernel=rbf;, score=0.796 total time=   1.5s


  y = column_or_1d(y, warn=True)


[CV 4/5] END ..C=1000, gamma=0.0001, kernel=rbf;, score=0.775 total time=   1.4s


  y = column_or_1d(y, warn=True)


[CV 5/5] END ..C=1000, gamma=0.0001, kernel=rbf;, score=0.782 total time=   1.3s


  y = column_or_1d(y, warn=True)


array(['None', 'Low', 'None', ..., 'None', 'Very_High', 'Low'],
      dtype=object)

In [17]:
submission = open("submissions/submission15.csv", "w", newline='')
writer = csv.writer(submission)
writer.writerow(['RowId', 'Speed_Diff'])
rowId = list(range(0, 1500))
for i in range(1500):
    writer.writerow([rowId[i]+1, predictions[i]])

submission.close()

In [13]:
X

Unnamed: 0,AVERAGE_FREE_FLOW_SPEED,AVERAGE_TIME_DIFF,AVERAGE_FREE_FLOW_TIME,AVERAGE_TEMPERATURE,AVERAGE_ATMOSP_PRESSURE,AVERAGE_HUMIDITY,AVERAGE_WIND_SPEED,LUMINOSITY_n,AVERAGE_CLOUDINESS_n,AVERAGE_RAIN_n,Feriado_n,Dia_n
0,41.5,11.5,71.4,15.0,1019.0,100.0,3.0,1,1,6,0,4
1,41.7,48.3,87.4,21.0,1021.0,53.0,5.0,1,1,6,0,0
2,38.6,38.4,85.2,26.0,1014.0,61.0,4.0,1,1,6,0,3
3,37.4,61.0,94.1,18.0,1025.0,48.0,4.0,1,1,6,0,5
4,41.6,50.4,77.0,15.0,1008.0,82.0,10.0,1,1,6,0,4
...,...,...,...,...,...,...,...,...,...,...,...,...
6807,41.2,3.7,86.9,9.0,1030.0,71.0,4.0,1,1,6,0,2
6808,38.9,51.9,76.9,17.0,1020.0,63.0,6.0,1,1,6,0,2
6809,39.6,0.0,89.1,15.0,1020.0,39.0,4.0,0,1,6,0,5
6810,41.6,0.0,85.5,8.0,1018.0,81.0,1.0,0,0,6,0,6
