# **Testing best model on Blind Test set (ML-CUP22)**

In [None]:
# Importing libraries
import pandas as pd
import numpy as np
import seaborn as sns
import csv

# SVM
from sklearn.svm import SVR
from sklearn.multioutput import MultiOutputRegressor

In [None]:
# Mount Google Drive at /content/drive so the dataset CSVs stored on Drive can
# be read by path in the cells below. force_remount=True is passed so the mount
# is redone even when Drive is already mounted in this session.
from google.colab import drive
drive.mount('/content/drive', force_remount=True)

------
## **Data preparation**

In [None]:
# Read the ML-CUP22 training CSV from Drive.
# The file is parsed without a header row: column names are supplied
# explicitly and '#'-prefixed lines are skipped as comments.
path_TR = '/content/drive/MyDrive/data/Data_CUP/ML-CUP22-TR.csv'
# Nine attribute columns (a1..a9) followed by the two target columns.
col_names_TR = [f'a{i}' for i in range(1, 10)] + ['x', 'y']
data_TR = pd.read_csv(path_TR, comment='#', names=col_names_TR)
# Display (rows, columns) as the cell output.
data_TR.shape

In [None]:
# Read the ML-CUP22 blind test CSV from Drive.
# Same parsing rules as the training file, but only the nine attribute
# columns are named because the blind set carries no targets.
path_TS = '/content/drive/MyDrive/data/Data_CUP/ML-CUP22-TS.csv'
col_names_TS = [f'a{i}' for i in range(1, 10)]
data_TS = pd.read_csv(path_TS, comment='#', names=col_names_TS)
# Display (rows, columns) as the cell output.
data_TS.shape

In [None]:
# Separate the training frame into inputs and targets:
# every column except the last two is a feature, 'x' and 'y' are the targets.
X_train = data_TR.iloc[:, :-2]
y_train = data_TR.loc[:, ['x', 'y']]

# Report both shapes, followed by a blank line.
print(
    f'X_train shape: {X_train.shape}',
    f'y_train shape: {y_train.shape}',
    '',
    sep='\n',
)

In [None]:
# Build the test feature matrix. The blind set has no target columns, so all
# rows and all columns of data_TS are selected as inputs.
X_test = data_TS.loc[:,:]
print(f'X_test shape: {X_test.shape}')

----
## **Support Vector Machine (SVM) - Radial Basis Function (RBF)**

In [None]:
# Final SVM configuration: an RBF-kernel SVR wrapped in MultiOutputRegressor,
# which fits one independent regressor per target column.
model_svm = MultiOutputRegressor(
    SVR(
        kernel='rbf',
        gamma='auto',
        C=4,
        epsilon=0.22,
    )
)

In [None]:
# Train the multi-output SVR on the full training set.
model_svm.fit(X=X_train, y=y_train)

In [None]:
# Predict the targets for every row of the blind test set.
y_pred = model_svm.predict(X=X_test)

In [None]:
# Write the blind-test predictions to a CSV file on Drive:
# four '#' header lines, then one row per sample made of a 1-based row id
# followed by the predicted values.
filename = '/content/drive/MyDrive/NoPt_ML-CUP22-TS.csv'

# Wrap the predictions in a DataFrame and number the rows starting from 1.
df = pd.DataFrame(y_pred)
df.index = np.arange(len(df)) + 1

# Create (or overwrite) the file with the header lines first.
with open(filename, 'w') as f:
    f.writelines([
        '# Cosimo Faeti Riccardo Galarducci\n',
        '# NoPt\n',
        '# ML-CUP22\n',
        '# 06/07/2023\n',
    ])

# Append the prediction rows below the header; the index is emitted as the
# first column and no column-name row is written.
df.to_csv(filename, mode='a', index=True, header=False)