In [None]:
#Importing required Python packages 
%matplotlib inline 
import matplotlib.pyplot as plt 
import numpy as np 
from pprint import pprint 
import pandas as pd 
import zipfile 
import requests 
import io 
import datetime 
import seaborn 
from sklearn import svm
from sklearn.model_selection import GridSearchCV

# Fix the global NumPy seed so any random draws further down are reproducible.
np.random.seed(sum(map(ord, "aesthetics")))
seaborn.set_context('notebook')

# The pandas option 'display.mpl_style' no longer exists (setting it raises
# OptionError on current pandas); its deprecation notice pointed to
# matplotlib's own style sheets, so pick one directly instead.
plt.style.use('ggplot')  # Make the graphs a bit prettier
# Set the figure size last so the style sheet above cannot override it.
plt.rcParams['figure.figsize'] = (15, 5)

In [None]:
# Load the first abalone dataset
abalone = pd.read_csv('abalone.data', header=None)
# One-hot encode the string-valued columns. dtype=np.uint8 keeps the indicator
# columns numeric: newer pandas defaults to bool indicators, which would turn
# the mixed frame into an object-dtype array once converted to NumPy.
abalone = pd.get_dummies(abalone, dtype=np.uint8)

# Column 8 is the label. pop() returns that column and removes it from the
# frame, so `abalone` holds only feature columns afterwards.
# DataFrame/Series.as_matrix() was removed in pandas 1.0; to_numpy() replaces it.
Y_abalone = abalone.pop(8).to_numpy()

X_abalone = abalone.to_numpy()

In [None]:
# Load the wine dataset: a semicolon-separated numeric table.
# NOTE(review): the publicly distributed winequality-white.csv starts with a
# header row, which np.loadtxt cannot parse as floats -- confirm the local copy
# has it stripped, otherwise skiprows=1 is needed here.
wine = np.loadtxt(fname='winequality-white.csv', delimiter=';')
# The first 11 columns are the features; column index 11 is the target.
X_wine, Y_wine = wine[:, :11], wine[:, 11]

In [None]:
# Load the covtype dataset (comma-separated, parsed entirely as floats)
# and report its dimensions as a sanity check.
covtype = np.loadtxt(fname='covtype.data', delimiter=',')
print(np.shape(covtype))

In [None]:
# Columns 0-53 are the features; column 54 is the target.
X_cov, Y_cov = covtype[:, :54], covtype[:, 54]
print(*(part.shape for part in (X_cov, Y_cov)))

In [None]:
# Load the adult dataset
adult = pd.read_csv('adult.data', header=None)

# The label is the last raw column. get_dummies() below expands it into one
# indicator column per distinct value, and those indicators end up as the
# trailing columns of the encoded frame, so remember how many there are.
n_label_levels = adult.iloc[:, -1].nunique()

# One-hot encode the string-valued columns. dtype=np.uint8 keeps the indicators
# numeric (newer pandas defaults to bool, which would make the matrix
# object-dtype once mixed with the integer columns).
adult = pd.get_dummies(adult, dtype=np.uint8)
# DataFrame.as_matrix() was removed in pandas 1.0; to_numpy() replaces it.
adult_matrix = adult.to_numpy()
print(adult_matrix.shape)

# Drop *every* label indicator from the features. The previous slice
# `[:, :109]` removed only the last column and left the complementary
# "<= 50k" indicator inside X, leaking the target into the features.
X_adult = adult_matrix[:, :-n_label_levels]
Y_adult = adult_matrix[:, -1] # binary. 1 represents > 50k, 0 represents <= 50k
print(X_adult.shape, Y_adult.shape)

In [None]:
from sklearn.model_selection import train_test_split

# Hold out 20% of the abalone samples as a test set; the fixed random_state
# makes the partition repeatable between runs.
X_train_val, X_test, Y_train_val, Y_test = train_test_split(
    X_abalone,
    Y_abalone,
    test_size=0.2,
    random_state=42,
)
print(*(part.shape for part in (X_train_val, X_test, Y_train_val, Y_test)))

In [None]:
# Candidate values of C to try: 10^-6, 10^-5, ..., 10^-1.
C_list = [10 ** exponent for exponent in range(-6, 0)]
tuned = dict(C=C_list)

# Cross-validated grid search over C for a linear-kernel SVM; train scores are
# recorded alongside the validation scores.
classifier = svm.SVC(kernel='linear')
clf = GridSearchCV(classifier, param_grid=tuned, return_train_score=True)
clf.fit(X_train_val, Y_train_val)
print("Best C for linear is:", clf.best_params_['C'])