In [1]:
from sklearn.svm import SVC
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn import datasets
from sklearn.metrics import accuracy_score

In [None]:
# Load the breast cancer dataset bundled with scikit-learn and pull out
# the feature matrix (X) and the target labels (y).
b_cancer = datasets.load_breast_cancer()
X, y = b_cancer.data, b_cancer.target

# Quick sanity check on the dimensions of the features and the labels.
print(X.shape, y.shape, sep="\n")

# Hold out 30% of the samples for testing. The split is stratified on the
# labels and uses a fixed random_state so that it is repeatable.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.3,
    random_state=1,
    stratify=y,
)

In [3]:
# Standardize the features to zero mean and unit standard deviation.
# The scaler learns its mean and std from the training split only
# (fit returns the fitted scaler itself, so it can be chained).
sc = StandardScaler().fit(X_train)

# Apply the training-set statistics to both splits, so the test data is
# scaled with exactly the same parameters as the training data.
X_train_std, X_test_std = sc.transform(X_train), sc.transform(X_test)

In [None]:
# Build the Support Vector Classifier (SVC).
# The kernel can be swapped to experiment: 'linear', 'poly' or 'rbf'.
svc = SVC(
    kernel='linear',
    C=1.0,
    random_state=1,
)

# Train the classifier on the standardized training data.
svc.fit(X_train_std, y_train)

In [None]:
# Predict the labels of the standardized test samples.
y_predict = svc.predict(X_test_std)

# Report the accuracy of the predictions against the true test labels.
print(accuracy_score(y_true=y_test, y_pred=y_predict))