## Importing the libraries

In [1]:
import pandas as pd

## Importing the dataset

In [2]:
# Read the CSV, then separate predictors from the target:
# the first column is skipped, the last column is the label,
# and everything in between becomes the feature matrix.
dataset = pd.read_csv('breast_cancer.csv')
feature_frame = dataset.iloc[:, 1:-1]
target_series = dataset.iloc[:, -1]
X, y = feature_frame.values, target_series.values

## Splitting the dataset into the Training set and Test set

In [3]:
from sklearn.model_selection import train_test_split
# Hold out 20% of the samples for testing; the seed is fixed so the
# split is the same on every run.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=0,
)

## Training the Logistic Regression model on the Training set

In [4]:
from sklearn.linear_model import LogisticRegression
# Logistic regression with a fixed seed, fitted on the training split.
# The fit call stays as the cell's last expression so the fitted
# estimator is echoed as the cell output.
classifier = LogisticRegression(random_state=0)
classifier.fit(X=X_train, y=y_train)

LogisticRegression(random_state=0)

## Predicting the Test set results

In [5]:
# Predicted labels for the held-out test split (logistic regression).
y_pred = classifier.predict(X=X_test)

## Making the Confusion Matrix

In [6]:
from sklearn.metrics import confusion_matrix
# Confusion matrix for the logistic-regression predictions:
# rows are the actual classes, columns the predicted classes.
cm = confusion_matrix(y_true=y_test, y_pred=y_pred)
print(cm)

[[84  3]
 [ 3 47]]


In [7]:
from sklearn.metrics import accuracy_score
# Fraction of test samples the logistic-regression model labelled correctly.
accuracy_score(y_true=y_test, y_pred=y_pred)

0.9562043795620438

## Computing the accuracy with k-Fold Cross Validation

In [8]:
from sklearn.model_selection import cross_val_score
# 10-fold cross-validation of the logistic-regression model on the
# training split; report mean and spread of the fold scores as percentages.
accuracies = cross_val_score(classifier, X_train, y_train, cv=10)
lr_mean_pct = accuracies.mean() * 100
lr_std_pct = accuracies.std() * 100
print("Accuracy: {:.2f} %".format(lr_mean_pct))
print("Standard Deviation: {:.2f} %".format(lr_std_pct))

Accuracy: 96.70 %
Standard Deviation: 1.97 %


## KNN

In [9]:
from sklearn.neighbors import KNeighborsClassifier
# 5-nearest-neighbours classifier. Minkowski distance with p = 2 is the
# ordinary Euclidean distance.
knn_params = {'n_neighbors': 5, 'metric': 'minkowski', 'p': 2}
classifierKNN = KNeighborsClassifier(**knn_params)
classifierKNN.fit(X=X_train, y=y_train)

KNeighborsClassifier()

In [10]:
from sklearn.metrics import confusion_matrix, accuracy_score
# Evaluate KNN on the test split: print the confusion matrix, then leave
# the accuracy as the cell's displayed value.
y_predKNN = classifierKNN.predict(X=X_test)
cm = confusion_matrix(y_true=y_test, y_pred=y_predKNN)
print(cm)
accuracy_score(y_true=y_test, y_pred=y_predKNN)

[[84  3]
 [ 1 49]]


0.9708029197080292

In [11]:
# 10-fold cross-validation of the KNN model on the training split.
accuraciesKNN = cross_val_score(classifierKNN, X_train, y_train, cv=10)
knn_mean_pct = accuraciesKNN.mean() * 100
knn_std_pct = accuraciesKNN.std() * 100
print("Accuracy: {:.2f} %".format(knn_mean_pct))
print("Standard Deviation: {:.2f} %".format(knn_std_pct))

Accuracy: 97.44 %
Standard Deviation: 1.85 %


## Kernel SVM

In [12]:
from sklearn.svm import SVC
# Support-vector classifier with an RBF kernel and a fixed seed,
# fitted on the training split.
svm_params = {'kernel': 'rbf', 'random_state': 0}
classifierkSVM = SVC(**svm_params)
classifierkSVM.fit(X=X_train, y=y_train)

SVC(random_state=0)

In [13]:
# Evaluate the kernel SVM on the test split: print the confusion matrix,
# then leave the accuracy as the cell's displayed value.
y_predSVM = classifierkSVM.predict(X=X_test)
cm = confusion_matrix(y_true=y_test, y_pred=y_predSVM)
print(cm)
accuracy_score(y_true=y_test, y_pred=y_predSVM)

[[83  4]
 [ 1 49]]


0.9635036496350365

In [14]:
# 10-fold cross-validation of the kernel SVM on the training split.
accuraciesSVM = cross_val_score(classifierkSVM, X_train, y_train, cv=10)
svm_mean_pct = accuraciesSVM.mean() * 100
svm_std_pct = accuraciesSVM.std() * 100
print("Accuracy: {:.2f} %".format(svm_mean_pct))
print("Standard Deviation: {:.2f} %".format(svm_std_pct))

Accuracy: 96.89 %
Standard Deviation: 2.17 %


## Naive Bayes

In [15]:
from sklearn.naive_bayes import GaussianNB
# Gaussian Naive Bayes with its default settings, fitted on the training
# split. The fit call is kept last so the estimator is echoed.
classifierNB = GaussianNB()
classifierNB.fit(X=X_train, y=y_train)

GaussianNB()

In [16]:
# Evaluate Naive Bayes on the test split: print the confusion matrix,
# then leave the accuracy as the cell's displayed value.
y_predNB = classifierNB.predict(X=X_test)
cm = confusion_matrix(y_true=y_test, y_pred=y_predNB)
print(cm)
accuracy_score(y_true=y_test, y_pred=y_predNB)

[[80  7]
 [ 0 50]]


0.948905109489051

In [17]:
# 10-fold cross-validation of the Naive Bayes model on the training split.
accuraciesNB = cross_val_score(classifierNB, X_train, y_train, cv=10)
nb_mean_pct = accuraciesNB.mean() * 100
nb_std_pct = accuraciesNB.std() * 100
print("Accuracy: {:.2f} %".format(nb_mean_pct))
print("Standard Deviation: {:.2f} %".format(nb_std_pct))

Accuracy: 96.52 %
Standard Deviation: 2.24 %


## Random Forest Classifier

In [18]:
from sklearn.ensemble import RandomForestClassifier
# Random forest of 10 trees using the entropy split criterion and a
# fixed seed, fitted on the training split.
rfc_params = {'n_estimators': 10, 'criterion': 'entropy', 'random_state': 0}
classifierRFC = RandomForestClassifier(**rfc_params)
classifierRFC.fit(X=X_train, y=y_train)

RandomForestClassifier(criterion='entropy', n_estimators=10, random_state=0)

In [19]:
# Evaluate the random forest on the test split: print the confusion
# matrix, then leave the accuracy as the cell's displayed value.
y_predRFC = classifierRFC.predict(X=X_test)
cm = confusion_matrix(y_true=y_test, y_pred=y_predRFC)
print(cm)
accuracy_score(y_true=y_test, y_pred=y_predRFC)

[[83  4]
 [ 3 47]]


0.948905109489051

In [20]:
# 10-fold cross-validation of the random forest on the training split.
accuraciesRFC = cross_val_score(classifierRFC, X_train, y_train, cv=10)
rfc_mean_pct = accuraciesRFC.mean() * 100
rfc_std_pct = accuraciesRFC.std() * 100
print("Accuracy: {:.2f} %".format(rfc_mean_pct))
print("Standard Deviation: {:.2f} %".format(rfc_std_pct))

Accuracy: 96.33 %
Standard Deviation: 2.01 %
