# Data Processing

In [29]:
import numpy as np
import pandas as pd
from sklearn import datasets
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.metrics import accuracy_score

In [30]:
# Load Iris and keep only feature columns 0 and 3
# (sepal length and petal width in load_iris' documented feature order).
iris = datasets.load_iris()
X, y = iris.data[:, [0, 3]], iris.target

# Hold out 30% of the samples; random_state pins the shuffle so the split is reproducible.
x_train, x_test, y_train, y_test = train_test_split(
    X, y, test_size=0.3, random_state=0
)

# Fit the scaler on the training split only, then apply that same scaling
# to both splits so no test-set statistics leak into preprocessing.
sc = StandardScaler().fit(x_train)
x_train, x_test = sc.transform(x_train), sc.transform(x_test)

# 1. Perceptron

In [106]:
from sklearn.linear_model import Perceptron

In [115]:
# Train a Perceptron on the standardized training split and predict the hold-out split.
ppn = Perceptron(eta0=0.1, max_iter=88, tol=0.001, random_state=0).fit(x_train, y_train)
y_pred = ppn.predict(x_test)

# accuracy_score is documented as accuracy_score(y_true, y_pred). Accuracy is
# symmetric so the number is unchanged, but the documented order is used so the
# call stays correct if it is ever swapped for an asymmetric metric.
print("Accuracy: %0.2f" % accuracy_score(y_test, y_pred))
# Estimator.score() on the training split shows how well the model fits the data it saw.
print("Accuracy in training: %0.2f" % ppn.score(x_train, y_train))


Accuracy: 0.96
Accuracy in training: 0.93


# 2. Adaline

In [39]:
from sklearn.linear_model import SGDClassifier

In [119]:
# Train a linear classifier with stochastic gradient descent and predict the hold-out split.
# NOTE(review): per the scikit-learn docs, SGDClassifier defaults to loss='hinge' and
# learning_rate='optimal', and eta0 is only used by the 'constant', 'invscaling' and
# 'adaptive' schedules. As written this is presumably a linear SVM with eta0 ignored,
# not Adaline -- confirm whether a squared-error loss with learning_rate='constant'
# was intended. Left unchanged here so the recorded results stay valid.
ada = SGDClassifier(eta0=0.1, max_iter=88, tol=0.001, random_state=0)
ada.fit(x_train, y_train)
y_pred = ada.predict(x_test)

# accuracy_score is documented as accuracy_score(y_true, y_pred); accuracy is
# symmetric, so the printed value is the same as before.
print("Accuracy: %.2f" % accuracy_score(y_test, y_pred))
print("Accuracy of training data: %.2f" % ada.score(x_train, y_train))

Accuracy: 0.82
Accuracy of training data: 0.86


# 3. Logistic Regression

In [27]:
from sklearn.linear_model import LogisticRegression

In [32]:
# Train a logistic-regression classifier on the standardized training split
# and predict the hold-out split.
reg = LogisticRegression(max_iter=88, tol=0.001, random_state=0).fit(x_train, y_train)
y_pred = reg.predict(x_test)

# accuracy_score is documented as accuracy_score(y_true, y_pred); accuracy is
# symmetric, so the printed value is the same as before.
print("Accuracy: %.2f" % accuracy_score(y_test, y_pred))
# Label text is kept exactly as originally written so it matches the recorded output.
print("Accurscy of training data: %0.2f" % reg.score(x_train,y_train))

Accuracy: 0.80
Accurscy of training data: 0.88




# 4. Gaussian Naive Bayes

In [131]:
from sklearn.naive_bayes import GaussianNB

In [132]:
# Train a Gaussian naive Bayes classifier (default settings) and predict the hold-out split.
gnb = GaussianNB().fit(x_train, y_train)
y_pred = gnb.predict(x_test)

# accuracy_score is documented as accuracy_score(y_true, y_pred); accuracy is
# symmetric, so the printed value is the same as before.
print("Accuracy: %.2f" % accuracy_score(y_test, y_pred))
print("Accuracy of the training data: %.2f" % gnb.score(x_train, y_train))

Accuracy: 0.98
Accuracy of the training data: 0.95


# 5. Support Vector Machine

In [86]:
from sklearn.svm import SVC

In [90]:
# Train a linear-kernel support vector classifier with penalty parameter C=88
# and predict the hold-out split.
svm = SVC(kernel='linear', C=88, random_state=0)
svm.fit(x_train, y_train)
y_pred = svm.predict(x_test)

# accuracy_score is documented as accuracy_score(y_true, y_pred); accuracy is
# symmetric, so the printed value is the same as before.
print("Accuracy: %0.2f" % accuracy_score(y_test, y_pred))
# Label text is kept exactly as originally written so it matches the recorded output.
print("Accuract of training data: %0.2f" % svm.score(x_train, y_train))

Accuracy: 0.98
Accuract of training data: 0.95


# 6. k-Nearest Neighbors

In [127]:
from sklearn.neighbors import KNeighborsClassifier

In [130]:
# Train a 1-nearest-neighbour classifier and predict the hold-out split.
knn = KNeighborsClassifier(n_neighbors=1).fit(x_train, y_train)
y_pred = knn.predict(x_test)

# accuracy_score is documented as accuracy_score(y_true, y_pred); accuracy is
# symmetric, so the printed value is the same as before.
print("Accuracy: %.2f" % accuracy_score(y_test, y_pred))
print("Accuracy of training data: %.2f" % knn.score(x_train, y_train))

Accuracy: 0.93
Accuracy of training data: 0.98


# 7. Decision Tree

In [91]:
from sklearn.tree import DecisionTreeClassifier

In [97]:
# Train an entropy-criterion decision tree capped at depth 3 and predict the hold-out split.
clf = DecisionTreeClassifier(criterion='entropy', max_depth=3, random_state=0)
clf.fit(x_train, y_train)
y_pred = clf.predict(x_test)

# accuracy_score is documented as accuracy_score(y_true, y_pred); accuracy is
# symmetric, so the printed value is the same as before.
print("Accuracy: %0.2f" % accuracy_score(y_test, y_pred))
print("Accuracy of training data: %.2f" % clf.score(x_train, y_train))

Accuracy: 0.98
Accuracy of training data: 0.95


# 8. Random Forest Classifier

In [95]:
from sklearn.ensemble import RandomForestClassifier

In [135]:
# Train a small random forest (3 entropy-criterion trees, each capped at depth 3)
# and predict the hold-out split.
# Note: this rebinds `clf`, which the decision-tree cell also assigns.
clf = RandomForestClassifier(
    criterion='entropy', max_depth=3, n_estimators=3, random_state=0
).fit(x_train, y_train)
y_pred = clf.predict(x_test)

# accuracy_score is documented as accuracy_score(y_true, y_pred); accuracy is
# symmetric, so the printed value is the same as before.
print("Accuracy: %.2f" % accuracy_score(y_test, y_pred))
print("Accuracy of training data: %0.2f" % clf.score(x_train, y_train))

Accuracy: 0.98
Accuracy of training data: 0.95


# Important scikit-learn imports (quick reference)

In [39]:
# Classifiers
from sklearn.linear_model import Perceptron
from sklearn.linear_model import SGDClassifier # Adaline
from sklearn.linear_model import LogisticRegression
from sklearn.naive_bayes import GaussianNB
from sklearn.svm import SVC
from sklearn.neighbors import KNeighborsClassifier
from sklearn.tree import DecisionTreeClassifier, export_graphviz
from sklearn.ensemble import RandomForestClassifier


# Dimensionality reduction, pipelines, model selection and preprocessing
from sklearn.decomposition import PCA, KernelPCA   # n_components
from sklearn.discriminant_analysis import LinearDiscriminantAnalysis # n_components
from sklearn.pipeline import Pipeline # Pipeline()
from sklearn.model_selection import GridSearchCV, KFold, StratifiedKFold, cross_val_score, learning_curve
from sklearn.preprocessing import LabelEncoder,StandardScaler,OneHotEncoder

# sklearn.preprocessing.Imputer was removed in scikit-learn 0.22; its replacement
# is sklearn.impute.SimpleImputer (available since 0.20). Try the old name first so
# environments where this cell already worked keep exposing `Imputer`, and fall
# back to `SimpleImputer` so the cell no longer raises ImportError on newer releases.
try:
    from sklearn.preprocessing import Imputer
except ImportError:
    from sklearn.impute import SimpleImputer