In [None]:
from __future__ import print_function

from sklearn import datasets
import pandas
import numpy
from sklearn.model_selection import train_test_split
from sklearn.model_selection import GridSearchCV
from sklearn.metrics import classification_report
import matplotlib.pyplot as plt
from sklearn.svm import SVC
from sklearn.neighbors import KNeighborsClassifier
from sklearn.tree import DecisionTreeClassifier
from sklearn.ensemble import RandomForestClassifier
from sklearn.preprocessing import MinMaxScaler


In [None]:
# Load the scikit-learn handwritten-digits dataset.
digits = datasets.load_digits()
# A bare expression in the middle of a cell is silently discarded, so print
# the shape of the flattened data explicitly to actually display it.
print(digits.data.shape)
# Set the default image colormap directly: plt.gray() has the same effect on
# the default but also opens an empty current figure before matshow() creates
# its own, which shows up as a stray blank figure.
plt.rcParams['image.cmap'] = 'gray'
# Preview the first sample image.
plt.matshow(digits.images[0])
plt.show()

In [None]:
# Flatten each image into one feature row so the estimators receive a 2-D
# (samples, features) matrix; the labels come straight from the dataset.
n_samples = len(digits.images)
x = digits.images.reshape(n_samples, -1)
y = digits.target

# Hold out half of the data for testing; the fixed random_state makes the
# split repeatable across runs.
x_train, x_test, y_train, y_test = train_test_split(
    x,
    y,
    test_size=0.5,
    random_state=0,
)
# Show the training features as the cell output.
x_train

In [None]:
# Single seed shared by every stochastic estimator below.
RANDOM_SEED = 10

# numpy.random.seed() returns None, so writing
# `random_state=numpy.random.seed(10)` passed random_state=None and merely
# seeded the global RNG as a side effect. The estimators now receive the
# integer seed directly, which makes every fit reproducible regardless of
# cell execution order. The global RNG is still seeded once here so that any
# other code drawing from it sees the same state as before.
numpy.random.seed(RANDOM_SEED)

# Candidate models paired with the hyper-parameter grid to search for each:
#   'clf'    -- the unfitted estimator instance
#   'params' -- mapping of parameter name to the values to try
classifiers = [
    {
        'clf': KNeighborsClassifier(),
        'params': {'n_neighbors': range(1, 5)},
    },
    {
        'clf': DecisionTreeClassifier(random_state=RANDOM_SEED),
        'params': {
            'criterion': ['gini', 'entropy'],
            'max_depth': range(6, 20),
            'min_samples_split': range(2, 10),
            'min_samples_leaf': range(1, 10),
        },
    },
    {
        'clf': RandomForestClassifier(random_state=RANDOM_SEED),
        'params': {
            'n_estimators': range(40, 60),
            'criterion': ['gini', 'entropy'],
            'max_depth': range(5, 10),
        },
    },
]

In [None]:
# Tune each candidate model with a 10-fold cross-validated grid search on the
# training half, then report how the refitted best model does on the test half.
for cls in classifiers:
    clf = GridSearchCV(estimator=cls['clf'], param_grid=cls['params'], cv=10)
    clf.fit(x_train, y_train)

    print('model:', cls['clf'])
    print("Best parameters set found on development set:", clf.best_params_)

    # One line per parameter combination: mean CV score and twice its
    # standard deviation across the folds.
    print("Grid scores on development set:")
    results = clf.cv_results_
    means = results['mean_test_score']
    stds = results['std_test_score']
    for idx, params in enumerate(results['params']):
        summary = (means[idx], stds[idx] * 2, params)
        print("%0.3f (+/-%0.03f) for %r" % summary)
    print()

    # Per-class precision/recall/F1 on the held-out test data.
    y_true = y_test
    y_pred = clf.predict(x_test)
    print(classification_report(y_true, y_pred))
