# Classifying the digits dataset with PolyACO+

In [20]:
from sklearn import datasets, neighbors, linear_model
# `sklearn.cross_validation` was deprecated in scikit-learn 0.18 and removed in
# 0.20; import from `model_selection` and fall back only on old installations.
try:
    from sklearn.model_selection import train_test_split
except ImportError:
    from sklearn.cross_validation import train_test_split
from sklearn.svm import SVC

import sys
import os.path as osp
import time
# '__file__' is a plain string here, so abspath() resolves it against the
# current working directory; the two dirname() calls then yield the parent of
# the working directory, which is appended to the import path.
# NOTE(review): presumably that is where `acoc`, `utils` and `config` live — confirm.
sys.path.append(osp.dirname(osp.dirname(osp.abspath('__file__'))))

import acoc
import utils
from config import CLASSIFIER_CONFIG

In [21]:
# Load scikit-learn's bundled digits dataset; its `.data` and `.target`
# attributes are read later in the notebook.
data_set = datasets.load_digits()

In [22]:
# Feature matrix and class labels taken from the loaded dataset.
X = data_set.data
y = data_set.target
# Hold out 33% of the samples for testing. The fixed seed makes this split
# (and anything trained on it) reproducible across kernel restarts.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.33, random_state=0)

# Distinct class labels in ascending order; iterating a bare set gives no
# ordering guarantee, so sort explicitly.
class_indices = sorted(set(y))

## SVM classification

In [23]:
# Average SVC test score (in percent) over 100 random train/test splits.
r = []
for seed in range(100):
    # One seed per repetition keeps the averaged score reproducible. The split
    # is stored under separate names so the notebook-level
    # X_train/X_test/y_train/y_test used by later cells are not overwritten.
    X_fit, X_eval, y_fit, y_eval = train_test_split(
        X, y, test_size=0.33, random_state=seed)
    clf = SVC(gamma=0.001)
    clf.fit(X_fit, y_fit)
    r.append(clf.score(X_eval, y_eval) * 100)
print("Classification score: {}".format(sum(r) / len(r)))

Classification score: 98.97643097643106


## k-nearest neighbors classification

In [24]:
# Average k-nearest-neighbors test score (in percent) over 100 random
# train/test splits, using the classifier's default settings.
r = []
for seed in range(100):
    # One seed per repetition keeps the averaged score reproducible. The split
    # is stored under separate names so the notebook-level
    # X_train/X_test/y_train/y_test used by later cells are not overwritten.
    X_fit, X_eval, y_fit, y_eval = train_test_split(
        X, y, test_size=0.33, random_state=seed)
    clf = neighbors.KNeighborsClassifier()
    clf.fit(X_fit, y_fit)
    r.append(clf.score(X_eval, y_eval) * 100)
print("Classification score: {}".format(sum(r) / len(r)))

Classification score: 98.43265993265992


## Logistic regression

In [25]:
# Average logistic-regression test score (in percent) over 100 random
# train/test splits, using the classifier's default settings.
r = []
for seed in range(100):
    # One seed per repetition keeps the averaged score reproducible. The split
    # is stored under separate names so the notebook-level
    # X_train/X_test/y_train/y_test used by later cells are not overwritten.
    X_fit, X_eval, y_fit, y_eval = train_test_split(
        X, y, test_size=0.33, random_state=seed)
    clf = linear_model.LogisticRegression()
    clf.fit(X_fit, y_fit)
    r.append(clf.score(X_eval, y_eval) * 100)
print("Classification score: {}".format(sum(r) / len(r)))

Classification score: 95.55892255892259


## PolyACO+ classification

In [26]:
# Override two settings on the imported CLASSIFIER_CONFIG object in place,
# before it is handed to the PolyACO classifier in the next cell.
# NOTE(review): the meaning and valid range of `max_level` and
# `level_convergence_rate` are defined in the project's config/acoc modules,
# not here — confirm against those before tuning.
CLASSIFIER_CONFIG.max_level = 3
CLASSIFIER_CONFIG.level_convergence_rate = 2000

In [None]:
# Train PolyACO+ once on the current notebook-level train/test split and
# report the score computed from its predictions on the held-out samples.
n_features = X.shape[1]
clf = acoc.PolyACO(n_features, class_indices, CLASSIFIER_CONFIG)
clf.train(X_train, y_train)
predictions = clf.evaluate(X_test)
polyaco_score = acoc.compute_score(predictions, y_test)
# The leading "\r" moves the cursor back to the start of the line —
# presumably to overwrite progress output from training (TODO confirm).
print("\rClassification score: {}".format(polyaco_score))