### Import dependencies

In [10]:
import random
from src.read_data import DataReader
from src.classification import CommonClassification

### Setup parameters

In [11]:
# Relative path handed to DataReader when the reader object is created.
DATA_DIR = "../data"
# Passed as `test_size` when the selected dataset is converted with as_testable().
TRAIN_TEST_SPLIT_RATIO = 0.25
# Seed for Python's built-in `random` module, so the dataset chosen with
# random.choice is the same on every Restart & Run All. Change the value to
# sample a different dataset.
# NOTE(review): this only controls the `random` module; any randomness inside
# the project code (train/test split, classifiers) must be seeded there.
RANDOM_SEED = 42
random.seed(RANDOM_SEED)

### Create required objects

In [12]:
# Reader object for the KEEL files; DATA_DIR is its only constructor argument.
data_reader = DataReader(DATA_DIR)
# Shared object whose *_classification methods are called on the prepared
# dataset in the classification cells further down.
common_classifier = CommonClassification()

### Load all KEEL datasets from directory

In [13]:
# Read every KEEL dataset the reader can find and keep the whole collection.
keel_data = data_reader.read_keel_dat_directory()

# Report how many datasets were read as a quick sanity check.
keel_dataset_count = len(keel_data)
print('Read KEEL Datasets: %s' % keel_dataset_count)

Read KEEL Datasets: 9


### Select random KEEL dataset

In [14]:
# Fail with an explicit message when nothing was loaded; otherwise
# random.choice would raise a bare "IndexError: Cannot choose from an empty
# sequence" that does not point at the data directory.
if len(keel_data) == 0:
    raise ValueError('No KEEL datasets were read (DATA_DIR=%s)' % DATA_DIR)

# Draw one dataset using Python's global `random` generator and print its
# summary (file name, size, feature count, imbalance ratio, sample entry).
random_keel_data = random.choice(keel_data)
random_keel_data.print_info()

Keel Dataset Info:
==> File Name: led7digit-0-2-4-5-6-7-8-9_vs_1.dat
==> Size: 442
==> Features: 7
==> Imbalance Ratio: 10.945945945945946
==> Sample Entry: [0. 0. 1. 1. 0. 0. 1. 0.]


### Convert KEEL data to testable collections

In [15]:
# Convert the selected dataset into its "testable" form, passing the
# configured ratio as `test_size`. In the saved run this gives 331 train and
# 111 test rows out of 442 (see the printed info below).
# NOTE(review): whether the split is shuffled, stratified or seeded is decided
# inside as_testable — confirm there before comparing runs.
random_testable_keel_data = random_keel_data.as_testable(test_size=TRAIN_TEST_SPLIT_RATIO)
random_testable_keel_data.print_info()

Keel Testable Dataset Info:
==> File Name: led7digit-0-2-4-5-6-7-8-9_vs_1.dat
==> Size: 442
==> Features: 7
==> Classes: 2
==> Test-Train Split Ratio: 0.25
==> Train Size: 331
==> Test Size: 111


### Classify with Gaussian Naive Bayes Classifier

In [16]:
# Run the Gaussian Naive Bayes classifier on the train/test collections.
classification_result = common_classifier.naive_bayes_gaussian_classification(
    random_testable_keel_data
)

# Keep the score under its own name so it stays available after
# `classification_result` is overwritten by the next classifier cell.
# NOTE(review): accuracy is a weak metric on imbalanced data. In the saved run
# the imbalance ratio is ~10.9; assuming that is majority/minority count, always
# predicting the majority class would already score about 0.916.
naive_bayes_accuracy = classification_result.accuracy
print('Accuracy: %s' % naive_bayes_accuracy)

Accuracy: 0.9099099099099099


### Classify with Decision Tree Classifier

In [17]:
# Run the Decision Tree classifier on the same train/test collections.
classification_result = common_classifier.decision_tree_classification(
    random_testable_keel_data
)

# Keep the score under its own name so it stays available after
# `classification_result` is overwritten by the next classifier cell.
decision_tree_accuracy = classification_result.accuracy
print('Accuracy: %s' % decision_tree_accuracy)

Accuracy: 0.963963963963964


### Classify with Random Forest Classifier


In [18]:
# Run the Random Forest classifier on the same train/test collections.
classification_result = common_classifier.random_forest_classification(
    random_testable_keel_data
)

# Keep the score under its own name so the three classifiers can be compared
# side by side later.
random_forest_accuracy = classification_result.accuracy
print('Accuracy: %s' % random_forest_accuracy)

Accuracy: 0.963963963963964
