# Classification on Wine Quality Dataset - Model selection

## Imports

In [1]:
from tiblib import load_wine
from tiblib.model_selection import grid_cv_multiprior
from tiblib.preprocessing import Gaussianizer, StandardScaler, PCA

## GMM

In [None]:
from tiblib.classification import GaussianMixtureClassifier

# Load the wine dataset split; only the training portion is used in this cell.
X_train, X_test, y_train, y_test = load_wine()

# The classifier is passed as a class (not an instance) alongside the
# hyperparameter grid it is searched over.
model = GaussianMixtureClassifier
hyperparams = {
    'tied': [False, True],
    'diag': [False, True],
    'n_components': [4, 8, 16],
    'alpha': [0.1, 0.5, 1],
}
prefix = 'gmm'              # tag embedded in every results file name
pis = [0.1, 0.5, 0.9]       # values forwarded as `pis` to the search

# Preprocessing steps. `pca1` and `pca2` are instantiated here but are not
# part of any pipeline evaluated in this cell.
gaussianizer = Gaussianizer()
scaler = StandardScaler()
pca1 = PCA(n_dims=9)
pca2 = PCA(n_dims=5)

# Each entry is one preprocessing pipeline; the empty list means "raw features".
preprocessings = [[], [gaussianizer], [scaler]]

for pr in preprocessings:
    # Name the run after the string form of its steps, or 'no_preproc' when
    # the pipeline is empty.
    filename = '_'.join(map(str, pr)) if pr else 'no_preproc'
    print(filename) # Prints current preprocessings in string form
    results_path = f'results/results_{prefix}_{filename}.csv'
    grid_cv_multiprior(
        X_train, y_train,
        pis=pis,
        preprocessing=pr,
        classifier=model,
        hyperparams=hyperparams,
        filename=results_path,
    )

no_preproc
Showing results for pi = [0.1, 0.5, 0.9]
GMM (4 components, $\alpha = 0.1$)		& 0.812	& 0.326	& 0.748	\\
GMM (4 components, $\alpha = 0.5$)		& 0.847	& 0.327	& 0.695	\\
GMM (4 components, $\alpha = 1$)		& 0.772	& 0.321	& 0.740	\\
GMM (8 components, $\alpha = 0.1$)		& 0.842	& 0.330	& 0.786	\\
GMM (8 components, $\alpha = 0.5$)		& 0.784	& 0.325	& 0.802	\\
GMM (8 components, $\alpha = 1$)		& 0.725	& 0.300	& 0.775	\\
GMM (16 components, $\alpha = 0.1$)		& 0.850	& 0.350	& 0.893	\\
GMM (16 components, $\alpha = 0.5$)		& 0.830	& 0.346	& 0.950	\\
GMM (16 components, $\alpha = 1$)		& 0.679	& 0.303	& 0.852	\\
GMM (Diag, 4 components, $\alpha = 0.1$)		& 0.801	& 0.400	& 0.847	\\
GMM (Diag, 4 components, $\alpha = 0.5$)		& 0.865	& 0.376	& 0.828	\\
GMM (Diag, 4 components, $\alpha = 1$)		& 0.837	& 0.316	& 0.781	\\
GMM (Diag, 8 components, $\alpha = 0.1$)		& 0.894	& 0.388	& 0.852	\\
GMM (Diag, 8 components, $\alpha = 0.5$)		& 0.851	& 0.375	& 0.839	\\
GMM (Diag, 8 components, $\alpha = 1$)		&