In [None]:
import numpy as np
import matplotlib.pyplot as plt
from matplotlib.colors import LogNorm
from sklearn import mixture
%matplotlib inline

from plotting.plots import *

# Seed NumPy's global random generator so the samples drawn with
# np.random.randn in the following cells are reproducible.
np.random.seed(0)

In [None]:
# Build the "correlated data" figure: one stretched Gaussian cloud, the
# contours of the negated scores of a one-component Gaussian mixture fitted to
# it, and three annotated reference points O, A and B.
n_samples = 300

# Spherical cloud centred on (20, 20). It is not fitted or plotted in this
# cell, but the draw is kept on purpose: it advances the global RNG, so
# removing it would change `stretched_gaussian` below and hence the figure.
shifted_gaussian = np.random.randn(n_samples, 2) + np.array([20, 20])

# Zero-centred Gaussian sample multiplied by C, which mixes the two
# coordinates and therefore correlates them.
C = np.array([[0., -0.4], [3, .6]])
stretched_gaussian = np.dot(np.random.randn(n_samples, 2), C)

# Only the stretched cloud is used as training data for this figure.
X_train = stretched_gaussian
# Reference points highlighted on the plot; rows are B, A, O in that order
# (see the annotate calls below).
X_o = np.array([[0,1], [2,0], [0,0]])

# Fit a single full-covariance Gaussian (a mixture with one component).
clf = mixture.GaussianMixture(n_components=1, covariance_type='full')
clf.fit(X_train)

# Evaluate the negated per-point scores of the model on a regular grid
# covering the plotted region, then reshape them to the grid for contouring.
x = np.linspace(-10., 10.)
y = np.linspace(-2.5, 2.5)
X, Y = np.meshgrid(x, y)
XX = np.array([X.ravel(), Y.ravel()]).T
Z = -clf.score_samples(XX)
Z = Z.reshape(X.shape)

# Contours at six log-spaced levels between 1 and 10, the training points as
# small markers, and the reference points as red circles.
CS = plt.contour(X, Y, Z, cmap=plt.cm.RdBu, levels=np.logspace(0, 1, 6), linewidths=(1,))
# CB = plt.colorbar(CS, shrink=0.8, extend='both')
plt.scatter(X_train[:, 0], X_train[:, 1], 5)
plt.plot(X_o[:, 0], X_o[:, 1], 'or')

# Arrow style shared by all annotations: a translucent wedge with no edge.
arrowd = dict(
    arrowstyle="wedge,tail_width=1.",
    fc=(1.0, 0.7, 0.7, .5), ec=(1., .7, .7, .0),
    patchA=None, #patchB=el,
    relpos=(0.2, 0.8),
    connectionstyle="arc3,rad=-0.1"
)

# Keyword arguments common to every annotate call; later cells reuse this
# dict, so it must stay defined at notebook level.
commond = dict(
    xycoords='data', textcoords='offset points',
    bbox=dict(boxstyle="round", fc=(1., .7, .7), ec=(.0, .0, .0, 0), ),
    arrowprops=arrowd
)

# Label the reference points; xytext is an offset in points from each target.
plt.annotate('O', xy=(X_o[2,0], X_o[2,1]), xytext=(-8, -50), size=20, **commond)
plt.annotate('A', xy=(X_o[1,0], X_o[1,1]), xytext=(20, -40), size=20, **commond)
plt.annotate('B', xy=(X_o[0,0], X_o[0,1]), xytext=(-50, 10), size=20, **commond)


# plt.title('Correlated data')
plt.axis('tight')

# commonStyles comes from the star import of plotting.plots.
commonStyles(plt.gca())
plt.gcf().set_size_inches(10, 2.5)
plt.tight_layout(pad=0.0, w_pad=1.0, h_pad=3.0)
plt.savefig('../thesis-distance-metric-learning/graphs/correlated_data.pdf')
plt.show()

In [None]:
from metric_learn import Covariance

# Re-seed the global RNG so this cell draws the same samples on every run.
np.random.seed(0)

n_samples = 300

# Isotropic cloud shifted to (20, 20); it must be drawn before the stretched
# cloud so the random stream is consumed in the same order as before.
shifted_gaussian = np.array([20, 20]) + np.random.randn(n_samples, 2)

# Zero-centred sample multiplied by C, which correlates the two coordinates.
C = np.array([[0., -0.4], [3, .6]])
stretched_gaussian = np.random.randn(n_samples, 2).dot(C)

# Stacked two-cloud set; not used in this cell's figure but left bound as
# X_train for the cells that follow.
X_train = np.vstack((shifted_gaussian, stretched_gaussian))

# Fit metric_learn's Covariance transformer on the stretched cloud and map
# both the cloud and the reference points (rows: B, A, O) through it.
tr = Covariance()
X_train_t = tr.fit_transform(stretched_gaussian)
X_o = tr.transform(np.array([[0,1], [2,0], [0,0]]))

# Single full-covariance Gaussian fitted to the transformed cloud.
clf = mixture.GaussianMixture(covariance_type='full', n_components=1)
clf.fit(X_train_t)

# Negated model scores on a regular grid, shaped like the grid for contouring.
x = np.linspace(-10., 10.)
y = np.linspace(-2.5, 2.5)
X, Y = np.meshgrid(x, y)
XX = np.vstack((X.ravel(), Y.ravel())).T
Z = (-clf.score_samples(XX)).reshape(X.shape)

CS = plt.contour(X, Y, Z, levels=np.logspace(0, 1, 6), cmap=plt.cm.RdBu, linewidths=(1,))
# CB = plt.colorbar(CS, shrink=0.8, extend='both')
plt.scatter(X_train_t[:, 0], X_train_t[:, 1], s=5)
plt.plot(X_o[:, 0], X_o[:, 1], 'or')

# Annotate O, A, B in that order; each entry is (label, row of X_o, text
# offset in points). `commond` is the shared annotation style defined in the
# correlated-data cell.
for label, row, offset in (('O', 2, (-60, -50)), ('A', 1, (40, -30)), ('B', 0, (40, -20))):
    plt.annotate(label, xy=(X_o[row, 0], X_o[row, 1]), xytext=offset, size=20, **commond)

plt.axis('tight')

# Apply the shared axes styling, fix the figure size, and write the PDF.
commonStyles(plt.gca())
plt.gcf().set_size_inches(10, 2.5)
plt.tight_layout(pad=0.0, w_pad=1.0, h_pad=3.0)
plt.savefig('../thesis-distance-metric-learning/graphs/uncorrelated_data.pdf')
plt.show()

In [None]:
from sklearn.decomposition import PCA

# Same figure as the Covariance-transformed one, but whitening the stretched
# cloud with PCA instead. Relies on `stretched_gaussian` from an earlier cell.
pca = PCA(n_components=2, whiten=True)
X_train_t = pca.fit_transform(stretched_gaussian)

# Reference points (rows: B, A, O). They are mapped with the PCA fitted just
# above so they share the coordinate system of X_train_t; using the Covariance
# transformer `tr` here would plot them in a different space than the scatter.
X_o = np.array([[0,1], [2,0], [0,0]])
X_o = pca.transform(X_o)

# Fit a single full-covariance Gaussian (a mixture with one component).
clf = mixture.GaussianMixture(n_components=1, covariance_type='full')
clf.fit(X_train_t)

# Evaluate the negated per-point scores of the model on a regular grid and
# reshape them to the grid for contouring.
x = np.linspace(-10., 10.)
y = np.linspace(-2.5, 2.5)
X, Y = np.meshgrid(x, y)
XX = np.array([X.ravel(), Y.ravel()]).T
Z = -clf.score_samples(XX)
Z = Z.reshape(X.shape)

# Contours at six log-spaced levels, transformed training points as small
# markers, and the transformed reference points as red circles.
CS = plt.contour(X, Y, Z, cmap=plt.cm.RdBu, levels=np.logspace(0, 1, 6), linewidths=(1,))
# CB = plt.colorbar(CS, shrink=0.8, extend='both')
plt.scatter(X_train_t[:, 0], X_train_t[:, 1], 5)
plt.plot(X_o[:, 0], X_o[:, 1], 'or')

plt.axis('tight')

# commonStyles comes from the star import of plotting.plots.
commonStyles(plt.gca())
plt.gcf().set_size_inches(10, 2.5)
plt.tight_layout(pad=0.0, w_pad=1.0, h_pad=3.0)
# Saving is intentionally disabled for this variant of the figure.
# plt.savefig('../thesis-distance-metric-learning/thesis/graphs/uncorrelated_data.pdf')
plt.show()

In [None]:
# Display the `precisions_cholesky_` attribute of the fitted mixture model
# `clf` (whichever cell fitted it last).
clf.precisions_cholesky_

In [None]:
# Display the `M_` attribute of the fitted Covariance transformer `tr`.
# NOTE(review): presumably the matrix learned in fit — confirm against the
# installed metric_learn version.
tr.M_

In [None]:
# Display the value returned by `tr.transformer()`.
# NOTE(review): presumably the linear map applied by `tr.transform`; this
# method may not exist in every metric_learn release — confirm.
tr.transformer()

In [None]:
from sklearn.decomposition import PCA

In [None]:
# Create a fresh whitening PCA without an explicit n_components.
# This rebinds `pca`, replacing the PCA(n_components=2, whiten=True) object
# created in the earlier plotting cell.
pca = PCA(whiten=True)

In [None]:
# Fit the PCA on X_train and display the transformed samples.
# NOTE: X_train is notebook state — it is the stretched cloud alone after the
# correlated-data cell, but the stacked two-cloud set after the Covariance
# cell, so the result depends on which of those ran last.
pca.fit_transform(X_train)

In [None]:
# Display the covariance matrix reported by the fitted PCA.
pca.get_covariance()

In [None]:
# Display the `components_` attribute of the fitted PCA.
pca.components_