In [420]:
%reload_ext autoreload
%autoreload 2
%matplotlib inline
from denn import *
import pandas as pd
import seaborn as sns
import io 

In [421]:
# Functions
# --- Selection of the NN configuration shown in the tables/plots -------------
# These are compared (as strings) against the values parsed out of the result
# file paths by `nn_pat`, see `get_data`.
nn_p = 5
nn_w = 5
nn_tw = 1
# Interpolated into a DataFrame.query expression to keep a single `freq` value.
freqlimit = str(30)
# Column order for the summary tables: each noNN_* method is immediately
# followed by its NN_* counterpart (the 'noNN_CwN'/'NN_CwN' pair is excluded).
labels_order = ['noNN_RI', 'NN_RI', 'noNN_HMu', 'NN_HMu', 'noNN_No',
                'NN_No', 'noNN_Rst', 'NN_Rst']
# Root directory that is searched recursively for result CSV files.
path = Path('../../data/cluster_results')
# Default plot styling picked up by the plot_* helpers.
col_by_freq = True
col_palette = 'Set3'

# Raw strings: the patterns contain \d, \w and \. which are not valid escape
# sequences in ordinary string literals. The pattern text itself is unchanged.
# Capture groups line up one-to-one with `decode_keys`.
pat = re.compile(r'.*/(exp\d)/(\w*)/nonn/freq([0-9\.]+)div(\w+)/(\w+)_\w+.csv')
decode_keys = ['experiment','function','freq','div','method']

# Same idea for NN runs; capture groups line up with `nn_decode_keys`.
nn_pat = re.compile(r'.*/(exp\d)/(\w*)/nn/freq([0-9\.]+)nn_w(\d+)nn_p(\d+)\w+nn_tw(\d+)\w+div([A-Za-z]+)/(\w+)_(\w+)_\w+.csv')
nn_decode_keys = ['experiment','function','freq','nnw','nnp','nntw','div','method','replace_mech']

def get_files(m):
    "Recursively collect, under `path`, every CSV below a `nonn` directory whose name ends with `m`."
    matches = path.glob(f'**/nonn/**/*{m}.csv')
    return [*matches]
def get_nn_files(m):
    "Recursively collect, under `path`, every CSV below an `nn` directory whose name ends with `m`."
    matches = path.glob(f'**/nn/**/*{m}.csv')
    return [*matches]

def read_csv(f,m):
    """Read one non-NN result CSV and annotate it with the metadata encoded in its path.

    `f` is matched against `pat`; each captured group becomes a constant column
    named after the corresponding entry of `decode_keys`. `freq` is converted to
    float, `method` gets the `div` value appended (`<method>_<div>`) and `div`
    is then dropped. The value column (named either '0' or `m` in the file) is
    renamed to `m.upper()`.
    """
    frame = pd.read_csv(f)
    path_fields = pat.search(str(f)).groups()
    for key, value in zip(decode_keys, path_fields):
        frame[key] = value
    frame['freq'] = frame['freq'].astype(float)
    # Build the combined label first, then shorten the restart baseline's name.
    combined = frame['method'] + '_' + frame['div']
    frame['method'] = combined.str.replace('noNNRestart_No', 'noNN_Rst')
    frame = frame.drop('div', axis=1)
    metric = m.upper()
    return frame.rename({'0':metric, m:metric}, axis=1)

def read_nn_csv(f,m):
    """Read one NN result CSV and annotate it with the metadata encoded in its path.

    `f` is matched against `nn_pat`; each captured group becomes a constant
    column named after the corresponding entry of `nn_decode_keys`. `freq` is
    converted to float and `method` becomes `<method>_<replace_mech>_<div>`,
    with the 'NNnorm_Worst' / 'NNconv_Worst' prefixes collapsed to 'NN'.
    `replace_mech` and `div` are dropped afterwards, and the value column
    (named either '0' or `m` in the file) is renamed to `m.upper()`.
    """
    frame = pd.read_csv(f)
    path_fields = nn_pat.search(str(f)).groups()
    for key, value in zip(nn_decode_keys, path_fields):
        frame[key] = value
    frame['freq'] = frame['freq'].astype(float)
    label = frame['method'] + '_' + frame['replace_mech'] + '_' + frame['div']
    # Same replacement order as before: norm variant first, then conv variant.
    for verbose_prefix in ('NNnorm_Worst', 'NNconv_Worst'):
        label = label.str.replace(verbose_prefix, 'NN')
    frame['method'] = label
    frame = frame.drop(['replace_mech','div'], axis=1)
    metric = m.upper()
    return frame.rename({'0':metric, m:metric}, axis=1)

def get_data(m, normalize=False):
    """Load all result CSVs for metric `m` into a single long DataFrame.

    NN runs are restricted to the configuration selected by the module-level
    `nn_w`, `nn_tw` and `nn_p`; non-NN runs are all kept. The two sets are
    stacked, so rows coming from non-NN files have no value in the NN-only
    columns (`nnw`, `nnp`, `nntw`).

    Parameters
    ----------
    m : str
        Metric name; used as the file-name suffix to look for and, upper-cased,
        as the name of the value column.
    normalize : bool
        When True, add a column `<M>_norm` holding the value divided by the
        smallest per-(freq, method) mean found for the same experiment and
        function.

    Returns
    -------
    pandas.DataFrame with a fresh 0..n-1 index.
    """
    metric = m.upper()
    files = get_files(m)
    nn_files = get_nn_files(m)

    nn_data = pd.concat([read_nn_csv(f,m) for f in nn_files])
    # The nn* columns come from regex groups, so they hold strings, not ints.
    selected = ((nn_data['nnw']==str(nn_w)) &
                (nn_data['nntw']==str(nn_tw)) &
                (nn_data['nnp']==str(nn_p)))
    nn_data = nn_data[selected]
    nonn_data = pd.concat([read_csv(f,m) for f in files])
    # The two frames do not share all columns; be explicit about not sorting
    # them instead of relying on the deprecated implicit sort (which warns).
    # Columns are only ever accessed by name downstream.
    data = pd.concat([nn_data, nonn_data], sort=False)

    if normalize:
        norm_col = metric + '_norm'
        # Best (lowest) mean over all (freq, method) groups, per experiment/function.
        data_norm = (data.groupby(['experiment','function','freq','method'])[metric].mean().reset_index()
                         .groupby(['experiment','function'])[metric].min().reset_index()
                         .rename({metric:norm_col}, axis=1))
        data = data.merge(data_norm, how='left', on=['experiment','function'])
        data[norm_col] = data[metric] / data[norm_col]
    return data.reset_index(drop=True)

def plot_one(data, m, normalize=False, title='', title_size=14, col_by_freq=col_by_freq, col_palette=col_palette,
             legend=False, hide_x=True, hide_y=True, ax=None, do_lim=True, ll=0.2, ul=0.8):
    """Draw one box plot of metric `m` grouped by method and frequency.

    Parameters
    ----------
    data : DataFrame with at least the columns 'method', 'freq' and the metric column.
    m : metric name; the plotted column is `m.upper()` (plus '_norm' if `normalize`).
    normalize : plot the '<M>_norm' column instead of '<M>'.
    title, title_size : axes title text and font size.
    col_by_freq : if True, methods go on the x axis and `freq` is the hue;
        otherwise `freq` goes on the x axis and methods are the hue.
    col_palette : palette passed to seaborn.
    legend : keep the legend seaborn creates (it is removed by default).
    hide_x, hide_y : blank the x tick labels / the y axis label.
    ax : axes to draw on; a new 6x4 figure is created when None.
    do_lim : if True the y axis is fixed to (-0.05, 1.05). Otherwise limits are
        derived from the data: per (method, freq) group the `ll` and `ul`
        quantiles are extended by 1.5x their distance, the most extreme of those
        bounds are taken, and each is snapped to the nearest actual data value
        lying inside it.
    ll, ul : lower / upper quantile used when `do_lim` is False.

    Returns
    -------
    The matplotlib axes that was drawn on.
    """
    m = m.upper()
    if normalize: m = m + '_norm'
    if ax is None: _,ax = plt.subplots(1,1,figsize=(6,4))
    x_col, hue_col = ('method', 'freq') if col_by_freq else ('freq', 'method')
    # x/y are passed by keyword: newer seaborn releases no longer accept them positionally.
    sns.boxplot(x=x_col, y=m, hue=hue_col,
                data=data, palette=col_palette,
                linewidth=0.5, fliersize=0, ax=ax)
    if not legend:
        # get_legend() returns None when no legend was drawn; nothing to remove then.
        existing_legend = ax.get_legend()
        if existing_legend is not None: existing_legend.remove()
    if do_lim:
        ax.set_ylim(-0.05,1.05)
    else:
        g = data.groupby(['method','freq'])[m]
        q1,q3 = g.quantile(ll),g.quantile(ul)
        iqr = q3-q1
        lower_lim = (q1 - 1.5*iqr).min()
        upper_lim = (q3 + 1.5*iqr).max()
        # Snap to real observations so the axis does not extend past the data.
        lower_lim = data[m][data[m]>=lower_lim].min()
        upper_lim = data[m][data[m]<=upper_lim].max()
        ax.set_ylim(lower_lim,upper_lim)

    ax.set_xlabel('')
    if hide_x: ax.set_xticklabels([])
    if hide_y: ax.set_ylabel('')
    ax.set_title(title, size=title_size)
    return ax

def plot_all_vertical(m, normalize=False, title_size=14, col_by_freq=col_by_freq, col_palette=col_palette, do_lim=True,
                      ll=0.2, ul=0.8):
    """Plot metric `m` on a 4x3 grid: one row per experiment, one column per function.

    Data is loaded through `get_data` and each panel is drawn by `plot_one`.
    Only the left-most column keeps its y label, and a legend is added to the
    last panel of every row. Returns `(fig, axss)`.
    """
    experiments = ['exp1','exp2','exp3','exp4']
    functions = ['sphere', 'rosenbrock', 'rastrigin']
    data = get_data(m, normalize=normalize)
    fig,axss = plt.subplots(4, 3, figsize=(26,18), sharex=False, sharey=False)
    for row_axes,exp in zip(axss, experiments):
        for col,func in enumerate(functions):
            panel = row_axes[col]
            subset = data.query(f'experiment=={exp!r} and function=={func!r}')
            subset = subset.sort_values('method', ascending=False)
            plot_one(subset, m, normalize=normalize, title=f'{exp}-{func.title()}', title_size=title_size,
                     hide_x=False, hide_y=col != 0, col_by_freq=col_by_freq, col_palette=col_palette,
                     ax=panel, do_lim=do_lim, ll=ll, ul=ul)
        # plot_one strips the legend; put one back on the right-most panel of this row.
        row_axes[len(functions)-1].legend(loc='upper left', ncol=3)
    plt.tight_layout()
    return fig,axss

def plot_all_horizontal(m, normalize=False, title_size=14, col_by_freq=col_by_freq, col_palette=col_palette, do_lim=True,
                        ll=0.2, ul=0.8):
    """Plot metric `m` on a 3x4 grid: one row per function, one column per experiment.

    Data is loaded through `get_data` and each panel is drawn by `plot_one`.
    Only the left-most column (first experiment) keeps its y label, and a
    legend is added to the last panel of every row. Returns `(fig, axss)`.
    """
    experiments = ['exp1','exp2','exp3','exp4']
    functions = ['sphere', 'rosenbrock', 'rastrigin']
    data = get_data(m, normalize=normalize)
    fig,axss = plt.subplots(3, 4, figsize=(28,20), sharex=False, sharey=False)
    for col,exp in enumerate(experiments):
        leftmost = col == 0
        for row,func in enumerate(functions):
            subset = data.query(f'experiment=={exp!r} and function=={func!r}')
            subset = subset.sort_values('method', ascending=False)
            plot_one(subset, m, normalize=normalize, title=f'{exp}-{func.title()}', title_size=title_size,
                     hide_x=False, hide_y=not leftmost, col_by_freq=col_by_freq, col_palette=col_palette,
                     ax=axss[row, col], do_lim=do_lim, ll=ll, ul=ul)

    # plot_one strips the legend; put one back on the right-most panel of each row.
    for legend_ax in axss[:, -1]:
        legend_ax.legend(loc='upper right', ncol=3)
    plt.tight_layout()
    return fig,axss

def get_heatmap_data(m):
    """Return the mean of metric `m` as a table of (experiment, function, freq) x method.

    Rows from `get_data` are kept when `nnp` is missing or equals the selected
    `nn_p`; function names are title-cased before pivoting.
    """
    metric = m.upper()
    raw = get_data(m)
    wanted = raw['nnp'].isna() | (raw['nnp'] == str(nn_p))
    table = raw[wanted].drop('nnp', axis=1)
    table['function'] = table['function'].str.title()
    pivoted = table.pivot_table(index=['experiment','function','freq'], columns=['method'],
                                values=[metric], aggfunc='mean')
    # Selecting the metric strips the outer column level left by values=[...].
    return pivoted[metric]

# Plots

In [422]:
# Mean 'mof' per (experiment, function, freq), columns in the paired noNN/NN order.
df_pivot = get_heatmap_data('mof')[labels_order]
# Rank the methods within each row (computed before the index is relabelled below).
df_pivot_rank = df_pivot.rank(axis=1)
# Drop the first three characters of the experiment label ('exp1' -> '1') and rebuild the index.
df_pivot = (df_pivot.reset_index()
                    .assign(experiment=lambda frame: frame['experiment'].str.slice(3))
                    .set_index(['experiment','function','freq']))

Sorting because non-concatenation axis is not aligned. A future version
of pandas will change to not sort by default.

To accept the future behavior, pass 'sort=False'.




In [423]:
# Keep only the rows whose `freq` equals `freqlimit` in both tables.
# `freqlimit` is a string and is interpolated into the query as a numeric literal.
df_pivot_rank = df_pivot_rank.query(f'freq=={freqlimit}')
df_pivot = df_pivot.query(f'freq=={freqlimit}')

In [424]:
# Display the mean values with a green gradient computed per row (axis=1).
df_pivot.style.background_gradient(cmap=plt.cm.Greens, axis=1)

Unnamed: 0_level_0,Unnamed: 1_level_0,method,noNN_RI,NN_RI,noNN_HMu,NN_HMu,noNN_No,NN_No,noNN_Rst,NN_Rst
experiment,function,freq,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1
1,Rastrigin,30.0,25.7925,20.1892,40.6723,29.9467,517.726,471.468,37.803,44.6836
1,Rosenbrock,30.0,5690.82,3603.36,16619.7,4647.47,1989250.0,4607.58,7314.17,9838.24
1,Sphere,30.0,1.3464,1.06683,3.65941,1.29549,546.63,1.19391,2.30997,2.89661
2,Rastrigin,30.0,20.7059,20.5654,20.5718,21.3377,34.4265,20.9023,49.8757,60.6789
2,Rosenbrock,30.0,86.4507,104.033,268.0,298.808,1191.83,30.3643,2147.87,1753.48
2,Sphere,30.0,0.108428,0.131869,0.279029,0.350543,5.8504,0.0602415,1.63383,1.57362
3,Rastrigin,30.0,28.8391,37.8908,66.5058,82.1328,955.832,901.98,16.4998,21.6867
3,Rosenbrock,30.0,18.2729,13.3656,26.7793,14.0573,19.6344,14.0766,20548.5,24408.6
3,Sphere,30.0,1.397,0.0231923,5.97691,0.116422,885.513,0.0385511,3.42827,4.74939
4,Rastrigin,30.0,148.405,55.0923,111.795,55.4085,4083.47,327.976,41.4062,53.5629


In [425]:
# Display the per-row method ranks with a green gradient computed per row (axis=1).
df_pivot_rank.style.background_gradient(cmap=plt.cm.Greens, axis=1)

Unnamed: 0_level_0,Unnamed: 1_level_0,method,noNN_RI,NN_RI,noNN_HMu,NN_HMu,noNN_No,NN_No,noNN_Rst,NN_Rst
experiment,function,freq,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1
exp1,Rastrigin,30.0,2,1,5,3,8,7,4,6
exp1,Rosenbrock,30.0,4,1,7,3,8,2,5,6
exp1,Sphere,30.0,4,1,7,3,8,2,5,6
exp2,Rastrigin,30.0,3,1,2,5,6,4,7,8
exp2,Rosenbrock,30.0,2,3,4,5,6,1,8,7
exp2,Sphere,30.0,2,3,4,5,8,1,7,6
exp3,Rastrigin,30.0,3,4,5,6,8,7,1,2
exp3,Rosenbrock,30.0,4,1,6,2,5,3,7,8
exp3,Sphere,30.0,4,1,7,3,8,2,5,6
exp4,Rastrigin,30.0,6,3,5,4,8,7,1,2


In [426]:
# Average over the `freq` index level so rows are keyed by (experiment, function) only.
summary = df_pivot.groupby(['experiment', 'function']).mean()
# Show the summary rounded to two decimals with a per-row green gradient.
summary.round(2).style.background_gradient(cmap=plt.cm.Greens, axis=1)

Unnamed: 0_level_0,method,noNN_RI,NN_RI,noNN_HMu,NN_HMu,noNN_No,NN_No,noNN_Rst,NN_Rst
experiment,function,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
1,Rastrigin,25.79,20.19,40.67,29.95,517.73,471.47,37.8,44.68
1,Rosenbrock,5690.82,3603.36,16619.7,4647.47,1989250.0,4607.58,7314.17,9838.24
1,Sphere,1.35,1.07,3.66,1.3,546.63,1.19,2.31,2.9
2,Rastrigin,20.71,20.57,20.57,21.34,34.43,20.9,49.88,60.68
2,Rosenbrock,86.45,104.03,268.0,298.81,1191.83,30.36,2147.87,1753.48
2,Sphere,0.11,0.13,0.28,0.35,5.85,0.06,1.63,1.57
3,Rastrigin,28.84,37.89,66.51,82.13,955.83,901.98,16.5,21.69
3,Rosenbrock,18.27,13.37,26.78,14.06,19.63,14.08,20548.5,24408.6
3,Sphere,1.4,0.02,5.98,0.12,885.51,0.04,3.43,4.75
4,Rastrigin,148.4,55.09,111.79,55.41,4083.47,327.98,41.41,53.56


In [427]:
# Highlight, within every row, the smaller value of each adjacent (noNN_*, NN_*) column pair.
out = summary.round(2).style
for no_nn_col, nn_col in zip(labels_order[0::2], labels_order[1::2]):
    out = out.highlight_min(axis=1, subset=[no_nn_col, nn_col])

out

Unnamed: 0_level_0,method,noNN_RI,NN_RI,noNN_HMu,NN_HMu,noNN_No,NN_No,noNN_Rst,NN_Rst
experiment,function,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
1,Rastrigin,25.79,20.19,40.67,29.95,517.73,471.47,37.8,44.68
1,Rosenbrock,5690.82,3603.36,16619.7,4647.47,1989250.0,4607.58,7314.17,9838.24
1,Sphere,1.35,1.07,3.66,1.3,546.63,1.19,2.31,2.9
2,Rastrigin,20.71,20.57,20.57,21.34,34.43,20.9,49.88,60.68
2,Rosenbrock,86.45,104.03,268.0,298.81,1191.83,30.36,2147.87,1753.48
2,Sphere,0.11,0.13,0.28,0.35,5.85,0.06,1.63,1.57
3,Rastrigin,28.84,37.89,66.51,82.13,955.83,901.98,16.5,21.69
3,Rosenbrock,18.27,13.37,26.78,14.06,19.63,14.08,20548.5,24408.6
3,Sphere,1.4,0.02,5.98,0.12,885.51,0.04,3.43,4.75
4,Rastrigin,148.4,55.09,111.79,55.41,4083.47,327.98,41.41,53.56


# Interactive

In [403]:
from ipywidgets import interact
def show_table(dm):
    "Styled view of the `noNN_<dm>` / `NN_<dm>` columns of `summary`, rounded to 2 decimals, with a per-row reversed-Blues gradient."
    pair = [f'noNN_{dm}', f'NN_{dm}']
    rounded = summary[pair].round(2)
    styled = rounded.style.background_gradient(cmap=plt.cm.Blues_r, axis=1)
    return styled
    
# Dropdown over the method-name suffixes; the chosen value is passed to show_table as `dm`.
interact(show_table, dm=['RI', 'HMu','No','Rst'])

interactive(children=(Dropdown(description='dm', options=('RI', 'HMu', 'No', 'Rst'), value='RI'), Output()), _…

<function __main__.show_table(dm)>