In [339]:
%reload_ext autoreload
%autoreload 2
%matplotlib inline
from denn import *
import pandas as pd
import seaborn as sns
import io 

In [353]:
# Functions
nn_p = 3
nn_w = 7
nn_tw = 1
freqlimit = str(10)
labels_order = ['noNN_RI', 'NN_RI','noNN_HMu',  'NN_HMu', 'noNN_CwN', 'NN_CwN', 'noNN_No', 
                 'NN_No','noNN_Rst', 'NN_Rst']
path= Path(f'../../data/cluster_results')
col_by_freq = True
col_palette = 'Set3'

pat = re.compile('.*/(exp\d)/(\w*)/nonn/freq([0-9\.]+)div(\w+)/(\w+)_\w+.csv')
decode_keys = ['experiment','function','freq','div','method']

nn_pat = re.compile('.*/(exp\d)/(\w*)/nn/freq([0-9\.]+)nn_w(\d+)nn_p(\d+)\w+nn_tw(\d+)\w+div([A-Za-z]+)/(\w+)_(\w+)_\w+.csv')
nn_decode_keys = ['experiment','function','freq','nnw','nnp','nntw','div','method','replace_mech']#,

def get_files(m): return list(path.glob(f'**/nonn/**/*{m}.csv'))
def get_nn_files(m): return list(path.glob(f'**/nn/**/*{m}.csv'))

def read_csv(f,m):
    df = pd.read_csv(f)
    for k,v in zip(decode_keys,pat.search(str(f)).groups()): df[k] = v
    df['freq'] = df['freq'].astype(float)
    df['method'] = df['method'] + '_' + df['div']
#     df['method'] = df['method'].str.replace('noNNRestart', 'noNN_Rst')
    df['method'] = df['method'].str.replace('noNNRestart_No', 'noNN_Rst')
    df.drop('div', axis=1, inplace=True)
    df.rename({'0':m.upper(), m:m.upper()}, axis=1, inplace=True)
    return df

def read_nn_csv(f,m):
    df = pd.read_csv(f)
    for k,v in zip(nn_decode_keys,nn_pat.search(str(f)).groups()): df[k] = v
    df['freq'] = df['freq'].astype(float)
    df['method'] = df['method'] + '_' + df['replace_mech'] + '_' + df['div']
    df['method'] = df['method'].str.replace('NNnorm_Worst', 'NN')
    df['method'] = df['method'].str.replace('NNconv_Worst', 'NN')
    df.drop(['replace_mech','div'], axis=1, inplace=True)
    df.rename({'0':m.upper(), m:m.upper()}, axis=1, inplace=True)
    return df

def get_data(m, normalize=False):
    files = get_files(m)
    nn_files = get_nn_files(m)
#     data = pd.concat([read_csv(f,m) for f in files] + [read_nn_csv(f,m) for f in nn_files])
    nn_data = pd.concat([read_nn_csv(f,m) for f in nn_files])
    nn_data = nn_data[nn_data['nnw']==str(nn_w)]
    nn_data = nn_data[nn_data['nntw']==str(nn_tw)]
    nonn_data = pd.concat([read_csv(f,m) for f in files])
    data = pd.concat([nn_data , nonn_data])

    if normalize:
        data_norm = (data.groupby(['experiment','function','freq','method'])[m.upper()].mean().reset_index()
                         .groupby(['experiment','function'])[m.upper()].min().reset_index()
                         .rename({m.upper():m.upper()+'_norm'}, axis=1))
        data = data.merge(data_norm, 'left')
        data[m.upper()+'_norm'] = data[m.upper()] / data[m.upper()+'_norm']
    return data.reset_index(drop=True)
    return data

def plot_one(data, m, normalize=False, title='', title_size=14, col_by_freq=col_by_freq, col_palette=col_palette,
             legend=False, hide_x=True, hide_y=True, ax=None, do_lim=True, ll=0.2, ul=0.8):
    m = m.upper()
    if normalize: m = m + '_norm' 
    if ax is None: fig,ax = plt.subplots(1,1,figsize=(6,4))
    sns.boxplot('method' if col_by_freq else 'freq', m, hue='freq' if col_by_freq else 'method',
                data=data, palette=col_palette,
                # width=2.5,
                linewidth=0.5, fliersize=0, ax=ax)
    if not legend: ax.get_legend().remove()
    if do_lim:
        ax.set_ylim(-0.05,1.05)
    else:
        g = data.groupby(['method','freq'])[m]
        q1,q3 = g.quantile(ll),g.quantile(ul)
        iqr = q3-q1
        lower_lim = (q1 - 1.5*iqr).min()
        upper_lim = (q3 + 1.5*iqr).max()
        lower_lim = data[m][data[m]>=lower_lim].min()
        upper_lim = data[m][data[m]<=upper_lim].max()
        ax.set_ylim(lower_lim,upper_lim)
        
    ax.set_xlabel('')
    if hide_x: ax.set_xticklabels([])
    if hide_y: ax.set_ylabel('')
    ax.set_title(title, size=title_size)
    return ax

def plot_all_vertical(m, normalize=False, title_size=14, col_by_freq=col_by_freq, col_palette=col_palette, do_lim=True,
                      ll=0.2, ul=0.8):
    data = get_data(m, normalize=normalize)
#     fig,axss = plt.subplots(4, 3, figsize=(14,16), sharex=do_lim, sharey=do_lim)
    fig,axss = plt.subplots(4, 3, figsize=(26,18), sharex=False, sharey=False)
    for i,(axs,exp) in enumerate(zip(axss,['exp1','exp2','exp3','exp4'])):
        first_exp = i==0
        for j,(ax,func) in enumerate(zip(axs,['sphere', 'rosenbrock', 'rastrigin'])):
            first_func = j==0
            test = data.query(f'experiment=={exp!r} and function=={func!r}').sort_values('method', ascending=False)
            plot_one(test, m, normalize=normalize, title=f'{exp}-{func.title()}', title_size=title_size, hide_x=False,
                     hide_y=not first_func, col_by_freq=col_by_freq, col_palette=col_palette, ax=ax,
                     do_lim=do_lim, ll=ll, ul=ul)
        ax.legend(loc='upper left', ncol=3)
    plt.tight_layout()
    return fig,axss

def plot_all_horizontal(m, normalize=False, title_size=14, col_by_freq=col_by_freq, col_palette=col_palette, do_lim=True,
                        ll=0.2, ul=0.8):
    data = get_data(m, normalize=normalize)
#     fig,axss = plt.subplots(4, 3, figsize=(14,16), sharex=do_lim, sharey=do_lim)
    fig,axss = plt.subplots(3, 4, figsize=(28,20), sharex=False, sharey=False)#20,12
    for i,exp in enumerate(['exp1','exp2','exp3','exp4']):#
        first_exp = i==0
        axs = axss[:,i]
        for j,(ax,func) in enumerate(zip(axs,['sphere', 'rosenbrock', 'rastrigin'])):
            first_func = i==0
            test = data.query(f'experiment=={exp!r} and function=={func!r}').sort_values('method', ascending=False)
            plot_one(test, m, normalize=normalize, title=f'{exp}-{func.title()}', title_size=title_size, hide_x=False,
                     hide_y=not first_func, col_by_freq=col_by_freq, col_palette=col_palette, ax=ax,
                     do_lim=do_lim, ll=ll, ul=ul)
        
    for axs in axss: axs[-1].legend(loc='upper right', ncol=3)
    plt.tight_layout()
    return fig,axss

def get_heatmap_data(m):
    df = get_data(m)
    df = df[df.nnp.isna() | (df.nnp == str(nn_p))].drop('nnp', axis=1)
    df.function = df.function.str.title()
    m = m.upper()
    df_pivot = df.pivot_table(index=['experiment','function','freq'], columns=['method'], values=[m],
                              aggfunc='mean')[m]
    return df_pivot

# Plots

In [354]:
df_pivot = get_heatmap_data('mof')[labels_order]
df_pivot_rank = df_pivot.rank(axis=1)
df_pivot = df_pivot.reset_index()
df_pivot.experiment = df_pivot.experiment.str.slice(3)
df_pivot.set_index(['experiment','function','freq'], inplace=True)

Sorting because non-concatenation axis is not aligned. A future version
of pandas will change to not sort by default.

To accept the future behavior, pass 'sort=False'.




In [355]:
df_pivot_rank = df_pivot_rank.query(f'freq=={freqlimit}')
df_pivot = df_pivot.query(f'freq=={freqlimit}')

In [356]:
df_pivot.style.background_gradient(cmap=plt.cm.Greens, axis=1)

Unnamed: 0_level_0,Unnamed: 1_level_0,method,noNN_RI,NN_RI,noNN_HMu,NN_HMu,noNN_CwN,NN_CwN,noNN_No,NN_No,noNN_Rst,NN_Rst
experiment,function,freq,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
1,Rastrigin,10.0,1.36267,1.66026,1.99793,2.17304,7.0696,14.0461,22.4543,21.9945,3.2472,3.69305
1,Rosenbrock,10.0,594.454,634.086,972.517,666.106,27032.6,14162.0,86304.9,5392.92,1068.32,1469.1
1,Sphere,10.0,0.169582,0.173184,0.258767,0.200819,6.82405,3.60949,23.7185,1.55556,0.337735,0.431844
2,Rastrigin,10.0,0.956105,0.973346,1.00653,1.09218,5.72148,1.98657,1.65409,1.05765,4.51222,5.05207
2,Rosenbrock,10.0,12.4061,14.6251,26.0371,31.464,1077.3,188.907,36.5449,5.86362,287.251,258.821
2,Sphere,10.0,0.0144111,0.0192547,0.0280285,0.0374946,1.52633,0.348362,0.576106,0.00967665,0.221952,0.237264
3,Rastrigin,10.0,1.22379,1.56237,2.6453,3.35735,4.13532,11.2457,37.9458,36.2679,2.00259,2.50687
3,Rosenbrock,10.0,2.94422,2.81454,2.28984,2.81306,8263.33,110.512,2.79347,2.49466,2639.25,3155.8
3,Sphere,10.0,0.00380361,0.00421356,0.00309776,0.00788485,1.51218,0.247956,0.00378324,0.00506311,0.460162,0.605806
4,Rastrigin,10.0,6.75993,5.30777,6.16951,4.85455,33.472,60.3584,183.174,36.1045,4.5349,5.65502


In [357]:
df_pivot_rank.style.background_gradient(cmap=plt.cm.Greens, axis=1)

Unnamed: 0_level_0,Unnamed: 1_level_0,method,noNN_RI,NN_RI,noNN_HMu,NN_HMu,noNN_CwN,NN_CwN,noNN_No,NN_No,noNN_Rst,NN_Rst
experiment,function,freq,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
exp1,Rastrigin,10.0,1,2,3,4,7,8,10,9,5,6
exp1,Rosenbrock,10.0,1,2,4,3,9,8,10,7,5,6
exp1,Sphere,10.0,1,2,4,3,9,8,10,7,5,6
exp2,Rastrigin,10.0,1,2,3,5,10,7,6,4,8,9
exp2,Rosenbrock,10.0,2,3,4,5,10,7,6,1,9,8
exp2,Sphere,10.0,2,3,4,5,10,8,9,1,6,7
exp3,Rastrigin,10.0,1,2,5,6,7,8,10,9,3,4
exp3,Rosenbrock,10.0,6,5,1,4,10,7,3,2,8,9
exp3,Sphere,10.0,3,4,1,6,10,7,2,5,8,9
exp4,Rastrigin,10.0,6,3,5,2,7,9,10,8,1,4


In [358]:
summary = df_pivot.groupby(['experiment', 'function']).mean()
summary.round(2).style.background_gradient(cmap=plt.cm.Greens, axis=1)

Unnamed: 0_level_0,method,noNN_RI,NN_RI,noNN_HMu,NN_HMu,noNN_CwN,NN_CwN,noNN_No,NN_No,noNN_Rst,NN_Rst
experiment,function,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1
1,Rastrigin,1.36,1.66,2.0,2.17,7.07,14.05,22.45,21.99,3.25,3.69
1,Rosenbrock,594.45,634.09,972.52,666.11,27032.6,14162.0,86304.9,5392.92,1068.32,1469.1
1,Sphere,0.17,0.17,0.26,0.2,6.82,3.61,23.72,1.56,0.34,0.43
2,Rastrigin,0.96,0.97,1.01,1.09,5.72,1.99,1.65,1.06,4.51,5.05
2,Rosenbrock,12.41,14.63,26.04,31.46,1077.3,188.91,36.54,5.86,287.25,258.82
2,Sphere,0.01,0.02,0.03,0.04,1.53,0.35,0.58,0.01,0.22,0.24
3,Rastrigin,1.22,1.56,2.65,3.36,4.14,11.25,37.95,36.27,2.0,2.51
3,Rosenbrock,2.94,2.81,2.29,2.81,8263.33,110.51,2.79,2.49,2639.25,3155.8
3,Sphere,0.0,0.0,0.0,0.01,1.51,0.25,0.0,0.01,0.46,0.61
4,Rastrigin,6.76,5.31,6.17,4.85,33.47,60.36,183.17,36.1,4.53,5.66


In [359]:
out = summary.round(2).style
for i in range(len(labels_order)//2): 
    out = out.highlight_min(axis=1, subset=labels_order[i*2:(i+1)*2])

out

Unnamed: 0_level_0,method,noNN_RI,NN_RI,noNN_HMu,NN_HMu,noNN_CwN,NN_CwN,noNN_No,NN_No,noNN_Rst,NN_Rst
experiment,function,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1
1,Rastrigin,1.36,1.66,2.0,2.17,7.07,14.05,22.45,21.99,3.25,3.69
1,Rosenbrock,594.45,634.09,972.52,666.11,27032.6,14162.0,86304.9,5392.92,1068.32,1469.1
1,Sphere,0.17,0.17,0.26,0.2,6.82,3.61,23.72,1.56,0.34,0.43
2,Rastrigin,0.96,0.97,1.01,1.09,5.72,1.99,1.65,1.06,4.51,5.05
2,Rosenbrock,12.41,14.63,26.04,31.46,1077.3,188.91,36.54,5.86,287.25,258.82
2,Sphere,0.01,0.02,0.03,0.04,1.53,0.35,0.58,0.01,0.22,0.24
3,Rastrigin,1.22,1.56,2.65,3.36,4.14,11.25,37.95,36.27,2.0,2.51
3,Rosenbrock,2.94,2.81,2.29,2.81,8263.33,110.51,2.79,2.49,2639.25,3155.8
3,Sphere,0.0,0.0,0.0,0.01,1.51,0.25,0.0,0.01,0.46,0.61
4,Rastrigin,6.76,5.31,6.17,4.85,33.47,60.36,183.17,36.1,4.53,5.66


# Interactive

In [207]:
from ipywidgets import interact
def show_table(dm):
    out = summary[[f'noNN_{dm}', f'NN_{dm}']].round(2)
    return out.style.background_gradient(cmap=plt.cm.Blues_r, axis=1)
    
interact(show_table, dm=['RI', 'HMu','No','Rst'])

interactive(children=(Dropdown(description='dm', options=('RI', 'HMu', 'No', 'Rst'), value='RI'), Output()), _…

<function __main__.show_table(dm)>