In [428]:
%reload_ext autoreload
%autoreload 2
%matplotlib inline
from denn import *
import pandas as pd
import seaborn as sns
import io 

In [460]:
# Functions
# Neural-network settings; get_data() keeps only the NN runs whose directory
# name carries exactly these values.
nn_w, nn_p, nn_tw = 10, 5, 1

# Frequency retained by the heat-map cells. Kept as text because it is spliced
# into a DataFrame.query() expression.
freqlimit = '20'

# Method columns listed pair-wise (with / without NN for the same mechanism);
# the highlighting cell walks this list two entries at a time.
labels_order = [
    'noNN_RI',  'NN_RI',
    'NN_HMu',   'noNN_HMu',
    'noNN_No',  'NN_No',
    'noNN_Rst', 'NN_Rst',
    # 'noNN_CwN', 'NN_CwN',
]

# Root directory that the glob helpers search for result CSV files.
path = Path(f'../../data/cluster_results')

# Plot defaults: colour palette name, and whether boxes are coloured by
# frequency (True) or by method (False).
col_palette = 'Set3'
col_by_freq = True

# Both patterns are raw strings so that `\d`, `\w` and `\.` reach the regex
# engine untouched instead of being parsed as (invalid) string escapes.

# Baseline (no NN) result file:
#   .../<experiment>/<function>/nonn/freq<freq>div<div>/<method>_<suffix>.csv
pat = re.compile(r'.*/(exp\d)/(\w*)/nonn/freq([0-9\.]+)div(\w+)/(\w+)_\w+.csv')
# Column names for the capture groups of `pat`, in order.
decode_keys = ['experiment','function','freq','div','method']

# NN result file; the directory name additionally carries nn_w / nn_p / nn_tw
# and the file name carries the replacement mechanism:
#   .../<experiment>/<function>/nn/freq<freq>nn_w<w>nn_p<p>...nn_tw<tw>...div<div>/<method>_<replace_mech>_<suffix>.csv
nn_pat = re.compile(r'.*/(exp\d)/(\w*)/nn/freq([0-9\.]+)nn_w(\d+)nn_p(\d+)\w+nn_tw(\d+)\w+div([A-Za-z]+)/(\w+)_(\w+)_\w+.csv')
# Column names for the capture groups of `nn_pat`, in order.
nn_decode_keys = ['experiment','function','freq','nnw','nnp','nntw','div','method','replace_mech']

def get_files(m):
    """Return every CSV below a `nonn` directory of `path` whose name ends in `m`."""
    matches = path.glob(f'**/nonn/**/*{m}.csv')
    return list(matches)
def get_nn_files(m):
    """Return every CSV below an `nn` directory of `path` whose name ends in `m`."""
    matches = path.glob(f'**/nn/**/*{m}.csv')
    return list(matches)

def read_csv(f,m):
    """Load one baseline result file and tag it with the settings encoded in its path.

    f: path of the CSV; it must match `pat`.
    m: metric name; the data column (named '0' or `m`) is renamed to `m.upper()`.

    Returns a DataFrame with the extra columns `experiment`, `function`,
    `freq` (float) and `method` (original method joined to the div name by '_').
    """
    table = pd.read_csv(f)
    fields = pat.search(str(f)).groups()
    for name,value in zip(decode_keys, fields):
        table[name] = value
    table['freq'] = table['freq'].astype(float)
    # `div` is folded into the method label and then discarded.
    table['method'] = table['method'] + '_' + table['div']
    table = table.drop(columns='div')
    metric = m.upper()
    return table.rename(columns={'0':metric, m:metric})

def read_nn_csv(f,m):
    """Load one NN result file and tag it with the settings encoded in its path.

    f: path of the CSV; it must match `nn_pat`.
    m: metric name; the data column (named '0' or `m`) is renamed to `m.upper()`.

    Returns a DataFrame with the extra columns `experiment`, `function`,
    `freq` (float), `nnw`, `nnp`, `nntw` (all text) and `method`.
    """
    table = pd.read_csv(f)
    fields = nn_pat.search(str(f)).groups()
    for name,value in zip(nn_decode_keys, fields):
        table[name] = value
    table['freq'] = table['freq'].astype(float)

    # Full label is <method>_<replace_mech>_<div>; the two "Worst" variants are
    # then shortened to plain 'NN' / 'NNconv'.
    label = table['method'] + '_' + table['replace_mech'] + '_' + table['div']
    for long_name,short_name in (('NNnorm_Worst', 'NN'), ('NNconv_Worst', 'NNconv')):
        label = label.str.replace(long_name, short_name)
    table['method'] = label

    table = table.drop(columns=['replace_mech','div'])
    metric = m.upper()
    return table.rename(columns={'0':metric, m:metric})

def get_data(m, normalize=False):
    """Collect the NN and baseline results for metric `m` into one DataFrame.

    m: metric name; selects the files to read and names the value column `m.upper()`.
    normalize: when True, add a `<M>_norm` column equal to the metric divided by
        the smallest per-(freq, method) mean within the same (experiment, function).

    NN rows are restricted to the runs whose `nnw`, `nntw` and `nnp` match the
    notebook-level `nn_w`, `nn_tw` and `nn_p`. Returns a frame with a fresh
    0..n-1 index; baseline rows have NaN in the NN-only columns.
    """
    metric = m.upper()

    nn_data = pd.concat([read_nn_csv(f,m) for f in get_nn_files(m)])
    # The hyper-parameters were parsed from the path as text, so compare as text.
    selected = ((nn_data['nnw'] == str(nn_w)) &
                (nn_data['nntw'] == str(nn_tw)) &
                (nn_data['nnp'] == str(nn_p)))
    nn_data = nn_data[selected]

    nonn_data = pd.concat([read_csv(f,m) for f in get_files(m)])
    # The two frames have different columns; state `sort` explicitly so the
    # result does not depend on the pandas default (and no warning is emitted).
    data = pd.concat([nn_data, nonn_data], sort=False)

    if normalize:
        norm_col = metric + '_norm'
        # Smallest mean metric per (experiment, function) across all (freq, method).
        data_norm = (data.groupby(['experiment','function','freq','method'])[metric].mean().reset_index()
                         .groupby(['experiment','function'])[metric].min().reset_index()
                         .rename({metric:norm_col}, axis=1))
        data = data.merge(data_norm, how='left')
        data[norm_col] = data[metric] / data[norm_col]
    return data.reset_index(drop=True)

def plot_one(data, m, normalize=False, title='', title_size=14, col_by_freq=col_by_freq, col_palette=col_palette,
             legend=False, hide_x=True, hide_y=True, ax=None, do_lim=True, ll=0.2, ul=0.8):
    """Draw one box plot of a metric grouped by method and frequency.

    data: DataFrame holding `method`, `freq` and the metric column.
    m: metric name; upper-cased, and suffixed with '_norm' when `normalize` is True.
    title, title_size: axes title and its font size.
    col_by_freq: True puts `method` on x with `freq` as hue; False swaps them.
    col_palette: palette forwarded to seaborn.
    legend: keep the legend seaborn creates (removed otherwise).
    hide_x: blank the x tick labels.  hide_y: clear the y axis label.
    ax: axes to draw on; a new 6x4 figure is created when None.
    do_lim: True fixes the y range to (-0.05, 1.05); False derives it from the
        `ll` / `ul` quantiles of every (method, freq) group.

    Returns the axes that was drawn on.
    """
    m = m.upper()
    if normalize: m = m + '_norm'
    if ax is None: _,ax = plt.subplots(1,1,figsize=(6,4))

    x_col,hue_col = ('method','freq') if col_by_freq else ('freq','method')
    # x / y are passed by keyword: seaborn >= 0.12 no longer accepts them positionally.
    sns.boxplot(x=x_col, y=m, hue=hue_col,
                data=data, palette=col_palette,
                linewidth=0.5, fliersize=0, ax=ax)

    if not legend:
        # No legend object exists when nothing was drawn; only remove a real one.
        current_legend = ax.get_legend()
        if current_legend is not None: current_legend.remove()

    if do_lim:
        ax.set_ylim(-0.05,1.05)
    else:
        # Whisker-style bounds per (method, freq) group, widest over all groups ...
        g = data.groupby(['method','freq'])[m]
        q1,q3 = g.quantile(ll),g.quantile(ul)
        iqr = q3-q1
        lower_lim = (q1 - 1.5*iqr).min()
        upper_lim = (q3 + 1.5*iqr).max()
        # ... then snapped to the most extreme observations inside those bounds.
        lower_lim = data[m][data[m]>=lower_lim].min()
        upper_lim = data[m][data[m]<=upper_lim].max()
        ax.set_ylim(lower_lim,upper_lim)

    ax.set_xlabel('')
    if hide_x: ax.set_xticklabels([])
    if hide_y: ax.set_ylabel('')
    ax.set_title(title, size=title_size)
    return ax

def plot_all_vertical(m, normalize=False, title_size=14, col_by_freq=col_by_freq, col_palette=col_palette, do_lim=True,
                      ll=0.2, ul=0.8):
    """Plot metric `m` on a 4x3 grid: one row per experiment, one column per function.

    The remaining arguments are forwarded to `get_data` / `plot_one`. The y label
    is shown only in the first column and a legend is added to the last panel of
    every row. Returns `(fig, axss)`.
    """
    experiments = ['exp1','exp2','exp3','exp4']
    functions = ['sphere', 'rosenbrock', 'rastrigin']

    data = get_data(m, normalize=normalize)
    fig,axss = plt.subplots(4, 3, figsize=(26,18), sharex=False, sharey=False)
    for row_axes,exp in zip(axss, experiments):
        for col,(ax,func) in enumerate(zip(row_axes, functions)):
            subset = data.query(f'experiment=={exp!r} and function=={func!r}').sort_values('method', ascending=False)
            plot_one(subset, m, normalize=normalize, title=f'{exp}-{func.title()}', title_size=title_size,
                     hide_x=False, hide_y=col != 0, col_by_freq=col_by_freq, col_palette=col_palette,
                     ax=ax, do_lim=do_lim, ll=ll, ul=ul)
        # plot_one strips the legend; restore it on the right-most panel of the row.
        row_axes[-1].legend(loc='upper left', ncol=3)
    plt.tight_layout()
    return fig,axss

def plot_all_horizontal(m, normalize=False, title_size=14, col_by_freq=col_by_freq, col_palette=col_palette, do_lim=True,
                        ll=0.2, ul=0.8):
    """Plot metric `m` on a 3x4 grid: one column per experiment, one row per function.

    The remaining arguments are forwarded to `get_data` / `plot_one`. The y label
    is shown only in the first column and a legend is added to the last panel of
    every row. Returns `(fig, axss)`.
    """
    experiments = ['exp1','exp2','exp3','exp4']
    functions = ['sphere', 'rosenbrock', 'rastrigin']

    data = get_data(m, normalize=normalize)
    fig,axss = plt.subplots(3, 4, figsize=(28,20), sharex=False, sharey=False)
    for col,exp in enumerate(experiments):
        column_axes = axss[:,col]
        for ax,func in zip(column_axes, functions):
            subset = data.query(f'experiment=={exp!r} and function=={func!r}').sort_values('method', ascending=False)
            plot_one(subset, m, normalize=normalize, title=f'{exp}-{func.title()}', title_size=title_size,
                     hide_x=False, hide_y=col != 0, col_by_freq=col_by_freq, col_palette=col_palette,
                     ax=ax, do_lim=do_lim, ll=ll, ul=ul)

    # plot_one strips the legend; restore it on the right-most panel of each row.
    for row_axes in axss:
        row_axes[-1].legend(loc='upper right', ncol=3)
    plt.tight_layout()
    return fig,axss

def get_heatmap_data(m):
    """Return the mean of metric `m` as a table: (experiment, function, freq) rows x method columns.

    Rows of `get_data(m)` are kept when `nnp` is missing or equals the
    notebook-level `nn_p`; function names are title-cased.
    """
    records = get_data(m)
    keep = records['nnp'].isna() | (records['nnp'] == str(nn_p))
    records = records[keep].drop(columns='nnp')
    records['function'] = records['function'].str.title()

    metric = m.upper()
    pivoted = records.pivot_table(index=['experiment','function','freq'], columns=['method'],
                                  values=[metric], aggfunc='mean')
    # `values` was given as a list, so select the metric level to leave plain method columns.
    return pivoted[metric]

# Plots

In [463]:
# Mean MOF per (experiment, function, freq) row and method column.
df_pivot = get_heatmap_data('mof')  # optionally reorder with [labels_order]
# Rank the methods within every row (1 = smallest mean). Taken before the
# experiment labels are shortened, so the rank table keeps the full 'expN' names.
df_pivot_rank = df_pivot.rank(axis=1)
# Drop the leading 'exp' from the experiment label, leaving just the number.
df_pivot = (df_pivot.reset_index()
                    .assign(experiment=lambda frame: frame['experiment'].str.slice(3))
                    .set_index(['experiment','function','freq']))

Sorting because non-concatenation axis is not aligned. A future version
of pandas will change to not sort by default.

To accept the future behavior, pass 'sort=False'.




In [464]:
# Keep only the rows recorded at the configured frequency, in both tables.
df_pivot, df_pivot_rank = (frame.query(f'freq=={freqlimit}') for frame in (df_pivot, df_pivot_rank))

In [465]:
# Mean metric per method; the green gradient is computed row by row (axis=1),
# so shades compare methods within one (experiment, function, freq) row only.
df_pivot.style.background_gradient(cmap=plt.cm.Greens, axis=1)

Unnamed: 0_level_0,Unnamed: 1_level_0,method,NNconv_No,NNconv_RI,NNconv_Rst,noNN_CwN,noNN_HMu,noNN_No,noNN_RI,noNN_Rst
experiment,function,freq,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1
1,Rastrigin,20.0,515.001,26.6529,71.3298,6.49431,39.2888,517.692,23.8551,48.6123
1,Rosenbrock,20.0,43872.6,7880.25,,25614.7,17560.2,1987840.0,6180.61,10916.7
1,Sphere,20.0,12.7609,2.52113,,6.41115,3.46929,546.126,1.8265,3.40912
2,Rastrigin,20.0,,19.7362,94.3913,4.93966,20.6919,34.3769,20.7103,65.8285
2,Rosenbrock,20.0,,226.511,4280.11,751.105,357.601,3056.13,126.966,3038.6
2,Sphere,20.0,,0.2604,4.10686,1.25172,0.378244,5.95756,0.155349,2.4357
3,Rastrigin,20.0,913.692,60.8569,,3.13306,67.0527,949.653,28.0775,22.3127
3,Rosenbrock,20.0,15.2556,14.3963,55528.5,4843.49,31.8245,22.6134,20.2742,30126.8
3,Sphere,20.0,,0.0325425,9.93442,1.08808,6.0526,899.161,1.32079,5.05208
4,Rastrigin,20.0,,150.519,,24.0983,92.8285,3948.05,124.467,57.4356


In [466]:
# Per-row rank of every method, shaded row by row (axis=1).
df_pivot_rank.style.background_gradient(cmap=plt.cm.Greens, axis=1)

Unnamed: 0_level_0,Unnamed: 1_level_0,method,NNconv_No,NNconv_RI,NNconv_Rst,noNN_CwN,noNN_HMu,noNN_No,noNN_RI,noNN_Rst
experiment,function,freq,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1
exp1,Rastrigin,20.0,7.0,3,6.0,1,4,8,2,5
exp1,Rosenbrock,20.0,6.0,2,,5,4,7,1,3
exp1,Sphere,20.0,6.0,2,,5,4,7,1,3
exp2,Rastrigin,20.0,,2,7.0,1,3,5,4,6
exp2,Rosenbrock,20.0,,2,7.0,4,3,6,1,5
exp2,Sphere,20.0,,2,6.0,4,3,7,1,5
exp3,Rastrigin,20.0,6.0,4,,1,5,7,3,2
exp3,Rosenbrock,20.0,2.0,1,8.0,6,5,4,3,7
exp3,Sphere,20.0,,1,6.0,2,5,7,3,4
exp4,Rastrigin,20.0,,5,,1,3,6,4,2


In [467]:
# Average every method column per (experiment, function); grouping on these two
# index levels drops the `freq` level from the result.
summary = df_pivot.groupby(['experiment', 'function']).mean()
# Show the summary rounded to two decimals, shaded row by row (axis=1).
summary.round(2).style.background_gradient(cmap=plt.cm.Greens, axis=1)

Unnamed: 0_level_0,method,NNconv_No,NNconv_RI,NNconv_Rst,noNN_CwN,noNN_HMu,noNN_No,noNN_RI,noNN_Rst
experiment,function,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
1,Rastrigin,515.0,26.65,71.33,6.49,39.29,517.69,23.86,48.61
1,Rosenbrock,43872.6,7880.25,,25614.7,17560.2,1987840.0,6180.61,10916.7
1,Sphere,12.76,2.52,,6.41,3.47,546.13,1.83,3.41
2,Rastrigin,,19.74,94.39,4.94,20.69,34.38,20.71,65.83
2,Rosenbrock,,226.51,4280.11,751.11,357.6,3056.13,126.97,3038.6
2,Sphere,,0.26,4.11,1.25,0.38,5.96,0.16,2.44
3,Rastrigin,913.69,60.86,,3.13,67.05,949.65,28.08,22.31
3,Rosenbrock,15.26,14.4,55528.5,4843.49,31.82,22.61,20.27,30126.8
3,Sphere,,0.03,9.93,1.09,6.05,899.16,1.32,5.05
4,Rastrigin,,150.52,,24.1,92.83,3948.05,124.47,57.44


In [468]:
# For every consecutive pair of labels in `labels_order`, highlight the smaller
# of the two values in each row of the rounded summary.
out = summary.round(2).style
for i in range(len(labels_order)//2):
    pair = labels_order[i*2:(i+1)*2]
    # A label missing from `summary` would make the Styler raise KeyError when
    # rendered, so a pair is compared only when both of its columns exist.
    if all(label in summary.columns for label in pair):
        out = out.highlight_min(axis=1, subset=pair)

out

Unnamed: 0_level_0,method,NNconv_No,NNconv_RI,NNconv_Rst,noNN_CwN,noNN_HMu,noNN_No,noNN_RI,noNN_Rst
experiment,function,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
1,Rastrigin,515.0,26.65,71.33,6.49,39.29,517.69,23.86,48.61
1,Rosenbrock,43872.6,7880.25,,25614.7,17560.2,1987840.0,6180.61,10916.7
1,Sphere,12.76,2.52,,6.41,3.47,546.13,1.83,3.41
2,Rastrigin,,19.74,94.39,4.94,20.69,34.38,20.71,65.83
2,Rosenbrock,,226.51,4280.11,751.11,357.6,3056.13,126.97,3038.6
2,Sphere,,0.26,4.11,1.25,0.38,5.96,0.16,2.44
3,Rastrigin,913.69,60.86,,3.13,67.05,949.65,28.08,22.31
3,Rosenbrock,15.26,14.4,55528.5,4843.49,31.82,22.61,20.27,30126.8
3,Sphere,,0.03,9.93,1.09,6.05,899.16,1.32,5.05
4,Rastrigin,,150.52,,24.1,92.83,3948.05,124.47,57.44


# Interactive

In [469]:
from ipywidgets import interact
def show_table(dm):
    """Return a styled two-column view of `summary` for one mechanism `dm`.

    dm: mechanism suffix; the columns looked up are `noNN_<dm>` and `NN_<dm>`.

    Only the requested columns that exist in `summary` are shown, so the widget
    still renders when one variant has no data. Raises KeyError when neither
    column exists. The reversed Blues gradient is computed row by row (axis=1).
    """
    wanted = [f'noNN_{dm}', f'NN_{dm}']
    present = [col for col in wanted if col in summary.columns]
    if not present:
        raise KeyError(f'none of {wanted} found in summary columns {list(summary.columns)}')
    out = summary[present].round(2)
    return out.style.background_gradient(cmap=plt.cm.Blues_r, axis=1)
    
# Build a dropdown over the listed mechanism suffixes; each selection calls
# show_table(dm) and displays the styled table it returns.
interact(show_table, dm=['RI', 'HMu','No','Rst'])

interactive(children=(Dropdown(description='dm', options=('RI', 'HMu', 'No', 'Rst'), value='RI'), Output()), _…

<function __main__.show_table(dm)>