In [412]:
%reload_ext autoreload
%autoreload 2
%matplotlib inline
from denn import *
import pandas as pd
import seaborn as sns
import io 

In [413]:
# Functions
nn_p = 5
nn_w = 5
nn_tw = 1
freqlimit = str(10)
labels_order = ['noNN_RI', 'NN_RI','noNN_HMu',  'NN_HMu', 'noNN_No', 
                 'NN_No','noNN_Rst', 'NN_Rst']#'noNN_CwN', 'NN_CwN',
path= Path(f'../../data/cluster_results')
col_by_freq = True
col_palette = 'Set3'

pat = re.compile('.*/(exp\d)/(\w*)/nonn/freq([0-9\.]+)div(\w+)/(\w+)_\w+.csv')
decode_keys = ['experiment','function','freq','div','method']

nn_pat = re.compile('.*/(exp\d)/(\w*)/nn/freq([0-9\.]+)nn_w(\d+)nn_p(\d+)\w+nn_tw(\d+)\w+div([A-Za-z]+)/(\w+)_(\w+)_\w+.csv')
nn_decode_keys = ['experiment','function','freq','nnw','nnp','nntw','div','method','replace_mech']#,

def get_files(m): return list(path.glob(f'**/nonn/**/*{m}.csv'))
def get_nn_files(m): return list(path.glob(f'**/nn/**/*{m}.csv'))

def read_csv(f,m):
    df = pd.read_csv(f)
    for k,v in zip(decode_keys,pat.search(str(f)).groups()): df[k] = v
    df['freq'] = df['freq'].astype(float)
    df['method'] = df['method'] + '_' + df['div']
#     df['method'] = df['method'].str.replace('noNNRestart', 'noNN_Rst')
    df['method'] = df['method'].str.replace('noNNRestart_No', 'noNN_Rst')
    df.drop('div', axis=1, inplace=True)
    df.rename({'0':m.upper(), m:m.upper()}, axis=1, inplace=True)
    return df

def read_nn_csv(f,m):
    df = pd.read_csv(f)
    for k,v in zip(nn_decode_keys,nn_pat.search(str(f)).groups()): df[k] = v
    df['freq'] = df['freq'].astype(float)
    df['method'] = df['method'] + '_' + df['replace_mech'] + '_' + df['div']
    df['method'] = df['method'].str.replace('NNnorm_Worst', 'NN')
    df['method'] = df['method'].str.replace('NNconv_Worst', 'NN')
    df.drop(['replace_mech','div'], axis=1, inplace=True)
    df.rename({'0':m.upper(), m:m.upper()}, axis=1, inplace=True)
    return df

def get_data(m, normalize=False):
    files = get_files(m)
    nn_files = get_nn_files(m)
#     data = pd.concat([read_csv(f,m) for f in files] + [read_nn_csv(f,m) for f in nn_files])
    nn_data = pd.concat([read_nn_csv(f,m) for f in nn_files])
    nn_data = nn_data[nn_data['nnw']==str(nn_w)]
    nn_data = nn_data[nn_data['nntw']==str(nn_tw)]
    nn_data = nn_data[nn_data['nnp']==str(nn_p)]
    nonn_data = pd.concat([read_csv(f,m) for f in files])
    data = pd.concat([nn_data , nonn_data])

    if normalize:
        data_norm = (data.groupby(['experiment','function','freq','method'])[m.upper()].mean().reset_index()
                         .groupby(['experiment','function'])[m.upper()].min().reset_index()
                         .rename({m.upper():m.upper()+'_norm'}, axis=1))
        data = data.merge(data_norm, 'left')
        data[m.upper()+'_norm'] = data[m.upper()] / data[m.upper()+'_norm']
    return data.reset_index(drop=True)
    return data

def plot_one(data, m, normalize=False, title='', title_size=14, col_by_freq=col_by_freq, col_palette=col_palette,
             legend=False, hide_x=True, hide_y=True, ax=None, do_lim=True, ll=0.2, ul=0.8):
    m = m.upper()
    if normalize: m = m + '_norm' 
    if ax is None: fig,ax = plt.subplots(1,1,figsize=(6,4))
    sns.boxplot('method' if col_by_freq else 'freq', m, hue='freq' if col_by_freq else 'method',
                data=data, palette=col_palette,
                # width=2.5,
                linewidth=0.5, fliersize=0, ax=ax)
    if not legend: ax.get_legend().remove()
    if do_lim:
        ax.set_ylim(-0.05,1.05)
    else:
        g = data.groupby(['method','freq'])[m]
        q1,q3 = g.quantile(ll),g.quantile(ul)
        iqr = q3-q1
        lower_lim = (q1 - 1.5*iqr).min()
        upper_lim = (q3 + 1.5*iqr).max()
        lower_lim = data[m][data[m]>=lower_lim].min()
        upper_lim = data[m][data[m]<=upper_lim].max()
        ax.set_ylim(lower_lim,upper_lim)
        
    ax.set_xlabel('')
    if hide_x: ax.set_xticklabels([])
    if hide_y: ax.set_ylabel('')
    ax.set_title(title, size=title_size)
    return ax

def plot_all_vertical(m, normalize=False, title_size=14, col_by_freq=col_by_freq, col_palette=col_palette, do_lim=True,
                      ll=0.2, ul=0.8):
    data = get_data(m, normalize=normalize)
#     fig,axss = plt.subplots(4, 3, figsize=(14,16), sharex=do_lim, sharey=do_lim)
    fig,axss = plt.subplots(4, 3, figsize=(26,18), sharex=False, sharey=False)
    for i,(axs,exp) in enumerate(zip(axss,['exp1','exp2','exp3','exp4'])):
        first_exp = i==0
        for j,(ax,func) in enumerate(zip(axs,['sphere', 'rosenbrock', 'rastrigin'])):
            first_func = j==0
            test = data.query(f'experiment=={exp!r} and function=={func!r}').sort_values('method', ascending=False)
            plot_one(test, m, normalize=normalize, title=f'{exp}-{func.title()}', title_size=title_size, hide_x=False,
                     hide_y=not first_func, col_by_freq=col_by_freq, col_palette=col_palette, ax=ax,
                     do_lim=do_lim, ll=ll, ul=ul)
        ax.legend(loc='upper left', ncol=3)
    plt.tight_layout()
    return fig,axss

def plot_all_horizontal(m, normalize=False, title_size=14, col_by_freq=col_by_freq, col_palette=col_palette, do_lim=True,
                        ll=0.2, ul=0.8):
    data = get_data(m, normalize=normalize)
#     fig,axss = plt.subplots(4, 3, figsize=(14,16), sharex=do_lim, sharey=do_lim)
    fig,axss = plt.subplots(3, 4, figsize=(28,20), sharex=False, sharey=False)#20,12
    for i,exp in enumerate(['exp1','exp2','exp3','exp4']):#
        first_exp = i==0
        axs = axss[:,i]
        for j,(ax,func) in enumerate(zip(axs,['sphere', 'rosenbrock', 'rastrigin'])):
            first_func = i==0
            test = data.query(f'experiment=={exp!r} and function=={func!r}').sort_values('method', ascending=False)
            plot_one(test, m, normalize=normalize, title=f'{exp}-{func.title()}', title_size=title_size, hide_x=False,
                     hide_y=not first_func, col_by_freq=col_by_freq, col_palette=col_palette, ax=ax,
                     do_lim=do_lim, ll=ll, ul=ul)
        
    for axs in axss: axs[-1].legend(loc='upper right', ncol=3)
    plt.tight_layout()
    return fig,axss

def get_heatmap_data(m):
    df = get_data(m)
    df = df[df.nnp.isna() | (df.nnp == str(nn_p))].drop('nnp', axis=1)
    df.function = df.function.str.title()
    m = m.upper()
    df_pivot = df.pivot_table(index=['experiment','function','freq'], columns=['method'], values=[m],
                              aggfunc='mean')[m]
    return df_pivot

# Plots

In [414]:
df_pivot = get_heatmap_data('mof')[labels_order]
df_pivot_rank = df_pivot.rank(axis=1)
df_pivot = df_pivot.reset_index()
df_pivot.experiment = df_pivot.experiment.str.slice(3)
df_pivot.set_index(['experiment','function','freq'], inplace=True)

Sorting because non-concatenation axis is not aligned. A future version
of pandas will change to not sort by default.

To accept the future behavior, pass 'sort=False'.




In [415]:
df_pivot_rank = df_pivot_rank.query(f'freq=={freqlimit}')
df_pivot = df_pivot.query(f'freq=={freqlimit}')

In [416]:
df_pivot.style.background_gradient(cmap=plt.cm.Greens, axis=1)

Unnamed: 0_level_0,Unnamed: 1_level_0,method,noNN_RI,NN_RI,noNN_HMu,NN_HMu,noNN_No,NN_No,noNN_Rst,NN_Rst
experiment,function,freq,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1
1,Rastrigin,10.0,28.9707,35.9541,44.8104,45.327,495.517,461.781,70.5126,79.9719
1,Rosenbrock,10.0,12904.3,12855.7,20735.2,13688.2,1897650.0,56462.2,22773.5,32169.8
1,Sphere,10.0,3.69325,3.87804,5.71827,4.26535,523.23,17.0778,7.07603,9.34691
2,Rastrigin,10.0,21.1277,21.6001,22.1115,24.8553,36.0356,22.0951,97.2913,109.371
2,Rosenbrock,10.0,259.323,331.247,583.509,715.332,195.092,135.627,5839.66,5201.47
2,Sphere,10.0,0.296526,0.430068,0.618716,0.832421,9.71964,0.21296,4.74717,4.84787
3,Rastrigin,10.0,26.3746,36.2383,57.7198,80.0655,838.864,755.85,42.8156,56.1327
3,Rosenbrock,10.0,59.1273,58.7844,51.5603,62.1723,78.2425,57.9463,54836.5,72831.2
3,Sphere,10.0,0.0806472,0.0758166,0.0684503,0.11345,0.0824397,0.0829051,9.7454,13.7734
4,Rastrigin,10.0,153.789,116.25,132.085,106.172,4038.62,720.563,94.2977,124.947


In [417]:
df_pivot_rank.style.background_gradient(cmap=plt.cm.Greens, axis=1)

Unnamed: 0_level_0,Unnamed: 1_level_0,method,noNN_RI,NN_RI,noNN_HMu,NN_HMu,noNN_No,NN_No,noNN_Rst,NN_Rst
experiment,function,freq,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1
exp1,Rastrigin,10.0,1,2,3,4,8,7,5,6
exp1,Rosenbrock,10.0,2,1,4,3,8,7,5,6
exp1,Sphere,10.0,1,2,4,3,8,7,5,6
exp2,Rastrigin,10.0,1,2,4,5,6,3,7,8
exp2,Rosenbrock,10.0,3,4,5,6,2,1,8,7
exp2,Sphere,10.0,2,3,4,5,8,1,6,7
exp3,Rastrigin,10.0,1,2,5,6,8,7,3,4
exp3,Rosenbrock,10.0,4,3,1,5,6,2,7,8
exp3,Sphere,10.0,3,2,1,6,4,5,7,8
exp4,Rastrigin,10.0,6,3,5,2,8,7,1,4


In [418]:
summary = df_pivot.groupby(['experiment', 'function']).mean()
summary.round(2).style.background_gradient(cmap=plt.cm.Greens, axis=1)

Unnamed: 0_level_0,method,noNN_RI,NN_RI,noNN_HMu,NN_HMu,noNN_No,NN_No,noNN_Rst,NN_Rst
experiment,function,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
1,Rastrigin,28.97,35.95,44.81,45.33,495.52,461.78,70.51,79.97
1,Rosenbrock,12904.4,12855.7,20735.2,13688.2,1897650.0,56462.2,22773.5,32169.8
1,Sphere,3.69,3.88,5.72,4.27,523.23,17.08,7.08,9.35
2,Rastrigin,21.13,21.6,22.11,24.86,36.04,22.1,97.29,109.37
2,Rosenbrock,259.32,331.25,583.51,715.33,195.09,135.63,5839.66,5201.47
2,Sphere,0.3,0.43,0.62,0.83,9.72,0.21,4.75,4.85
3,Rastrigin,26.37,36.24,57.72,80.07,838.86,755.85,42.82,56.13
3,Rosenbrock,59.13,58.78,51.56,62.17,78.24,57.95,54836.5,72831.2
3,Sphere,0.08,0.08,0.07,0.11,0.08,0.08,9.75,13.77
4,Rastrigin,153.79,116.25,132.09,106.17,4038.62,720.56,94.3,124.95


In [419]:
out = summary.round(2).style
for i in range(len(labels_order)//2): 
    out = out.highlight_min(axis=1, subset=labels_order[i*2:(i+1)*2])

out

Unnamed: 0_level_0,method,noNN_RI,NN_RI,noNN_HMu,NN_HMu,noNN_No,NN_No,noNN_Rst,NN_Rst
experiment,function,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
1,Rastrigin,28.97,35.95,44.81,45.33,495.52,461.78,70.51,79.97
1,Rosenbrock,12904.4,12855.7,20735.2,13688.2,1897650.0,56462.2,22773.5,32169.8
1,Sphere,3.69,3.88,5.72,4.27,523.23,17.08,7.08,9.35
2,Rastrigin,21.13,21.6,22.11,24.86,36.04,22.1,97.29,109.37
2,Rosenbrock,259.32,331.25,583.51,715.33,195.09,135.63,5839.66,5201.47
2,Sphere,0.3,0.43,0.62,0.83,9.72,0.21,4.75,4.85
3,Rastrigin,26.37,36.24,57.72,80.07,838.86,755.85,42.82,56.13
3,Rosenbrock,59.13,58.78,51.56,62.17,78.24,57.95,54836.5,72831.2
3,Sphere,0.08,0.08,0.07,0.11,0.08,0.08,9.75,13.77
4,Rastrigin,153.79,116.25,132.09,106.17,4038.62,720.56,94.3,124.95


# Interactive

In [403]:
from ipywidgets import interact
def show_table(dm):
    out = summary[[f'noNN_{dm}', f'NN_{dm}']].round(2)
    return out.style.background_gradient(cmap=plt.cm.Blues_r, axis=1)
    
interact(show_table, dm=['RI', 'HMu','No','Rst'])

interactive(children=(Dropdown(description='dm', options=('RI', 'HMu', 'No', 'Rst'), value='RI'), Output()), _…

<function __main__.show_table(dm)>