In [None]:
import os

import pandas as pd

import pareto

import matplotlib.pyplot as plt
%matplotlib inline

In [None]:
# Plot styling. Matplotlib 3.6 renamed its bundled seaborn styles to
# 'seaborn-v0_8-*' and 3.8 removed the old names, so use whichever name this
# installation provides instead of failing on newer versions. If neither is
# available the default Matplotlib style is kept.
for _style_name in ('seaborn-v0_8-bright', 'seaborn-bright'):
    if _style_name in plt.style.available:
        plt.style.use(_style_name)
        break
plt.rcParams['figure.figsize'] = [15, 9]
plt.rcParams['font.size'] = 12

# Show every column when a DataFrame is displayed.
pd.set_option('display.max_columns', None)
# pd.set_option('display.max_rows', None)

In [None]:
# Directory the notebook runs from; the data paths are resolved relative to it.
cwd = os.getcwd()
# Short aliases for the two os.path helpers used to build those paths.
join, norm = os.path.join, os.path.normpath

In [None]:
def _resolve_from_cwd(relative_path):
    """Return ``relative_path`` joined onto ``cwd`` and normalised."""
    return norm(join(cwd, relative_path))


# One statistics CSV per method, each located relative to the working directory.
dynamic_path = _resolve_from_cwd('../dynamic/runs/dynamic_stats.csv')
static_path = _resolve_from_cwd('../static/runs/static_stats.csv')
mlaa_path = _resolve_from_cwd('../MLAA-Bernier/runs/MLAA_stats.csv')
liu_path = _resolve_from_cwd('../Hierarchical-Liu/runs/Hierarchical_stats.csv')
cenk_path = _resolve_from_cwd('../Yavuzturk/runs/Yavuzturk_stats.csv')

In [None]:
# Every statistics file is read the same way: first CSV column becomes the index.
_read_options = dict(index_col=[0])

df_d = pd.read_csv(dynamic_path, **_read_options)
df_s = pd.read_csv(static_path, **_read_options)
df_m = pd.read_csv(mlaa_path, **_read_options)
df_l = pd.read_csv(liu_path, **_read_options)
df_c = pd.read_csv(cenk_path, **_read_options)

In [None]:
# Preview the first two rows of the table loaded from dynamic_stats.csv.
df_d.head(2)

In [None]:
def find_claesson(load, year, df=None):
    """Return ``(rmse, run time fraction)`` for the single reference run.

    The reference run is the row whose ``'start width'`` and ``'end width'``
    are both 5 and whose ``'exp_rate'`` is 2, for the requested load and
    simulation time. The comparison plot labels this point 'Claesson'.

    Parameters
    ----------
    load : str
        Value to match in the ``'load'`` column (e.g. ``'balanced'``).
    year : int or float
        Value to match in the ``'sim time'`` column.
    df : pandas.DataFrame, optional
        Table to search. Defaults to the notebook-level ``df_d``.

    Returns
    -------
    tuple of (float, float)
        The ``'rmse'`` and ``'run time fraction'`` values of the matching row.

    Raises
    ------
    ValueError
        If the filters do not select exactly one row.
    """
    if df is None:
        df = df_d

    mask = (
        (df['load'] == load)
        & (df['sim time'] == year)
        & (df['start width'] == 5)
        & (df['end width'] == 5)
        & (df['exp_rate'] == 2)
    )
    matches = df.loc[mask, ['rmse', 'run time fraction']]

    # Converting a multi-element (or empty) array with float() fails with an
    # unhelpful message, so check the match count explicitly.
    if len(matches) != 1:
        raise ValueError(
            'expected exactly one reference run for load={!r}, sim time={!r}; '
            'found {}'.format(load, year, len(matches))
        )

    row = matches.iloc[0]
    return float(row['rmse']), float(row['run time fraction'])

In [None]:
# Quick check: look up the reference point for the balanced load at sim time 1.
find_claesson('balanced', 1)

In [None]:
# Scatter marker symbols used by the plotting helpers in this notebook. They are
# picked by position; the method-comparison plot draws its 'Claesson' point with
# the last entry.
markers = ['X', 'D', 'v', 'h', '+', '*']

In [None]:
def plot_all_methods_runtimefrac_vs_rmse(dfs, names, load, year):
    """Scatter run time fraction against RMSE for several methods on one figure.

    Each table in ``dfs`` is filtered to the rows matching ``load`` and
    ``year`` and drawn as its own scatter series. The point returned by
    ``find_claesson(load, year)`` is added as a series labelled 'Claesson'.
    The figure is saved as ``'<load>_<year>.pdf'`` in the current working
    directory and then shown.

    Parameters
    ----------
    dfs : sequence of pandas.DataFrame
        Tables with ``'load'``, ``'sim time'``, ``'rmse'`` and
        ``'run time fraction'`` columns.
    names : sequence of str
        Legend label for each table, in the same order as ``dfs``.
    load : str
        Value to match in the ``'load'`` column; also used in the title and
        the output file name.
    year : int or float
        Value to match in the ``'sim time'`` column; also used in the title
        and the output file name.
    """
    fig = plt.figure(figsize=(7, 5), dpi=200)
    ax = fig.add_subplot(1, 1, 1)

    # The last marker is reserved for the Claesson point. The datasets cycle
    # through the remaining ones, so passing more tables than markers neither
    # raises IndexError nor reuses the Claesson symbol.
    dataset_markers = markers[:-1]

    for idx, df in enumerate(dfs):
        mask = (df['load'] == load) & (df['sim time'] == year)
        ax.scatter(
            df.loc[mask, 'rmse'],
            df.loc[mask, 'run time fraction'],
            label=names[idx],
            marker=dataset_markers[idx % len(dataset_markers)],
        )

    x, y = find_claesson(load, year)
    ax.scatter(x, y, label='Claesson', marker=markers[-1])

    # Use the explicit axes/figure objects rather than pyplot's "current
    # figure" state, so the labels always land on the figure created above.
    ax.set_xlabel('RMSE MFT [C]')
    ax.set_ylabel('Runtime Fraction')
    ax.set_title('{} {}'.format(load.title(), year))

    ax.legend()
    ax.grid(True)
    fig.savefig('{}_{}.pdf'.format(load, year), bbox_inches='tight')
    plt.show()

In [None]:
# Compare all five methods for the balanced load at sim time 1.
plot_all_methods_runtimefrac_vs_rmse(
    dfs=[df_d, df_s, df_m, df_l, df_c],
    names=['Dynamic', 'Static', 'Bernier', 'Liu', 'Yavuzturk'],
    load='balanced',
    year=1,
)

In [None]:
# Compare all five methods for the imbalanced load at sim time 1.
plot_all_methods_runtimefrac_vs_rmse(
    dfs=[df_d, df_s, df_m, df_l, df_c],
    names=['Dynamic', 'Static', 'Bernier', 'Liu', 'Yavuzturk'],
    load='imbalanced',
    year=1,
)

In [None]:
# Compare all five methods for the balanced load at sim time 5.
plot_all_methods_runtimefrac_vs_rmse(
    dfs=[df_d, df_s, df_m, df_l, df_c],
    names=['Dynamic', 'Static', 'Bernier', 'Liu', 'Yavuzturk'],
    load='balanced',
    year=5,
)

In [None]:
# Compare all five methods for the imbalanced load at sim time 5.
plot_all_methods_runtimefrac_vs_rmse(
    dfs=[df_d, df_s, df_m, df_l, df_c],
    names=['Dynamic', 'Static', 'Bernier', 'Liu', 'Yavuzturk'],
    load='imbalanced',
    year=5,
)

In [None]:
# Compare all five methods for the balanced load at sim time 10.
plot_all_methods_runtimefrac_vs_rmse(
    dfs=[df_d, df_s, df_m, df_l, df_c],
    names=['Dynamic', 'Static', 'Bernier', 'Liu', 'Yavuzturk'],
    load='balanced',
    year=10,
)

In [None]:
# Compare all five methods for the imbalanced load at sim time 10.
plot_all_methods_runtimefrac_vs_rmse(
    dfs=[df_d, df_s, df_m, df_l, df_c],
    names=['Dynamic', 'Static', 'Bernier', 'Liu', 'Yavuzturk'],
    load='imbalanced',
    year=10,
)

In [None]:
def define_pareto(df_in, objectives=(4, 5)):
    """Return the rows of ``df_in`` kept by ``pareto.eps_sort``, sorted by RMSE.

    Parameters
    ----------
    df_in : pandas.DataFrame
        Table of runs; must contain an ``'rmse'`` column. The index is not
        passed to the sort and is not carried over to the result.
    objectives : sequence of int, optional
        Zero-based positions, within ``df_in.columns``, of the columns that
        ``pareto.eps_sort`` treats as objectives. Defaults to ``(4, 5)``, the
        values that were previously hard-coded.
        NOTE(review): presumably the RMSE and run-time columns of the stats
        CSVs; confirm against the actual column order.

    Returns
    -------
    pandas.DataFrame
        The rows returned by ``pareto.eps_sort``, with the column names of
        ``df_in``, in ascending ``'rmse'`` order.
    """
    rows = list(df_in.itertuples(index=False))
    kept_rows = pareto.eps_sort([rows], list(objectives))
    df = pd.DataFrame.from_records(kept_rows, columns=list(df_in.columns))
    # Return a sorted copy instead of mutating with inplace=True.
    return df.sort_values(by=['rmse'])

In [None]:
# Boolean row mask over df_d: balanced load with sim time 1.
m_b1 = df_d['load'].eq('balanced') & df_d['sim time'].eq(1)

In [None]:
# Run define_pareto on the df_d rows selected by m_b1; the bare name on the last
# line displays the resulting table.
pareto_b1 = define_pareto(df_d.loc[m_b1])
pareto_b1

In [None]:

# NOTE(review): `df` and the masks `m_b2` ... `m_b6` are not defined in any cell
# visible in this notebook (only `df_d` and `m_b1` are). Unless they are defined
# elsewhere, this cell raises NameError on a fresh Restart & Run All; confirm
# which table and which mask definitions were intended.
pareto_b2 = define_pareto(df.loc[m_b2])
pareto_b3 = define_pareto(df.loc[m_b3])
pareto_b4 = define_pareto(df.loc[m_b4])
pareto_b5 = define_pareto(df.loc[m_b5])
pareto_b6 = define_pareto(df.loc[m_b6])

In [None]:
# NOTE(review): `df` and the masks `m_i1` ... `m_i6` are not defined in any cell
# visible in this notebook. Unless they are defined elsewhere, this cell raises
# NameError on a fresh Restart & Run All; confirm where they should come from.
pareto_i1 = define_pareto(df.loc[m_i1])
pareto_i2 = define_pareto(df.loc[m_i2])
pareto_i3 = define_pareto(df.loc[m_i3])
pareto_i4 = define_pareto(df.loc[m_i4])
pareto_i5 = define_pareto(df.loc[m_i5])
pareto_i6 = define_pareto(df.loc[m_i6])

In [None]:
# One figure per balanced-load table pareto_b1 ... pareto_b6, each called with
# the 'exp_rate' column name and its own title.
# NOTE(review): `make_fig` and `exp_rates` are not defined in any cell visible
# in this notebook; confirm where they come from before relying on this cell.
make_fig(pareto_b1, exp_rates, 'exp_rate', '1-year Balanced')
make_fig(pareto_b2, exp_rates, 'exp_rate', '2-year Balanced')
make_fig(pareto_b3, exp_rates, 'exp_rate', '3-year Balanced')
make_fig(pareto_b4, exp_rates, 'exp_rate', '4-year Balanced')
make_fig(pareto_b5, exp_rates, 'exp_rate', '5-year Balanced')
make_fig(pareto_b6, exp_rates, 'exp_rate', '6-year Balanced')

In [None]:
# One figure per imbalanced-load table pareto_i1 ... pareto_i6, each called with
# the 'exp_rate' column name and its own title.
# NOTE(review): `make_fig` and `exp_rates` are not defined in any cell visible
# in this notebook; confirm where they come from before relying on this cell.
make_fig(pareto_i1, exp_rates, 'exp_rate', '1-year Imbalanced')
make_fig(pareto_i2, exp_rates, 'exp_rate', '2-year Imbalanced')
make_fig(pareto_i3, exp_rates, 'exp_rate', '3-year Imbalanced')
make_fig(pareto_i4, exp_rates, 'exp_rate', '4-year Imbalanced')
make_fig(pareto_i5, exp_rates, 'exp_rate', '5-year Imbalanced')
make_fig(pareto_i6, exp_rates, 'exp_rate', '6-year Imbalanced')

In [None]:
def make_fig_with_annotation(df_in, mask_series, mask_col_name, annotate_col_name, title=None):
    """Scatter 'run time' against 'rmse', grouped by a column, with point labels.

    For every value in ``mask_series`` (visited in reverse order) the rows of
    ``df_in`` whose ``mask_col_name`` equals ``float(value)`` are drawn as one
    scatter series, and each point is annotated with that row's
    ``annotate_col_name`` value. Markers come from the notebook-level
    ``markers`` list, indexed by drawing order.

    Parameters
    ----------
    df_in : pandas.DataFrame
        Table with ``'rmse'`` and ``'run time'`` columns plus the two columns
        named by ``mask_col_name`` and ``annotate_col_name``.
    mask_series : reversible sequence
        Group values; each one is also used as its legend label.
    mask_col_name : str
        Column compared against each group value.
    annotate_col_name : str
        Column whose values are written next to the points.
    title : str, optional
        Figure title; omitted when falsy.
    """
    figure = plt.figure()
    axes = figure.add_subplot(1, 1, 1)

    for position, group_value in enumerate(reversed(mask_series)):
        # Select this group's rows once and reuse them for both axes and labels.
        group_rows = df_in.loc[df_in[mask_col_name] == float(group_value)]
        rmse = group_rows['rmse']
        run_time = group_rows['run time']

        axes.scatter(rmse, run_time, marker=markers[position], label=group_value, s=60)

        # Place each row's annotation text at its own point.
        point_texts = group_rows[annotate_col_name].values
        for text, px, py in zip(point_texts, rmse.values, run_time.values):
            axes.annotate(text, (px, py))

    if title:
        plt.title(title)

    plt.legend()
    plt.show()

In [None]:
# Boolean row mask: rows whose 'exp_rate' equals 1.75.
# NOTE(review): `df` is not defined in any cell visible in this notebook (the
# loaded tables are df_d, df_s, df_m, df_l and df_c); confirm which was intended.
exp_rate_mask = df['exp_rate'] == 1.75

In [None]:
# Integers 1 through 5, passed to make_fig_with_annotation as the group values
# for the 'start width' column.
start_widths = range(1, 6)

In [None]:
# Annotated scatter per balanced-load mask, restricted to exp_rate_mask: points
# are grouped by 'start width' and labelled with 'end width'.
# NOTE(review): `df` and the masks `m_b2` ... `m_b6` are not defined in any cell
# visible in this notebook; confirm where they come from.
make_fig_with_annotation(df.loc[m_b1 & exp_rate_mask], start_widths, 'start width', 'end width', '1-year Balanced')
make_fig_with_annotation(df.loc[m_b2 & exp_rate_mask], start_widths, 'start width', 'end width', '2-year Balanced')
make_fig_with_annotation(df.loc[m_b3 & exp_rate_mask], start_widths, 'start width', 'end width', '3-year Balanced')
make_fig_with_annotation(df.loc[m_b4 & exp_rate_mask], start_widths, 'start width', 'end width', '4-year Balanced')
make_fig_with_annotation(df.loc[m_b5 & exp_rate_mask], start_widths, 'start width', 'end width', '5-year Balanced')
make_fig_with_annotation(df.loc[m_b6 & exp_rate_mask], start_widths, 'start width', 'end width', '6-year Balanced')

In [None]:
# Annotated scatter per imbalanced-load mask, restricted to exp_rate_mask:
# points are grouped by 'start width' and labelled with 'end width'.
# NOTE(review): `df` and the masks `m_i1` ... `m_i6` are not defined in any cell
# visible in this notebook; confirm where they come from.
make_fig_with_annotation(df.loc[m_i1 & exp_rate_mask], start_widths, 'start width', 'end width', '1-year Imbalanced')
make_fig_with_annotation(df.loc[m_i2 & exp_rate_mask], start_widths, 'start width', 'end width', '2-year Imbalanced')
make_fig_with_annotation(df.loc[m_i3 & exp_rate_mask], start_widths, 'start width', 'end width', '3-year Imbalanced')
make_fig_with_annotation(df.loc[m_i4 & exp_rate_mask], start_widths, 'start width', 'end width', '4-year Imbalanced')
make_fig_with_annotation(df.loc[m_i5 & exp_rate_mask], start_widths, 'start width', 'end width', '5-year Imbalanced')
make_fig_with_annotation(df.loc[m_i6 & exp_rate_mask], start_widths, 'start width', 'end width', '6-year Imbalanced')

In [None]:
def make_some_plot(*args):
    """Draw one line per series on a single gridded figure and show it.

    A series is any object indexable by key that provides ``'x'`` and ``'y'``
    and, optionally, ``'label'`` (for example a dict). A series without a
    ``'label'`` key is drawn unlabelled.

    The series may be given either as one iterable, the original calling
    convention ``make_some_plot([a, b, c])``, or as separate positional
    arguments, ``make_some_plot(a, b, c)``. Calling with no arguments shows
    an empty figure.

    Raises
    ------
    KeyError
        If a series has no ``'x'`` or ``'y'`` entry.
    """
    from collections.abc import Mapping

    # A single non-mapping argument is the container of series (original
    # behaviour); anything else means the series were passed one by one.
    if len(args) == 1 and not isinstance(args[0], Mapping):
        series_list = list(args[0])
    else:
        series_list = list(args)

    fig = plt.figure()
    ax = fig.add_subplot(1, 1, 1)

    any_labelled = False
    for s in series_list:
        # Only the optional label lookup is guarded, so a missing 'x' or 'y'
        # surfaces as a plain KeyError instead of being retried.
        try:
            plot_kwargs = {'label': s['label']}
            any_labelled = True
        except KeyError:
            plot_kwargs = {}
        ax.plot(s['x'], s['y'], **plot_kwargs)

    ax.grid(True)
    # Skip the legend when nothing is labelled to avoid Matplotlib's
    # "no artists with labels" warning.
    if any_labelled:
        ax.legend()
    plt.show()

In [None]:
# NOTE(review): `a`, `b` and `c` are not defined in any cell visible in this
# notebook. Unless they are defined elsewhere, this call raises NameError on a
# fresh Restart & Run All.
make_some_plot([a, b, c])