In [1]:
import os
import sys
import csv
import seaborn as sns
import matplotlib.pyplot as plt
import pandas as pd

# The repository root is two directory levels above the notebook's working
# directory; it is put on sys.path so the project-local `src` package imports.
repo_root = os.path.abspath(os.path.join(os.getcwd(), '..', '..'))
# Guard the append so re-running this cell does not pile up duplicate entries.
if repo_root not in sys.path:
    sys.path.append(repo_root)

from src import *

In [2]:
# Run the project's real-data pipeline on this notebook's working directory.
# NOTE(review): presumably this is what produces the results/*.csv summaries
# read by the cells below; confirm against the implementation in `src`.
process_directory_real_data(os.getcwd())

In [3]:


def _mean_by_dataset(csv_path):
    """Load one summary CSV and average every remaining column per dataset.

    The `rep` column is discarded before averaging because its mean is never
    used. `errors='ignore'` keeps the function usable on summaries that were
    written without a `rep` column.

    Returns a DataFrame indexed by `dataset` (sorted group keys), with one
    column per remaining CSV column.
    """
    summary = pd.read_csv(csv_path)
    per_rep_values = summary.drop(columns=['rep'], errors='ignore')
    # groupby(...).mean() already yields an index named 'dataset', so no
    # reset_index()/set_index() round trip is needed.
    return per_rep_values.groupby('dataset').mean()


def process_results(base_path):
    """Read both likelihood summaries under `base_path` and average them per dataset.

    Parameters
    ----------
    base_path : str
        Directory containing 'log_likelihood_summary.csv' and
        'leadership_log_likelihood_summary.csv'.

    Returns
    -------
    tuple of (pandas.DataFrame, pandas.DataFrame)
        `(log_likelihood, leadership_log_likelihood)`, each indexed by
        `dataset` and holding the per-dataset mean of every column other
        than `rep`.

    Raises
    ------
    FileNotFoundError
        If either summary file is missing (raised by `pd.read_csv`).
    KeyError
        If a summary has no `dataset` column.
    """
    filtered_log_like = _mean_by_dataset(
        os.path.join(base_path, 'log_likelihood_summary.csv')
    )
    filtered_leader_like = _mean_by_dataset(
        os.path.join(base_path, 'leadership_log_likelihood_summary.csv')
    )
    return filtered_log_like, filtered_leader_like


def visualize_df(df, title):
    """Print a title and render `df` as a uniformly styled table.

    Parameters
    ----------
    df : pandas.DataFrame
        Frame to render. Styling is applied through `df.style`.
    title : str
        Heading printed above the table, with a blank line before and after.

    Notes
    -----
    Relies on `display` being present in the namespace, as it is inside an
    IPython/Jupyter kernel.
    """
    print(f"\n{title}\n")

    # The earlier argument-less `set_table_styles()` call configured nothing,
    # so the per-cell properties are applied directly.
    cell_properties = {
        'background-color': 'LightGray',
        'color': 'black',
        'border-color': 'DarkBlue',
        'border-style': 'solid',
        'border-width': '1px',
        'text-align': 'left',
    }
    styled_df = df.style.set_properties(**cell_properties)

    display(styled_df)

In [4]:
# Dataset ids that actually occur in the log-likelihood summary of this run.
results_summary_path = os.path.join(os.getcwd(), 'results', 'log_likelihood_summary.csv')
unique_datasets = pd.read_csv(results_summary_path)['dataset'].unique()

# Keep only the catalogue rows for those datasets, keyed by dataset id.
dataset_info = pd.read_csv(os.path.join(repo_root, 'datasets', 'dataset_info.csv'))
is_tested = dataset_info['dataset_id'].isin(unique_datasets)
filtered_dataset_info = dataset_info.loc[is_tested].set_index('dataset_id')

visualize_df(filtered_dataset_info, 'Datasets Tested')



Datasets Tested



Unnamed: 0_level_0,name,N,M,K1,K2
dataset_id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
1,irish_election,36,138011,1,14
2,debian,36,3352,1,9
4,netflix_prize,196,163759,3,4
6,skate,249,174,14,30
7,electoral_reform_society,30,35610,1,29
8,glasgow_city_council,209,188376,1,13
9,AGH_course_selection,10,299,7,9
12,t_shirt,12,30,11,11
14,sushi,103,10000,10,10
18,minneapolis_election,778,137482,1,3


In [5]:

# Load both summaries from ./results, averaged per dataset by process_results.
log_like, leadership_log = process_results(os.path.join(os.getcwd(), 'results'))


In [6]:
# Per-dataset mean log likelihood, one column per column of the summary CSV.
visualize_df(log_like, 'log likelihood')


log likelihood



Unnamed: 0_level_0,BT,BT_leadership,HO_BT,HOL_BT,Spring_Rank,Spring_Rank_Leadership,Page_Rank,Page_Rank_Leadership,Point_Wise
dataset,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
1,-5.044229,-5.169924,-5.036036,-5.143064,-5.625426,-5.717296,-5.196946,-5.077089,-5.082346
2,-4.672714,-5.045789,-4.663846,-4.985351,-5.455923,-5.495389,-6.983254,-6.086496,-5.014611
4,-1.929228,-1.986866,-1.927163,-1.98513,-2.0083,-2.036996,-2.861661,-2.702381,-2.090668
6,-20.047749,-42.985954,-20.833562,-42.288676,-38.298251,-52.1519,-66.932374,-44.982715,-35.446929
7,-6.177104,-6.203007,-6.174987,-6.195116,-6.307919,-6.431429,-6.236753,-6.274201,-6.18484
8,-3.158094,-3.263374,-3.154436,-3.258237,-3.273359,-3.494488,-3.266435,-3.19952,-3.193524
9,-9.075683,-11.196154,-9.033729,-9.655373,-22.409253,-56.516805,-11.97639,-10.724481,-9.951059
12,-15.781606,-22.036627,-15.731733,-18.417697,-28.668071,-81.344196,-19.486445,-17.614313,-16.341428
14,-14.458811,-15.617013,-14.410356,-15.260622,-14.519396,-15.89553,-15.793643,-15.325292,-14.603172
18,-1.427299,-1.430719,-1.42713,-1.430777,-2.783171,-3.002387,-1.504377,-1.490002,-1.472192


In [7]:
# Per-dataset mean leadership log likelihood, one column per column of the summary CSV.
visualize_df(leadership_log, 'Leadership log likelihood')


Leadership log likelihood



Unnamed: 0_level_0,BT,BT_leadership,HO_BT,HOL_BT,Spring_Rank,Spring_Rank_Leadership,Page_Rank,Page_Rank_Leadership,Point_Wise
dataset,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
1,-1.413646,-1.396724,-1.415263,-1.395091,-1.433378,-1.419383,-1.471437,-1.440121,-1.432245
2,-1.249969,-1.218791,-1.260563,-1.217912,-1.368773,-1.272094,-2.00442,-1.719453,-1.403802
4,-0.960354,-0.947128,-0.967511,-0.947028,-1.015259,-1.001538,-1.512117,-1.402239,-1.095738
6,-0.745733,-0.714314,-0.830318,-0.811607,-2.550378,-1.226761,-4.375815,-3.057249,-2.419413
7,-1.521415,-1.52052,-1.522623,-1.519561,-1.53838,-1.544886,-1.535947,-1.538078,-1.526059
8,-1.145459,-1.116094,-1.146772,-1.114434,-1.158389,-1.141853,-1.228527,-1.19476,-1.174335
9,-0.798906,-2.308192,-0.879971,-1.160518,-1.349901,-0.311867,-3.065081,-2.215976,-1.679889
12,-2.293822,-2.239523,-2.350903,-2.240049,-2.713953,-2.90972,-2.619781,-2.425969,-2.290493
14,-2.089955,-2.048006,-2.126411,-2.041446,-2.134286,-2.100719,-2.32733,-2.237109,-2.196671
18,-0.926821,-0.925212,-0.927569,-0.925173,-1.529747,-1.610487,-0.988544,-0.975298,-0.968206
