In [1]:
import pandas as pd
import numpy as np

In [2]:
def maze_summary(dataframe, category):
    '''
    Calculate the means and standard deviations of certain categories in the dataframe.

    The statistics are computed separately for every combination of the unique values
    found in the 'maze', 'mode', 'intuition' and 'heuristic' columns, and are rounded
    to two decimals.

    dataframe: data table containing 'maze', 'mode', 'intuition' and 'heuristic' columns, pandas dataframe
    category: user specified categories (column names) for calculation, python list
    return: (summary_mean, summary_std), tuple of two pandas dataframes; each row is
            [maze, mode, intuition, heuristic] followed by one statistic per category,
            and the columns carry default integer labels
    '''
    maze_list = dataframe['maze'].unique().tolist()
    mode_list = dataframe['mode'].unique().tolist()
    intuition_list = dataframe['intuition'].unique().tolist()
    heuristic_list = dataframe['heuristic'].unique().tolist()
    # Rows are collected in plain lists and turned into dataframes once at the end.
    # DataFrame.append was removed in pandas 2.0, and growing a frame row by row
    # copies it on every iteration.
    mean_rows = []
    std_rows = []
    for maze in maze_list:
        maze_mask = dataframe['maze'] == maze
        for mode in mode_list:
            mode_mask = maze_mask & (dataframe['mode'] == mode)
            for intuition in intuition_list:
                intuition_mask = mode_mask & (dataframe['intuition'] == intuition)
                for heuristic in heuristic_list:
                    selected = intuition_mask & (dataframe['heuristic'] == heuristic)
                    # A combination that matches no row is still reported; its
                    # statistics come out as NaN.
                    data = dataframe.loc[selected, category]
                    data_mean = np.around(data.mean().values, decimals = 2).tolist()
                    data_std = np.around(data.std().values, decimals = 2).tolist()
                    key = [maze, mode, intuition, heuristic]
                    mean_rows.append(key + data_mean)
                    std_rows.append(key + data_std)
    summary_mean = pd.DataFrame(mean_rows)
    summary_std = pd.DataFrame(std_rows)
    return (summary_mean, summary_std)

In [3]:
def file_process(file_list):
    '''
    Process files for maze_summary.

    Each file is read as a comma-separated table, summarised with maze_summary,
    and the per-file summaries are stacked into one table of means and one table
    of standard deviations.

    file_list: file name list, python list
    return: (summary_mean, summary_std), tuple of two pandas dataframes; both are
            empty when file_list is empty
    '''
    mean_parts = []
    std_parts = []
    for file_name in file_list:
        dataframe = pd.read_csv(file_name, sep = ',')
        # Every column from the fifth onwards is summarised; this assumes the four
        # key columns used by maze_summary come first in the file.
        category = dataframe.columns.values.tolist()[4:]
        part_mean, part_std = maze_summary(dataframe = dataframe, category = category)
        mean_parts.append(part_mean)
        std_parts.append(part_std)
    # pd.concat refuses an empty list, so the empty-input case is handled explicitly.
    if not mean_parts:
        return (pd.DataFrame(), pd.DataFrame())
    # One concatenation at the end replaces DataFrame.append, which was removed in
    # pandas 2.0 and copied the accumulated table on every iteration.
    summary_mean = pd.concat(mean_parts, ignore_index = True)
    summary_std = pd.concat(std_parts, ignore_index = True)
    return (summary_mean, summary_std)

In [4]:
def summary_process(dataframe_list):
    '''
    Merge statistics of multiple dataframe in a list.

    Each dataframe is summarised with maze_summary, and the per-dataframe summaries
    are stacked into one table of means and one table of standard deviations.

    dataframe_list: dataframe list, python list
    return: (summary_mean, summary_std), tuple of two pandas dataframes; both are
            empty when dataframe_list is empty
    '''
    mean_parts = []
    std_parts = []
    for dataframe in dataframe_list:
        # Every column from the fifth onwards is summarised; this assumes the four
        # key columns used by maze_summary come first in the dataframe.
        category = dataframe.columns.values.tolist()[4:]
        part_mean, part_std = maze_summary(dataframe = dataframe, category = category)
        mean_parts.append(part_mean)
        std_parts.append(part_std)
    # pd.concat refuses an empty list, so the empty-input case is handled explicitly.
    if not mean_parts:
        return (pd.DataFrame(), pd.DataFrame())
    # One concatenation at the end replaces DataFrame.append, which was removed in
    # pandas 2.0 and copied the accumulated table on every iteration.
    summary_mean = pd.concat(mean_parts, ignore_index = True)
    summary_std = pd.concat(std_parts, ignore_index = True)
    return (summary_mean, summary_std)

In [5]:
# Result files to summarise, one per maze
file_list = [
    'test_result_maze_01.csv',
    'test_result_maze_02.csv',
    'test_result_maze_03.csv',
]

In [6]:
# Read every result file into its own dataframe, keeping the order of file_list
dataframe_list = [pd.read_csv(file_name, sep = ',') for file_name in file_list]

In [7]:
# Preview the first five rows of the first dataframe
dataframe_list[0].head(5)

Unnamed: 0,maze,mode,intuition,heuristic,num_actions_1,length_movement_1,num_actions_2,length_movement_2,num_actions_3,length_movement_3,true_coverage,score,exploration_time,computation_time
0,1,complete,False,False,190.0,223.0,11.0,17.0,17.0,32.0,1.0,23.7,549.488,549.858
1,1,complete,False,False,190.0,223.0,11.0,17.0,17.0,32.0,1.0,23.7,591.497,591.88
2,1,complete,False,False,176.0,203.0,12.0,21.0,17.0,32.0,1.0,23.266667,365.862,366.253
3,1,complete,False,False,183.0,221.0,18.0,31.0,17.0,32.0,1.0,23.7,394.488,394.887
4,1,complete,False,False,187.0,210.0,9.0,18.0,17.0,32.0,1.0,23.533333,403.505,403.874


In [8]:
# Add maze_size information
# Calculate exploration efficiency
# Maze id -> maze size (presumably the number of grid cells; 144 = 12 * 12, etc.)
maze_size_dict = {1: 144, 2: 196, 3: 256}
# Iterate over the frames themselves: xrange only exists in Python 2 and the
# index was never needed. Each frame is updated in place; an unknown maze id
# still raises KeyError.
for maze_frame in dataframe_list:
    maze_frame['maze_size'] = maze_frame['maze'].map(lambda maze_id: maze_size_dict[maze_id])
    # maze_size * true_coverage, then divided by the actions taken / the length
    # moved in run 1
    covered = maze_frame['maze_size'] * maze_frame['true_coverage']
    maze_frame['num_grid_per_action_1'] = covered / maze_frame['num_actions_1']
    maze_frame['num_grid_per_length_1'] = covered / maze_frame['length_movement_1']

In [9]:
# Preview the first five rows again, now including the derived columns
dataframe_list[0].head(5)

Unnamed: 0,maze,mode,intuition,heuristic,num_actions_1,length_movement_1,num_actions_2,length_movement_2,num_actions_3,length_movement_3,true_coverage,score,exploration_time,computation_time,maze_size,num_grid_per_action_1,num_grid_per_length_1
0,1,complete,False,False,190.0,223.0,11.0,17.0,17.0,32.0,1.0,23.7,549.488,549.858,144,0.757895,0.64574
1,1,complete,False,False,190.0,223.0,11.0,17.0,17.0,32.0,1.0,23.7,591.497,591.88,144,0.757895,0.64574
2,1,complete,False,False,176.0,203.0,12.0,21.0,17.0,32.0,1.0,23.266667,365.862,366.253,144,0.818182,0.70936
3,1,complete,False,False,183.0,221.0,18.0,31.0,17.0,32.0,1.0,23.7,394.488,394.887,144,0.786885,0.651584
4,1,complete,False,False,187.0,210.0,9.0,18.0,17.0,32.0,1.0,23.533333,403.505,403.874,144,0.770053,0.685714


In [10]:
# Display labels for the summary tables, in the column order of the summaries
column_names = [
    'Maze',
    'Mode',
    'Intuition',
    'Heuristics',
    'Time Steps 1',
    'Path Length 1',
    'Time Steps 2',
    'Path Length 2',
    'Time Steps 3',
    'Path Length 3',
    'Coverage',
    'Score',
    'Exploration Time',
    'Computation Time',
    'Maze Size',
    'Number of Grid Visited Per Time Step during Exploration',
    'Number of Grid Visited Per Path Length during Exploration',
]

In [11]:
# Summarise every dataframe, then split the result into its mean and std tables
summary = summary_process(dataframe_list)
summary_mean, summary_std = summary

In [12]:
# Give both summary tables the same readable column labels
summary_mean.columns = summary_std.columns = column_names

In [13]:
# Display the table of means (rounded to two decimals by maze_summary),
# one row per maze / mode / intuition / heuristic combination
summary_mean

Unnamed: 0,Maze,Mode,Intuition,Heuristics,Time Steps 1,Path Length 1,Time Steps 2,Path Length 2,Time Steps 3,Path Length 3,Coverage,Score,Exploration Time,Computation Time,Maze Size,Number of Grid Visited Per Time Step during Exploration,Number of Grid Visited Per Path Length during Exploration
0,1,complete,False,False,185.5,220.4,11.6,20.4,17.0,32.0,1.0,23.57,415.4,415.81,144.0,0.78,0.65
1,1,complete,False,True,189.1,225.7,9.0,15.9,17.0,32.0,1.0,23.6,109.17,109.62,144.0,0.76,0.64
2,1,complete,True,False,186.8,219.7,7.6,15.1,17.0,32.0,1.0,23.48,79.08,79.43,144.0,0.77,0.66
3,1,complete,True,True,186.1,216.5,9.6,17.3,17.0,32.0,1.0,23.52,43.44,43.79,144.0,0.77,0.67
4,1,incomplete,False,False,118.8,136.2,18.3,31.2,18.3,32.4,0.7,22.87,257.91,258.24,144.0,0.88,0.78
5,1,incomplete,False,True,133.7,150.8,17.8,31.8,17.8,33.2,0.79,22.85,61.72,62.05,144.0,0.86,0.77
6,1,incomplete,True,False,102.2,114.4,18.4,31.2,18.4,32.2,0.64,22.42,37.99,38.32,144.0,0.91,0.82
7,1,incomplete,True,True,141.5,161.8,17.3,30.6,17.3,32.4,0.82,22.59,29.95,30.27,144.0,0.84,0.75
8,2,complete,False,False,256.4,302.4,12.7,22.2,22.0,43.0,1.0,30.97,680.18,680.7,196.0,0.77,0.65
9,2,complete,False,True,268.1,323.8,13.9,26.0,22.0,43.0,1.0,31.4,161.89,162.37,196.0,0.73,0.61


In [14]:
# Display the table of standard deviations (rounded to two decimals by maze_summary),
# one row per maze / mode / intuition / heuristic combination
summary_std

Unnamed: 0,Maze,Mode,Intuition,Heuristics,Time Steps 1,Path Length 1,Time Steps 2,Path Length 2,Time Steps 3,Path Length 3,Coverage,Score,Exploration Time,Computation Time,Maze Size,Number of Grid Visited Per Time Step during Exploration,Number of Grid Visited Per Path Length during Exploration
0,1,complete,False,False,5.36,10.53,3.69,5.99,0.0,0.0,0.0,0.23,128.94,128.91,0.0,0.02,0.03
1,1,complete,False,True,4.51,8.35,5.06,8.6,0.0,0.0,0.0,0.27,14.47,14.5,0.0,0.02,0.02
2,1,complete,True,False,4.96,6.17,4.33,7.23,0.0,0.0,0.0,0.12,20.15,20.14,0.0,0.02,0.02
3,1,complete,True,True,4.68,5.72,4.86,8.84,0.0,0.0,0.0,0.22,2.78,2.79,0.0,0.02,0.02
4,1,incomplete,False,False,52.05,65.01,1.49,1.69,1.49,0.84,0.26,0.92,131.54,131.55,0.0,0.08,0.11
5,1,incomplete,False,True,35.63,43.49,0.92,2.2,0.92,2.15,0.18,0.82,18.44,18.44,0.0,0.05,0.07
6,1,incomplete,True,False,30.77,38.65,1.43,1.4,1.43,1.48,0.17,1.17,21.37,21.37,0.0,0.04,0.08
7,1,incomplete,True,True,35.39,44.61,0.67,1.35,0.67,1.26,0.17,1.02,9.4,9.42,0.0,0.05,0.08
8,2,complete,False,False,9.7,16.62,5.64,10.11,0.0,0.0,0.0,0.45,157.31,157.34,0.0,0.03,0.03
9,2,complete,False,True,8.49,15.31,7.42,14.79,0.0,0.0,0.0,0.45,12.7,12.71,0.0,0.02,0.03


In [15]:
# Write both summary tables as comma-separated files without the row index
summary_mean.to_csv('summary_mean.csv', index = False)
summary_std.to_csv('summary_std.csv', index = False)