In [1]:
# Libraries
import itertools
from importlib import resources
import pandas as pd
import numpy as np
from tqdm import tqdm

from drdt.helper_functions import DecisionRuleCreatorFromDecisionTable, Reduction, R_SR, R_AD, SAlphaStep, SPlus, SMax, NCover, NGreedy
from drdt.algorithms import DynamicProgrammingAlgorithms, A_C_N, A_C_G


# Loading Data

In [2]:
# Read the 'DRS_balance_scale' resource shipped in the datasets.DecisionRuleSystems
# package, keep a reproducible 10-row sample, and turn every populated cell into
# a string while leaving missing cells (NaN) untouched.
with resources.path('datasets.DecisionRuleSystems', 'DRS_balance_scale') as dataset_path:
    S = (
        pd.read_csv(dataset_path)
        .sample(n=10, random_state=42)
        # Column-wise Series.map replaces the element-wise DataFrame.applymap,
        # which pandas deprecated in 2.1; the per-cell conversion is unchanged.
        .apply(lambda column: column.map(lambda x: str(x) if pd.notnull(x) else x))
    )
S

Unnamed: 0,right-distance,right-weight,left-distance,left-weight,class
447,3.0,5.0,3.0,4.0,R
485,1.0,3.0,5.0,,L
215,1.0,,4.0,2.0,L
212,3.0,3.0,4.0,2.0,R
480,1.0,2.0,5.0,,L
515,1.0,4.0,,5.0,L
163,4.0,3.0,2.0,,R
77,3.0,1.0,4.0,,L
527,3.0,1.0,,5.0,L
145,,5.0,1.0,2.0,R


# Dataset Analyses

In [3]:
# One column of S is the class label, so it is left out of the feature count.
print(f"Number of features  = {S.shape[1] - 1}")

Number of features  = 4


In [4]:
# True when at least one row of S has a value in every column (no NaN at all).
has_complete_row = bool(S.notna().all(axis=1).any())
print(f"Does # of features = d  = {has_complete_row}")

Does # of features = d  = True


In [5]:
# Per-row number of populated (non-NaN) cells, class column included
non_nan_counts = S.notna().sum(axis=1)

# Label of the first row that reaches the largest count, and the row itself
max_non_nan_row_index = non_nan_counts.idxmax()
max_non_nan_row = S.loc[max_non_nan_row_index]

# Populated-cell count of that row
max_non_nan_count = non_nan_counts.loc[max_non_nan_row_index]

# Subtract 1 so the class column is not counted
print(f"d of  = {max_non_nan_count - 1}")

d of  = 4


In [6]:
# AR case: the sampled system S is used directly, with no reduction step.
P = S
# Feed SPlus(P) to NCover and report the size of the collection it returns.
B = NCover(SPlus(P))
print(f"Length of Node Cover for AR = {len(B)}")

Length of Node Cover for AR = 4


In [7]:
# SR case: S is first passed through R_SR.
P = R_SR(S)
# Feed SPlus(P) to NCover and report the size of the collection it returns.
B = NCover(SPlus(P))
print(f"Length of Node Cover for SR = {len(B)}")

Length of Node Cover for SR = 4


In [8]:
# AD case: S is first passed through R_AD.
P = R_AD(S)
# Feed SPlus(P) to NCover and report the size of the collection it returns.
B = NCover(SPlus(P))
print(f"Length of Node Cover for AD = {len(B)}")

Length of Node Cover for AD = 4


In [9]:
# AR case: the sampled system S is used directly, with no reduction step.
P = S
# Feed SPlus(P) to NGreedy and report the size of the collection it returns.
B = NGreedy(SPlus(P))
print(f"Length of Node Cover greedy for AR = {len(B)}")

Length of Node Cover greedy for AR = 1


In [10]:
# SR case: S is first passed through R_SR.
P = R_SR(S)
# Feed SPlus(P) to NGreedy and report the size of the collection it returns.
B = NGreedy(SPlus(P))
print(f"Length of Node Cover greedy for SR = {len(B)}")

Length of Node Cover greedy for SR = 1


In [11]:
# AD case: S is first passed through R_AD.
P = R_AD(S)
# Feed SPlus(P) to NGreedy and report the size of the collection it returns.
B = NGreedy(SPlus(P))
print(f"Length of Node Cover greedy for AD = {len(B)}")

Length of Node Cover greedy for AD = 1


# Dynamic Programming

In [12]:
# Value returned by the dynamic-programming routine A_DP on S with C="AR".
depth = DynamicProgrammingAlgorithms(C="AR").A_DP(S)
print(f"DP AR = {depth}")

DP AR = 4


In [13]:
# Value returned by the dynamic-programming routine A_DP on S with C="EAR".
depth = DynamicProgrammingAlgorithms(C="EAR").A_DP(S)
print(f"DP EAR = {depth}")

DP EAR = 4


In [14]:
# Value returned by the dynamic-programming routine A_DP on S with C="SR".
depth = DynamicProgrammingAlgorithms(C="SR").A_DP(S)
print(f"DP SR = {depth}")

DP SR = 4


In [15]:
# Value returned by the dynamic-programming routine A_DP on S with C="ESR".
depth = DynamicProgrammingAlgorithms(C="ESR").A_DP(S)
print(f"DP ESR = {depth}")

DP ESR = 4


In [16]:
# Value returned by the dynamic-programming routine A_DP on S with C="AD".
depth = DynamicProgrammingAlgorithms(C="AD").A_DP(S)
print(f"DP AD = {depth}")

DP AD = 4


In [17]:
# Value returned by the dynamic-programming routine A_DP on S with C="EAD".
depth = DynamicProgrammingAlgorithms(C="EAD").A_DP(S)
print(f"DP EAD = {depth}")

DP EAD = 4


# Combinations

In [18]:
# Possible values for each feature (they match the non-NaN values shown
# in the sampled table S, in order of first appearance)
right_distance_values = ['3.0', '1.0', '4.0']
right_weight_values = ['5.0', '3.0', '2.0', '4.0', '1.0']
left_distance_values = ['3.0', '5.0', '4.0', '2.0', '1.0']
left_weight_values = ['4.0', '2.0', '5.0']

# Full Cartesian product of the four value lists; the last feature varies fastest
combinations = [
    (right_distance, right_weight, left_distance, left_weight)
    for right_distance in right_distance_values
    for right_weight in right_weight_values
    for left_distance in left_distance_values
    for left_weight in left_weight_values
]


In [19]:
# Possible values for each feature, each list extended with the extra symbol '*'
# NOTE(review): '*' presumably stands for "any other value" in the extended
# (E-prefixed) settings -- confirm against the drdt documentation.
right_distance_values = ['3.0', '1.0', '4.0', '*']
right_weight_values = ['5.0', '3.0', '2.0', '4.0', '1.0', '*']
left_distance_values = ['3.0', '5.0', '4.0', '2.0', '1.0', '*']
left_weight_values = ['4.0', '2.0', '5.0', '*']

# Full Cartesian product of the four value lists; the last feature varies fastest
extended_combinations = [
    (right_distance, right_weight, left_distance, left_weight)
    for right_distance in right_distance_values
    for right_weight in right_weight_values
    for left_distance in left_distance_values
    for left_weight in left_weight_values
]


# Node Cover

In [20]:
# Run A_C_N (C="AR", N="cover") once per tuple in `combinations` and keep the
# first element of every solve() result.
feature_names = ['right-distance', 'right-weight', 'left-distance', 'left-weight']
depths = []

for comb in tqdm(combinations):
    # creating delta: the tuple's values labelled by feature name
    # (first row of a one-row frame)
    delta = pd.DataFrame([list(comb)], columns=feature_names).iloc[0]

    alg = A_C_N(C="AR", N="cover")
    depth, _ = alg.solve(S, delta=delta)
    depths.append(depth)

summary = (max(depths), min(depths), sum(depths) / len(depths))
print("NC AR")
print("(Max Depth, Min Depth, Average Depth) =", summary)

100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 225/225 [00:00<00:00, 547.28it/s]

NC AR
(Max Depth, Min Depth, Average Depth) = (4, 4, 4.0)





In [21]:
# Run A_C_N (C="EAR", N="cover") once per tuple in `extended_combinations` and
# keep the first element of every solve() result.
feature_names = ['right-distance', 'right-weight', 'left-distance', 'left-weight']
depths = []

for comb in tqdm(extended_combinations):
    # creating delta: the tuple's values labelled by feature name
    # (first row of a one-row frame)
    delta = pd.DataFrame([list(comb)], columns=feature_names).iloc[0]

    alg = A_C_N(C="EAR", N="cover")
    depth, _ = alg.solve(S, delta=delta)
    depths.append(depth)

summary = (max(depths), min(depths), sum(depths) / len(depths))
print("NC EAR")
print("(Max Depth, Min Depth, Average Depth) =", summary)

100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 576/576 [00:01<00:00, 554.91it/s]

NC EAR
(Max Depth, Min Depth, Average Depth) = (4, 4, 4.0)





In [22]:
# Run A_C_N (C="SR", N="cover") once per tuple in `combinations` and keep the
# first element of every solve() result.
feature_names = ['right-distance', 'right-weight', 'left-distance', 'left-weight']
depths = []

for comb in tqdm(combinations):
    # creating delta: the tuple's values labelled by feature name
    # (first row of a one-row frame)
    delta = pd.DataFrame([list(comb)], columns=feature_names).iloc[0]

    alg = A_C_N(C="SR", N="cover")
    depth, _ = alg.solve(S, delta=delta)
    depths.append(depth)

summary = (max(depths), min(depths), sum(depths) / len(depths))
print("NC SR")
print("(Max Depth, Min Depth, Average Depth) =", summary)

100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 225/225 [00:01<00:00, 134.09it/s]

NC SR
(Max Depth, Min Depth, Average Depth) = (4, 4, 4.0)





In [23]:
# Run A_C_N (C="ESR", N="cover") once per tuple in `extended_combinations` and
# keep the first element of every solve() result.
feature_names = ['right-distance', 'right-weight', 'left-distance', 'left-weight']
depths = []

for comb in tqdm(extended_combinations):
    # creating delta: the tuple's values labelled by feature name
    # (first row of a one-row frame)
    delta = pd.DataFrame([list(comb)], columns=feature_names).iloc[0]

    alg = A_C_N(C="ESR", N="cover")
    depth, _ = alg.solve(S, delta=delta)
    depths.append(depth)

summary = (max(depths), min(depths), sum(depths) / len(depths))
print("NC ESR")
print("(Max Depth, Min Depth, Average Depth) =", summary)

100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 576/576 [00:04<00:00, 135.97it/s]

NC ESR
(Max Depth, Min Depth, Average Depth) = (4, 4, 4.0)





In [24]:
# Run A_C_N (C="AD", N="cover") once per tuple in `combinations` and keep the
# first element of every solve() result.
feature_names = ['right-distance', 'right-weight', 'left-distance', 'left-weight']
depths = []

for comb in tqdm(combinations):
    # creating delta: the tuple's values labelled by feature name
    # (first row of a one-row frame)
    delta = pd.DataFrame([list(comb)], columns=feature_names).iloc[0]

    alg = A_C_N(C="AD", N="cover")
    depth, _ = alg.solve(S, delta=delta)
    depths.append(depth)

summary = (max(depths), min(depths), sum(depths) / len(depths))
print("NC AD")
print("(Max Depth, Min Depth, Average Depth) =", summary)

100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 225/225 [00:01<00:00, 202.75it/s]

NC AD
(Max Depth, Min Depth, Average Depth) = (4, 4, 4.0)





In [25]:
# Run A_C_N (C="EAD", N="cover") once per tuple in `extended_combinations` and
# keep the first element of every solve() result.
feature_names = ['right-distance', 'right-weight', 'left-distance', 'left-weight']
depths = []

for comb in tqdm(extended_combinations):
    # creating delta: the tuple's values labelled by feature name
    # (first row of a one-row frame)
    delta = pd.DataFrame([list(comb)], columns=feature_names).iloc[0]

    alg = A_C_N(C="EAD", N="cover")
    depth, _ = alg.solve(S, delta=delta)
    depths.append(depth)

summary = (max(depths), min(depths), sum(depths) / len(depths))
print("NC EAD")
print("(Max Depth, Min Depth, Average Depth) =", summary)

100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 576/576 [00:02<00:00, 201.57it/s]

NC EAD
(Max Depth, Min Depth, Average Depth) = (4, 4, 4.0)





# Node Cover Greedy

In [26]:
# Run A_C_N (C="AR", N="greedy") once per tuple in `combinations` and keep the
# first element of every solve() result.
feature_names = ['right-distance', 'right-weight', 'left-distance', 'left-weight']
depths = []

for comb in tqdm(combinations):
    # creating delta: the tuple's values labelled by feature name
    # (first row of a one-row frame)
    delta = pd.DataFrame([list(comb)], columns=feature_names).iloc[0]

    alg = A_C_N(C="AR", N="greedy")
    depth, _ = alg.solve(S, delta=delta)
    depths.append(depth)

summary = (max(depths), min(depths), sum(depths) / len(depths))
print("NCgreedy AR")
print("(Max Depth, Min Depth, Average Depth) =", summary)

100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 225/225 [00:01<00:00, 147.89it/s]

NCgreedy AR
(Max Depth, Min Depth, Average Depth) = (4, 2, 2.92)





In [27]:
# Run A_C_N (C="EAR", N="greedy") once per tuple in `extended_combinations` and
# keep the first element of every solve() result.
feature_names = ['right-distance', 'right-weight', 'left-distance', 'left-weight']
depths = []

for comb in tqdm(extended_combinations):
    # creating delta: the tuple's values labelled by feature name
    # (first row of a one-row frame)
    delta = pd.DataFrame([list(comb)], columns=feature_names).iloc[0]

    alg = A_C_N(C="EAR", N="greedy")
    depth, _ = alg.solve(S, delta=delta)
    depths.append(depth)

summary = (max(depths), min(depths), sum(depths) / len(depths))
print("NCgreedy EAR")
print("(Max Depth, Min Depth, Average Depth) =", summary)

100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 576/576 [00:03<00:00, 162.63it/s]

NCgreedy EAR
(Max Depth, Min Depth, Average Depth) = (4, 2, 2.6597222222222223)





In [28]:
# Run A_C_N (C="SR", N="greedy") once per tuple in `combinations` and keep the
# first element of every solve() result.
feature_names = ['right-distance', 'right-weight', 'left-distance', 'left-weight']
depths = []

for comb in tqdm(combinations):
    # creating delta: the tuple's values labelled by feature name
    # (first row of a one-row frame)
    delta = pd.DataFrame([list(comb)], columns=feature_names).iloc[0]

    alg = A_C_N(C="SR", N="greedy")
    depth, _ = alg.solve(S, delta=delta)
    depths.append(depth)

summary = (max(depths), min(depths), sum(depths) / len(depths))
print("NCgreedy SR")
print("(Max Depth, Min Depth, Average Depth) =", summary)

100%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 225/225 [00:03<00:00, 73.08it/s]

NCgreedy SR
(Max Depth, Min Depth, Average Depth) = (4, 2, 2.92)





In [29]:
# Run A_C_N (C="ESR", N="greedy") once per tuple in `extended_combinations` and
# keep the first element of every solve() result.
feature_names = ['right-distance', 'right-weight', 'left-distance', 'left-weight']
depths = []

for comb in tqdm(extended_combinations):
    # creating delta: the tuple's values labelled by feature name
    # (first row of a one-row frame)
    delta = pd.DataFrame([list(comb)], columns=feature_names).iloc[0]

    alg = A_C_N(C="ESR", N="greedy")
    depth, _ = alg.solve(S, delta=delta)
    depths.append(depth)

summary = (max(depths), min(depths), sum(depths) / len(depths))
print("NCgreedy ESR")
print("(Max Depth, Min Depth, Average Depth) =", summary)

100%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 576/576 [00:07<00:00, 78.09it/s]

NCgreedy ESR
(Max Depth, Min Depth, Average Depth) = (4, 2, 2.6597222222222223)





In [30]:
# Run A_C_N (C="AD", N="greedy") once per tuple in `combinations` and keep the
# first element of every solve() result.
feature_names = ['right-distance', 'right-weight', 'left-distance', 'left-weight']
depths = []

for comb in tqdm(combinations):
    # creating delta: the tuple's values labelled by feature name
    # (first row of a one-row frame)
    delta = pd.DataFrame([list(comb)], columns=feature_names).iloc[0]

    alg = A_C_N(C="AD", N="greedy")
    depth, _ = alg.solve(S, delta=delta)
    depths.append(depth)

summary = (max(depths), min(depths), sum(depths) / len(depths))
print("NCgreedy AD")
print("(Max Depth, Min Depth, Average Depth) =", summary)

100%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 225/225 [00:02<00:00, 92.15it/s]

NCgreedy AD
(Max Depth, Min Depth, Average Depth) = (4, 2, 2.92)





In [31]:
# Run A_C_N (C="EAD", N="greedy") once per tuple in `extended_combinations` and
# keep the first element of every solve() result.
feature_names = ['right-distance', 'right-weight', 'left-distance', 'left-weight']
depths = []

for comb in tqdm(extended_combinations):
    # creating delta: the tuple's values labelled by feature name
    # (first row of a one-row frame)
    delta = pd.DataFrame([list(comb)], columns=feature_names).iloc[0]

    alg = A_C_N(C="EAD", N="greedy")
    depth, _ = alg.solve(S, delta=delta)
    depths.append(depth)

summary = (max(depths), min(depths), sum(depths) / len(depths))
print("NCgreedy EAD")
print("(Max Depth, Min Depth, Average Depth) =", summary)

100%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 576/576 [00:05<00:00, 99.44it/s]

NCgreedy EAD
(Max Depth, Min Depth, Average Depth) = (4, 2, 2.6597222222222223)





# Greedy

In [32]:
# Run A_C_G (C="AR") once per tuple in `combinations` and keep the first
# element of every solve() result.
feature_names = ['right-distance', 'right-weight', 'left-distance', 'left-weight']
depths = []

for comb in tqdm(combinations):
    # creating delta: the tuple's values labelled by feature name
    # (first row of a one-row frame)
    delta = pd.DataFrame([list(comb)], columns=feature_names).iloc[0]

    alg = A_C_G(C="AR")
    depth, _ = alg.solve(S, delta=delta)
    depths.append(depth)

summary = (max(depths), min(depths), sum(depths) / len(depths))
print("Greedy AR")
print("(Max Depth, Min Depth, Average Depth) =", summary)

100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 225/225 [00:00<00:00, 319.05it/s]

Greedy AR
(Max Depth, Min Depth, Average Depth) = (4, 2, 2.8755555555555556)





In [33]:
# Run A_C_G (C="EAR") once per tuple in `extended_combinations` and keep the
# first element of every solve() result.
feature_names = ['right-distance', 'right-weight', 'left-distance', 'left-weight']
depths = []

for comb in tqdm(extended_combinations):
    # creating delta: the tuple's values labelled by feature name
    # (first row of a one-row frame)
    delta = pd.DataFrame([list(comb)], columns=feature_names).iloc[0]

    alg = A_C_G(C="EAR")
    depth, _ = alg.solve(S, delta=delta)
    depths.append(depth)

summary = (max(depths), min(depths), sum(depths) / len(depths))
print("Greedy EAR")
print("(Max Depth, Min Depth, Average Depth) =", summary)

100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 576/576 [00:01<00:00, 353.90it/s]

Greedy EAR
(Max Depth, Min Depth, Average Depth) = (4, 2, 2.6284722222222223)





In [34]:
# Run A_C_G (C="SR") once per tuple in `combinations` and keep the first
# element of every solve() result.
feature_names = ['right-distance', 'right-weight', 'left-distance', 'left-weight']
depths = []

for comb in tqdm(combinations):
    # creating delta: the tuple's values labelled by feature name
    # (first row of a one-row frame)
    delta = pd.DataFrame([list(comb)], columns=feature_names).iloc[0]

    alg = A_C_G(C="SR")
    depth, _ = alg.solve(S, delta=delta)
    depths.append(depth)

summary = (max(depths), min(depths), sum(depths) / len(depths))
print("Greedy SR")
print("(Max Depth, Min Depth, Average Depth) =", summary)

100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 225/225 [00:02<00:00, 100.22it/s]

Greedy SR
(Max Depth, Min Depth, Average Depth) = (4, 2, 2.862222222222222)





In [35]:
# Run A_C_G (C="ESR") once per tuple in `extended_combinations` and keep the
# first element of every solve() result.
feature_names = ['right-distance', 'right-weight', 'left-distance', 'left-weight']
depths = []

for comb in tqdm(extended_combinations):
    # creating delta: the tuple's values labelled by feature name
    # (first row of a one-row frame)
    delta = pd.DataFrame([list(comb)], columns=feature_names).iloc[0]

    alg = A_C_G(C="ESR")
    depth, _ = alg.solve(S, delta=delta)
    depths.append(depth)

summary = (max(depths), min(depths), sum(depths) / len(depths))
print("Greedy ESR")
print("(Max Depth, Min Depth, Average Depth) =", summary)

100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 576/576 [00:05<00:00, 105.73it/s]

Greedy ESR
(Max Depth, Min Depth, Average Depth) = (4, 2, 2.6215277777777777)





In [36]:
# Run A_C_G (C="AD") once per tuple in `combinations` and keep the first
# element of every solve() result.
feature_names = ['right-distance', 'right-weight', 'left-distance', 'left-weight']
depths = []

for comb in tqdm(combinations):
    # creating delta: the tuple's values labelled by feature name
    # (first row of a one-row frame)
    delta = pd.DataFrame([list(comb)], columns=feature_names).iloc[0]

    alg = A_C_G(C="AD")
    depth, _ = alg.solve(S, delta=delta)
    depths.append(depth)

summary = (max(depths), min(depths), sum(depths) / len(depths))
print("Greedy AD")
print("(Max Depth, Min Depth, Average Depth) =", summary)

100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 225/225 [00:01<00:00, 139.74it/s]

Greedy AD
(Max Depth, Min Depth, Average Depth) = (4, 2, 2.862222222222222)





In [37]:
# Run A_C_G (C="EAD") once per tuple in `extended_combinations` and keep the
# first element of every solve() result.
feature_names = ['right-distance', 'right-weight', 'left-distance', 'left-weight']
depths = []

for comb in tqdm(extended_combinations):
    # creating delta: the tuple's values labelled by feature name
    # (first row of a one-row frame)
    delta = pd.DataFrame([list(comb)], columns=feature_names).iloc[0]

    alg = A_C_G(C="EAD")
    depth, _ = alg.solve(S, delta=delta)
    depths.append(depth)

summary = (max(depths), min(depths), sum(depths) / len(depths))
print("Greedy EAD")
print("(Max Depth, Min Depth, Average Depth) =", summary)

100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 576/576 [00:03<00:00, 149.36it/s]

Greedy EAD
(Max Depth, Min Depth, Average Depth) = (4, 2, 2.6215277777777777)



