In [1]:
import pandas as pd
import numpy as np

import os
import sys
# Append the parent directory to sys.path (once) — presumably so the local
# `facts` package imported below can be resolved; confirm the repo layout.
module_path = os.path.abspath(os.path.join('..'))
if module_path not in sys.path:
    sys.path.append(module_path)
import warnings
# NOTE(review): this silences every warning category for the whole session,
# including deprecation warnings raised by pandas or the model code.
warnings.filterwarnings('ignore')
import facts
from facts.clean import clean_dataset
from facts import valid_ifthens_with_coverage_correctness, rules2rulesbyif
from facts.models import customLogisticRegression
from facts.parameters import ParameterProxy
from facts.formatting import recourse_report_reverse, print_recourse_report, print_recourse_report_cumulative, print_recourse_report_KStest_cumulative
from facts.utils import load_rules_by_if
from facts.fairness_metrics_aggr import get_diff_table, get_comb_df, get_analysis_dfs

In [2]:
# Report-wide settings shared by the cells below.
top_count = 20    # forwarded as `top_count` to every rule-selection call
cost_budget = 10  # forwarded as `cost_threshold` to the "max-upto-cost" selection
c_inf = 5         # not referenced by any other visible cell of this notebook

# Dataset

In [3]:
DATAFILE = '../../ad_campaign_data.csv'  # location of dataset
random_state = None  # change to something for exactly reproducible results

# as selected in "tutorial_bias_advertising" notebook
selected_features = ['religion','politics','gender', 'parents', 'ages', 'income', 'area', 'college_educated', 'homeowner']
cate_features = ['religion','politics','gender', 'parents', 'ages', 'income', 'area', 'college_educated']
num_features = ['homeowner']

# if not specified, set to 1
# The keys must use the post-rename column name 'ages' (the raw 'age' column is
# renamed when the data is loaded below); the previous key "age" matched no
# column of the final frame.
feature_weights = {"gender": 1, "parents": 1, "ages": 1}

target_name = "true_conversion"
positive_label = 1
negative_label = 0

model_train_fraction = 0.7
learning_class_weights = {0: 0.5, 1: 265}

sensitive_attribute = "gender"
sensitive_alias = {"M": "Male", "F": "Female", "Unknown": "Unknown"}

# Load, relabel the sensitive attribute, rename 'age' -> 'ages' and keep only
# the selected features plus the target. Built as a single chained expression
# (no in-place mutation) so that re-running the cell always starts from the
# raw file and gives the same frame.
# Note: gender values missing from `sensitive_alias` become NaN via `.map`.
ad_conversion_dataset = (
    pd.read_csv(DATAFILE)
    .assign(gender=lambda frame: frame["gender"].map(sensitive_alias))
    .rename(columns={'age': 'ages'})
    .loc[:, selected_features + [target_name]]
)
ad_conversion_dataset.head()


Unnamed: 0,religion,politics,gender,parents,ages,income,area,college_educated,homeowner,true_conversion
0,Unknown,Unknown,Unknown,1,55-64,Unknown,Unknown,1,1,0
1,Other,Unknown,Unknown,1,55-64,Unknown,Urban,1,1,0
2,Unknown,Unknown,Female,1,55-64,Unknown,Unknown,1,1,0
3,Unknown,Unknown,Female,1,55-64,Unknown,Unknown,1,1,0
4,Unknown,Unknown,Female,1,55-64,Unknown,Urban,1,1,0


In [4]:
# Split the frame into the prediction target and the feature matrix, using the
# configured `target_name` instead of repeating the column name as a literal.
y = ad_conversion_dataset[target_name]
X = ad_conversion_dataset.drop(columns=[target_name])

# Derive the feature groups from the column dtypes through the public
# `select_dtypes` API (previously the private `_get_numeric_data` helper).
# NOTE(review): 'number' does not select bool columns; the frame shown above
# only holds integer and string columns, so the resulting lists are the same.
num_features = X.select_dtypes(include='number').columns.to_list()
cate_features = X.select_dtypes(include=['object','category']).columns.to_list()
ord_features = []

# Rules

In [6]:
# Load the two precomputed rule files (atomic first, cumulative second).
rules_with_atomic_correctness, rules_with_cumulative_correctness = map(
    load_rules_by_if,
    ("rulesAdCampaing_atomic.data", "rulesAdCampaing_cumulative.data"),
)

In [7]:
# Cost model for the reports. This overrides the feature groups derived from
# the dtypes earlier: every listed feature (including 'homeowner') is treated
# as categorical, and the sensitive attribute 'gender' is not listed at all.
cate_features = ['religion','politics', 'parents', 'ages', 'income', 'area', 'college_educated', 'homeowner']
num_features = []
ord_features = []

# Per-feature weights handed to the feature-change builder.
feature_weights = {'religion':5,'politics':2, 'parents':3, 'ages':10, 'income':3, 'area':2, 'college_educated':3, 'homeowner':1}

# Categorical features go in as `cate_cols`, numeric ones as `num_cols`.
features_with_proportional_cost = num_features
features_with_binary_cost = cate_features

comparators = facts.feature_change_builder(
    X,
    cate_cols=features_with_binary_cost,
    num_cols=features_with_proportional_cost,
    ord_cols=ord_features,
    num_normalization=False,
    feature_weights=feature_weights,
)
params = ParameterProxy(featureChanges=comparators)

# Macro Viewpoint

## Equal Cost of Effectiveness (Macro)

In [19]:
# Equal Cost of Effectiveness (Macro): select from the atomic-correctness
# rules with the "min-above-thr" metric at a 0.7 threshold, then print them.
# "remove-fair-rules" is not applied in this cell, so rules reported as
# "No bias!" also show up in the output.
top_rules, subgroup_costs = facts.select_rules_subset(
    rules_with_atomic_correctness,
    metric="min-above-thr",
    cor_threshold=0.7,
    top_count=top_count,
    sort_strategy="generic-sorting-ignore-exists-subgroup-empty",
    filter_sequence=["remove-contained", "remove-below-thr", "keep-only-min-change"],
    params=params,
)

print_recourse_report(
    top_rules,
    metric_name='Equal Cost of Effectiveness (Macro) (threshold = 0.7)',
    subgroup_costs=subgroup_costs,
    show_subgroup_costs=True,
)

If [1mhomeowner = 1[0m:
	Protected Subgroup '[1mMale[0m', [34m98.67%[39m covered
		Make [1m[31mhomeowner = 0[39m[0m with effectiveness [32m94.80%[39m.
		[1mAggregate cost[0m of the above recourses = [35m1.00[39m
	Protected Subgroup '[1mFemale[0m', [34m98.31%[39m covered
		Make [1m[31mhomeowner = 0[39m[0m with effectiveness [32m93.00%[39m.
		[1mAggregate cost[0m of the above recourses = [35m1.00[39m
	[35mNo bias![39m
If [1mhomeowner = 1, income = Unknown[0m:
	Protected Subgroup '[1mMale[0m', [34m95.78%[39m covered
		Make [1m[31mhomeowner = 0[39m[0m with effectiveness [32m95.46%[39m.
		[1mAggregate cost[0m of the above recourses = [35m1.00[39m
	Protected Subgroup '[1mFemale[0m', [34m95.46%[39m covered
		Make [1m[31mhomeowner = 0[39m[0m with effectiveness [32m93.93%[39m.
		[1mAggregate cost[0m of the above recourses = [35m1.00[39m
	[35mNo bias![39m
If [1mhomeowner = 1, parents = 1[0m:
	Protected Subgroup '[1mMale[0m', [3

## Equal Choice for Recourse (Macro)

In [20]:
# Equal Choice for Recourse (Macro): select from the atomic-correctness rules
# with the "num-above-thr" metric at a 0.7 threshold, then print the report.
top_rules, subgroup_costs = facts.select_rules_subset(
    rules_with_atomic_correctness,
    metric="num-above-thr",
    cor_threshold=0.7,
    top_count=top_count,
    sort_strategy="generic-sorting-ignore-forall-subgroups-empty",
    filter_sequence=["remove-contained", "remove-below-thr", "remove-fair-rules"],
    params=params,
)

print_recourse_report(
    top_rules,
    metric_name='Equal Choice for Recourse(Macro) (threshold = 0.7)',
    subgroup_costs=subgroup_costs,
    show_subgroup_costs=True,
)

If [1marea = Unknown, religion = Unknown[0m:
	Protected Subgroup '[1mMale[0m', [34m53.09%[39m covered
		Make [1m[31marea = Urban[39m, [31mreligion = Christianity[39m[0m with effectiveness [32m85.47%[39m.
		Make [1m[31marea = Urban[39m, [31mreligion = Other[39m[0m with effectiveness [32m85.47%[39m.
		Make [1m[31marea = Rural[39m, [31mreligion = Christianity[39m[0m with effectiveness [32m90.52%[39m.
		Make [1m[31marea = Rural[39m, [31mreligion = Other[39m[0m with effectiveness [32m90.52%[39m.
		[1mAggregate cost[0m of the above recourses = [35m-4.00[39m
	Protected Subgroup '[1mFemale[0m', [34m48.86%[39m covered
		[31mNo recourses for this subgroup![39m
		[1mAggregate cost[0m of the above recourses = [35m0.00[39m
	[35mBias against Female due to Equal Choice for Recourse(Macro) (threshold = 0.7). Unfairness score = 4.[39m
If [1marea = Unknown, homeowner = 1, religion = Unknown[0m:
	Protected Subgroup '[1mMale[0m', [34m51.81%[39m c

# Micro Viewpoint

## Equal Conditional Mean Recourse

In [22]:
# Equal Conditional Mean Recourse: select from the cumulative-correctness
# rules with the "fairness-of-mean-recourse-conditional" metric (no threshold
# argument is passed here), then print the cumulative report with costs.
top_rules, subgroup_costs = facts.select_rules_subset_cumulative(
    rules_with_cumulative_correctness,
    metric="fairness-of-mean-recourse-conditional",
    top_count=top_count,
    sort_strategy="generic-sorting-ignore-exists-subgroup-empty",
    filter_sequence=["remove-contained", "remove-fair-rules"],
    params=params,
)

print_recourse_report_cumulative(
    top_rules,
    metric_name='Equal Conditional Mean Recourse',
    subgroup_costs=subgroup_costs,
    show_subgroup_costs=True,
    show_then_costs=True,
)

If [1mages = 55-64, area = Unknown, college_educated = 1, income = Unknown, parents = 0, politics = Unknown, religion = Unknown[0m:
	Protected Subgroup '[1mMale[0m', [34m2.77%[39m covered
		Make [1m[31mparents = 1[39m[0m with effectiveness [32m14.23%[39m and counterfactual cost = 3.0.
		Make [1m[31mincome = <100K[39m, [31mparents = 1[39m[0m with effectiveness [32m14.23%[39m and counterfactual cost = 6.0.
		Make [1m[31mcollege_educated = 0[39m, [31mparents = 1[39m[0m with effectiveness [32m14.23%[39m and counterfactual cost = 6.0.
		Make [1m[31mparents = 1[39m, [31mreligion = Christianity[39m[0m with effectiveness [32m14.23%[39m and counterfactual cost = 8.0.
		Make [1m[31mparents = 1[39m, [31mreligion = Other[39m[0m with effectiveness [32m14.23%[39m and counterfactual cost = 8.0.
		Make [1m[31marea = Urban[39m, [31mparents = 1[39m, [31mreligion = Christianity[39m[0m with effectiveness [32m100.00%[39m and counterfactual cost = 10.0.


## Equal Cost of Effectiveness (Micro)

In [23]:
# Equal Cost of Effectiveness (Micro): select from the cumulative-correctness
# rules with the "min-above-corr" metric at a 0.7 threshold.
# NOTE(review): with these settings the saved output reports that no unfair
# recourses were found, while the ranking table computed later in this notebook
# lists biased subgroups for this metric at 0.7 — confirm that applying
# "remove-fair-rules" before "keep-cheap-rules-above-thr-cor" is intended.
top_rules, subgroup_costs = facts.select_rules_subset_cumulative(
    rules_with_cumulative_correctness,
    metric="min-above-corr",
    cor_threshold=0.7,
    top_count=top_count,
    sort_strategy="generic-sorting-ignore-exists-subgroup-empty",
    filter_sequence=[
        "remove-contained",
        "remove-fair-rules",
        "keep-cheap-rules-above-thr-cor",
    ],
    params=params,
)

print_recourse_report_cumulative(
    top_rules,
    metric_name='Equal Cost of Effectiveness (Micro) (threshold = 0.7)',
    subgroup_costs=subgroup_costs,
    show_subgroup_costs=True,
    show_then_costs=True,
)

[1mWith the given parameters, no recourses showing unfairness have been found![0m


## Equal Effectiveness

In [24]:
# Equal Effectiveness: select from the cumulative-correctness rules with the
# "total-correctness" metric, then print the cumulative report with
# `correctness_metric=True`.
top_rules, subgroup_costs = facts.select_rules_subset_cumulative(
    rules_with_cumulative_correctness,
    metric="total-correctness",
    top_count=top_count,
    sort_strategy="generic-sorting-ignore-forall-subgroups-empty",
    filter_sequence=["remove-contained", "remove-fair-rules"],
    params=params,
)

print_recourse_report_cumulative(
    top_rules,
    metric_name='Equal Effectiveness',
    correctness_metric=True,
    subgroup_costs=subgroup_costs,
    show_subgroup_costs=True,
    show_then_costs=True,
)

If [1mages = 55-64, area = Unknown, income = Unknown, parents = 1, politics = Unknown, religion = Unknown[0m:
	Protected Subgroup '[1mMale[0m', [34m43.91%[39m covered
		Make [1m[31mincome = <100K[39m[0m with effectiveness [32m0.00%[39m and counterfactual cost = 3.0.
		Make [1m[31mreligion = Christianity[39m[0m with effectiveness [32m0.00%[39m and counterfactual cost = 5.0.
		Make [1m[31mreligion = Other[39m[0m with effectiveness [32m0.00%[39m and counterfactual cost = 5.0.
		Make [1m[31marea = Urban[39m, [31mreligion = Christianity[39m[0m with effectiveness [32m94.30%[39m and counterfactual cost = 7.0.
		Make [1m[31marea = Urban[39m, [31mreligion = Other[39m[0m with effectiveness [32m94.30%[39m and counterfactual cost = 7.0.
		Make [1m[31marea = Rural[39m, [31mreligion = Other[39m[0m with effectiveness [32m100.00%[39m and counterfactual cost = 7.0.
		Make [1m[31marea = Rural[39m, [31mreligion = Christianity[39m[0m with effectiveness

## Fair Effectiveness-Cost Trade-Off

In [28]:
# taken from the other notebooks
affected_pop_sizes = {"Male": 94138, "Female": 180304}

top_rules,unfairness = facts.select_rules_subset_KStest(
    rules_with_cumulative_correctness,
    affected_pop_sizes,
    top_count=top_count
)

print_recourse_report_KStest_cumulative(
    top_rules,
    population_sizes=affected_pop_sizes,
    unfairness = unfairness,
    show_then_costs=True,
    metric_name = 'Fair Effectiveness-Cost Trade-Off'
    # show_cumulative_plots=True
)

If [1mages = 55-64, area = Unknown, income = Unknown, parents = 1, politics = Unknown, religion = Unknown[0m:
	Protected Subgroup '[1mMale[0m', [34m43.91%[39m covered out of 94138
		Make [1m[31mincome = <100K[39m[0m with effectiveness [32m0.00%[39m and counterfactual cost = 3.0.
		Make [1m[31mreligion = Christianity[39m[0m with effectiveness [32m0.00%[39m and counterfactual cost = 5.0.
		Make [1m[31mreligion = Other[39m[0m with effectiveness [32m0.00%[39m and counterfactual cost = 5.0.
		Make [1m[31marea = Urban[39m, [31mreligion = Christianity[39m[0m with effectiveness [32m94.30%[39m and counterfactual cost = 7.0.
		Make [1m[31marea = Urban[39m, [31mreligion = Other[39m[0m with effectiveness [32m94.30%[39m and counterfactual cost = 7.0.
		Make [1m[31marea = Rural[39m, [31mreligion = Other[39m[0m with effectiveness [32m100.00%[39m and counterfactual cost = 7.0.
		Make [1m[31marea = Rural[39m, [31mreligion = Christianity[39m[0m with 

## Equal Effectiveness within Budget (Micro)

In [29]:
# Equal Effectiveness within Budget (Micro): select from the
# cumulative-correctness rules with the "max-upto-cost" metric, using the
# notebook-wide `cost_budget` as the cost threshold.
top_rules, subgroup_costs = facts.select_rules_subset_cumulative(
    rules_with_cumulative_correctness,
    metric="max-upto-cost",
    cost_threshold=cost_budget,
    top_count=top_count,
    sort_strategy="generic-sorting-ignore-exists-subgroup-empty",
    filter_sequence=[
        "remove-contained",
        "remove-fair-rules",
        "remove-above-thr-cost",
    ],
    params=params,
)

print_recourse_report_cumulative(
    top_rules,
    metric_name='Equal Effectiveness within Budget (Micro)',
    correctness_metric=True,
    subgroup_costs=subgroup_costs,
    show_subgroup_costs=True,
    show_then_costs=True,
)

If [1mages = 55-64, area = Unknown, income = Unknown, parents = 1, politics = Unknown, religion = Unknown[0m:
	Protected Subgroup '[1mMale[0m', [34m43.91%[39m covered
		Make [1m[31mincome = <100K[39m[0m with effectiveness [32m0.00%[39m and counterfactual cost = 3.0.
		Make [1m[31mreligion = Christianity[39m[0m with effectiveness [32m0.00%[39m and counterfactual cost = 5.0.
		Make [1m[31mreligion = Other[39m[0m with effectiveness [32m0.00%[39m and counterfactual cost = 5.0.
		Make [1m[31marea = Urban[39m, [31mreligion = Christianity[39m[0m with effectiveness [32m94.30%[39m and counterfactual cost = 7.0.
		Make [1m[31marea = Urban[39m, [31mreligion = Other[39m[0m with effectiveness [32m94.30%[39m and counterfactual cost = 7.0.
		Make [1m[31marea = Rural[39m, [31mreligion = Other[39m[0m with effectiveness [32m100.00%[39m and counterfactual cost = 7.0.
		Make [1m[31marea = Rural[39m, [31mreligion = Christianity[39m[0m with effectiveness

## Get ranking of subgroups based on metrics

In [30]:
from facts.fairness_metrics_aggr import make_table, auto_budget_calculation

In [31]:
# Merge the two rule dictionaries: for every if-clause and subgroup keep the
# coverage stored with the cumulative rules and pair each "then" with both its
# atomic and its cumulative correctness.
rules_with_both = {}
for if_clause, cumulative_by_sg in rules_with_cumulative_correctness.items():
    merged_by_sg = {}
    for subgroup, (coverage, cumulative_thens) in cumulative_by_sg.items():
        # Element 1 of the atomic entry holds its (then, correctness) pairs.
        atomic_lookup = dict(rules_with_atomic_correctness[if_clause][subgroup][1])
        merged_thens = []
        for then, cumulative_cor, _unused_cost in cumulative_thens:
            merged_thens.append((then, atomic_lookup[then], cumulative_cor))
        merged_by_sg[subgroup] = (coverage, merged_thens)
    rules_with_both[if_clause] = merged_by_sg

In [32]:
# Cost budgets are derived from the cumulative rules rather than hard-coded.
budgets = auto_budget_calculation(
    rules_with_cumulative_correctness,
    cor_thres=0.5,
    percentiles=[0.3, 0.6, 0.9],
)

# Build the per-subgroup metrics table, then drop the 'weighted-average' and
# 'mean-cost-cinf' columns.
df = make_table(
    rules_with_both,
    sensitive_attribute_vals=["Male", "Female"],
    effectiveness_thresholds=[0.3, 0.7],
    cost_budgets=budgets,
    params=params,
)
df = df.drop(columns=['weighted-average', 'mean-cost-cinf'])

In [33]:
#table of differences between Male and Female for each metric
diff = get_diff_table(df, sensitive_attribute_vals=["Male", "Female"], with_abs = True)
diff = diff.set_index('subgroup')
ranked = diff.drop(columns=[('Fair Effectiveness-Cost Trade-Off','bias')]).mask(diff == 0).rank(ascending = False,axis=0,method='dense')
ranked = ranked.replace(np.nan,"Fair")

In [34]:
# Metrics handed to get_comb_df as `rev_bias_metrics`.
rev_bias_metrics = ['Equal Effectiveness', 'Equal Effectiveness within Budget']

# Combine the metric table, the ranks and the differences into one frame.
comb_df = get_comb_df(
    df,
    ranked,
    diff,
    rev_bias_metrics,
    sensitive_attribute_vals=["Male", "Female"],
)

# Summary frames built from the combined frame and the ranks.
analysis_df, rank_analysis_df = get_analysis_dfs(
    comb_df,
    ranked,
    sensitive_attribute_vals=["Male", "Female"],
)

In [35]:
# Preview the first rows of the combined frame built in the previous cell.
comb_df.head()

Unnamed: 0_level_0,"(Equal Cost of Effectiveness(Macro), 0.3)","(Equal Cost of Effectiveness(Macro), 0.3)","(Equal Cost of Effectiveness(Macro), 0.3)","(Equal Cost of Effectiveness(Macro), 0.7)","(Equal Cost of Effectiveness(Macro), 0.7)","(Equal Cost of Effectiveness(Macro), 0.7)","(Equal Choice for Recourse, 0.3)","(Equal Choice for Recourse, 0.3)","(Equal Choice for Recourse, 0.3)","(Equal Choice for Recourse, 0.7)",...,"(Equal Cost of Effectiveness(Micro), 0.3)","(Equal Cost of Effectiveness(Micro), 0.7)","(Equal Cost of Effectiveness(Micro), 0.7)","(Equal Cost of Effectiveness(Micro), 0.7)",Equal(Conditional Mean Recourse),Equal(Conditional Mean Recourse),Equal(Conditional Mean Recourse),Fair Effectiveness-Cost Trade-Off,Fair Effectiveness-Cost Trade-Off,Fair Effectiveness-Cost Trade-Off
Unnamed: 0_level_1,rank,score,bias against,rank,score,bias against,rank,score,bias against,rank,...,bias against,rank,score,bias against,rank,score,bias against,rank,score,bias against
subgroup,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2,Unnamed: 9_level_2,Unnamed: 10_level_2,Unnamed: 11_level_2,Unnamed: 12_level_2,Unnamed: 13_level_2,Unnamed: 14_level_2,Unnamed: 15_level_2,Unnamed: 16_level_2,Unnamed: 17_level_2,Unnamed: 18_level_2,Unnamed: 19_level_2,Unnamed: 20_level_2,Unnamed: 21_level_2
homeowner = 1,Fair,0.0,Fair,Fair,0.0,Fair,Fair,0.0,Fair,Fair,...,Fair,Fair,0.0,Fair,Fair,0.0,Fair,908.0,0.01808,Female
"homeowner = 1, politics = Unknown",Fair,0.0,Fair,Fair,0.0,Fair,Fair,0.0,Fair,Fair,...,Fair,Fair,0.0,Fair,Fair,0.0,Fair,929.0,0.016813,Female
income = Unknown,Fair,0.0,Fair,Fair,0.0,Fair,Fair,0.0,Fair,Fair,...,Fair,Fair,0.0,Fair,642.0,4.440892e-16,Male,541.0,0.100406,Female
"income = Unknown, politics = Unknown",Fair,0.0,Fair,Fair,0.0,Fair,Fair,0.0,Fair,Fair,...,Fair,Fair,0.0,Fair,Fair,0.0,Fair,540.0,0.100887,Female
"homeowner = 1, income = Unknown",Fair,0.0,Fair,Fair,0.0,Fair,Fair,0.0,Fair,Fair,...,Fair,Fair,0.0,Fair,619.0,0.003322132,Female,945.0,0.015355,Female


In [36]:
# Display the first summary frame returned by get_analysis_dfs.
analysis_df

Unnamed: 0,Rank = 1 Count,Male bias against Count,Female bias against Count
"(Equal Cost of Effectiveness(Macro), 0.3)",427,16,429
"(Equal Cost of Effectiveness(Micro), 0.3)",427,16,429
Equal(Conditional Mean Recourse),108,278,554
"(Equal Cost of Effectiveness(Macro), 0.7)",264,0,264
"(Equal Choice for Recourse, 0.7)",384,0,392
"(Equal Cost of Effectiveness(Micro), 0.7)",264,0,264
Equal Effectiveness,15,167,1072
Fair Effectiveness-Cost Trade-Off,15,244,1188
"(Equal Effectiveness within Budget, 5.0)",10,151,989
"(Equal Effectiveness within Budget, 1.0)",1,20,402


In [37]:
# Display the second summary frame returned by get_analysis_dfs.
rank_analysis_df

Unnamed: 0,"(Equal Effectiveness within Budget, 5.0)",Fair Effectiveness-Cost Trade-Off,"(Equal Cost of Effectiveness(Macro), 0.7)","(Equal Cost of Effectiveness(Micro), 0.3)","(Equal Choice for Recourse, 0.7)","(Equal Cost of Effectiveness(Macro), 0.3)","(Equal Choice for Recourse, 0.3)",Equal Effectiveness,Equal(Conditional Mean Recourse),"(Equal Effectiveness within Budget, 1.0)","(Equal Cost of Effectiveness(Micro), 0.7)"
"(Equal Effectiveness within Budget, 5.0)",1.0,1.0,1.0,1.0,1.0,1.0,2.0,1.0,1.0,423.0,1.0
Fair Effectiveness-Cost Trade-Off,222.5,1.0,1.0,1.0,1.0,1.0,2.0,1.0,1.0,423.0,1.0
"(Equal Cost of Effectiveness(Macro), 0.7)",228.0,96.3,1.0,1.0,1.0,1.0,2.1,97.4,325.4,423.0,1.0
"(Equal Cost of Effectiveness(Micro), 0.3)",299.4,187.9,1.4,1.0,1.8,1.0,2.9,197.7,313.4,423.0,1.4
"(Equal Choice for Recourse, 0.7)",417.6,333.5,1.3,2.0,1.0,2.0,2.0,351.3,364.0,359.8,1.3
"(Equal Cost of Effectiveness(Macro), 0.3)",299.4,187.9,1.4,1.0,1.8,1.0,2.9,197.7,313.4,423.0,1.4
"(Equal Choice for Recourse, 0.3)",1085.0,413.0,2.0,1.0,3.0,1.0,1.0,866.0,23.5,423.0,2.0
Equal Effectiveness,222.5,1.0,1.0,1.0,1.0,1.0,2.0,1.0,1.0,423.0,1.0
Equal(Conditional Mean Recourse),442.2,326.2,1.5,2.1,2.1,2.1,3.9,296.5,1.0,423.0,1.5
"(Equal Effectiveness within Budget, 1.0)",728.0,482.0,2.0,4.0,3.0,4.0,6.0,847.0,196.0,1.0,2.0


In [22]:
# ranked_indexed = top_rank.set_index([top_rank.index, "subgroup"])
# ranked_fair = ranked_indexed == 'Fair'
# ranked_more_than_2000 = ranked_indexed.mask(ranked_indexed=='Fair') >= 1000
# new_rank = ranked_indexed[ranked_fair.apply(lambda row: row.sum() >=4 , axis=1) | ranked_more_than_2000.apply(lambda row : row.sum() >= 6,axis=1)]
# new_rank.head()

In [23]:
# sgs = [
#     ranked.iloc[9841].subgroup,
# ]

# rules_sgs_atomic = {ifc: rules_with_atomic_correctness[ifc] for ifc in sgs}
# rules_sgs_cumulative = {ifc: rules_with_cumulative_correctness[ifc] for ifc in sgs}

In [24]:
# df.iloc[4228].to_frame().T

In [25]:
# top_rules, subgroup_costs = facts.select_rules_subset(
#     rules_sgs_atomic,
#     metric="min-above-thr",
#     sort_strategy="generic-sorting-ignore-exists-subgroup-empty",
#     cor_threshold=0.7,
#     filter_sequence = [
#         # "remove-contained",
#         "remove-below-thr",        
#         #"remove-fair-rules", 
#         "keep-only-min-change"
#     ],
#     params=params
# )

# print_recourse_report(
#     top_rules,
#     subgroup_costs=subgroup_costs,
#     show_subgroup_costs=True
# )

In [26]:
# top_rules, subgroup_costs = facts.select_rules_subset_cumulative(
#     rules_sgs_cumulative,
#     metric="max-upto-cost",
#     sort_strategy="generic-sorting-ignore-exists-subgroup-empty",
#     top_count=top_count,
#     cost_threshold = 10,
#     filter_sequence = [
#         # "remove-contained",
#         # "remove-fair-rules",
#         "keep-cheap-rules-above-thr-cor",
#         # "keep-only-min-change",
        
#     ],
#     params=params
# )

# print_recourse_report_cumulative(
#     top_rules,
#     subgroup_costs=subgroup_costs,
#     show_subgroup_costs=True,
#     show_then_costs=True,
#     correctness_metric=True
# )

# Turn reports to latex

In [38]:
# Keep subgroups whose ranks disagree strongly between metrics.
# NOTE(review): the saved output of this cell lists subgroups over features
# that are not among this notebook's selected features, and the 5000 cut-off is
# larger than any rank shown in the tables above — the thresholds and the
# output look carried over from another dataset; confirm before relying on it.
ranks_only = ranked.mask(lambda x: x == "Fair")  # "Fair" entries become NaN
has_top5_rank = (ranks_only <= 5).any(axis=1)
has_rank_beyond_5000 = (ranks_only > 5000).any(axis=1)
r = ranked[has_top5_rank & has_rank_beyond_5000]

# Only subgroups described by at least three features.
r = r[r.index.map(lambda p: len(p.features) >= 3)]

# At least five metrics ranking the subgroup beyond 5000 ...
beyond_5000_count = (r.mask(lambda x: x == "Fair") > 5000).sum(axis=1)
r = r[beyond_5000_count >= 5]

# ... and at least four metrics ranking it below 100.
below_100_count = (r.mask(lambda x: x == "Fair") < 100).sum(axis=1)
r = r[below_100_count >= 4]
r

Unnamed: 0_level_0,"(Equal Cost of Effectiveness(Macro), 0.3)","(Equal Cost of Effectiveness(Macro), 0.7)","(Equal Choice for Recourse, 0.3)","(Equal Choice for Recourse, 0.7)",Equal Effectiveness,"(Equal Effectiveness within Budget, 5.076880768807688)","(Equal Effectiveness within Budget, 10.0)","(Equal Effectiveness within Budget, 18.0)","(Equal Cost of Effectiveness(Micro), 0.3)","(Equal Cost of Effectiveness(Micro), 0.7)",Equal(Conditional Mean Recourse),"(Fair Effectiveness-Cost Trade-Off, value)"
subgroup,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
"capital-loss = 0, marital-status = Divorced, native-country = United-States, relationship = Not-in-family",19.0,28.0,13.0,5.0,5789.0,Fair,5352.0,5226.0,22.0,1.0,6982.0,7860.0
"capital-gain = 0, capital-loss = 0, native-country = United-States, occupation = Exec-managerial",Fair,21.0,13.0,5.0,8434.0,5036.0,7138.0,7696.0,Fair,15.0,6725.0,2535.0
"capital-gain = 0, capital-loss = 0, hours-per-week = BrainDrain, relationship = Not-in-family",Fair,30.0,12.0,5.0,8000.0,5960.0,6731.0,7281.0,Fair,10.0,7105.0,4759.0
"Workclass = Private, marital-status = Never-married, occupation = Exec-managerial, relationship = Not-in-family",Fair,1.0,10.0,3.0,6038.0,Fair,5588.0,5463.0,Fair,1.0,7336.0,8127.0
"Workclass = Private, capital-loss = 0, marital-status = Never-married, occupation = Exec-managerial, relationship = Not-in-family",Fair,1.0,12.0,4.0,6340.0,Fair,6280.0,5737.0,Fair,1.0,6339.0,8508.0
