# Frequent Itemset Mining within Clusters

In [1]:
import pandas as pd

In [2]:
# Load the clustered dataset. Later cells expect this table to carry one label
# column per clustering algorithm (DBSCAN, Agglomerative, Spectral, OPTICS,
# K_means) next to the categorical attributes that get one-hot encoded.
df = pd.read_csv("Clusters.csv")
#df.head(3)

## Pre-processing

In [3]:
"""
Pre-processing:
1. Drop the Age column and trim whitespace from the Agecat values.
2. Rename columns to short codes for later convenience.
3. One-hot encode all categorical columns.
"""
from sklearn.preprocessing import LabelEncoder

df = (
    df.drop(columns=["Age"])  # Age column is not needed
      .assign(Agecat=lambda frame: frame["Agecat"].str.strip())
      .rename(columns={
          "Agecat": "A",
          "Gender": "G",
          "Race": "R",
          "Clinical Trial Participant": "CTP",
          "Tobacco Use": "TU",
          "Cancer Description": "CD",
          "Stage": "S",
      })
      # One-hot encoding; the cluster-label columns are left untouched
      .pipe(pd.get_dummies, columns=["TU", "CD", "RUCA", "S", "A", "G", "R", "CTP"])
)

df.head()

Unnamed: 0,DBSCAN,Agglomerative,Spectral,OPTICS,K_means,TU_Current Smoker,TU_Former Smoker,TU_Non Smoker,TU_Unknown,CD_Breast cancer,...,A_18 to 65,A_66 to 75,A_75 to 85,A_>85,G_Female,G_Male,R_Nonwhite,R_White,CTP_No,CTP_Yes
0,0,8,4,0,6,0,0,1,0,0,...,0,0,1,0,0,1,0,1,1,0
1,0,8,4,0,6,0,0,1,0,0,...,0,0,0,1,0,1,0,1,1,0
2,1,7,7,4,7,0,1,0,0,0,...,0,0,1,0,1,0,0,1,1,0
3,2,9,6,5,0,0,1,0,0,1,...,0,0,1,0,1,0,0,1,1,0
4,3,5,3,2,4,0,1,0,0,0,...,0,0,0,1,0,1,0,1,1,0


In [4]:
def FreqMine(cluster_list, cluster_alg, data=None):
    """
    Mine frequent itemsets and association rules separately for each cluster.

    For every label in `cluster_list`, the rows of `data` carrying that label
    are passed to mlxtend's apriori (60% minimum support). Association rules
    with lift >= 1 are then derived, sorted by confidence and lift, and a
    summary is printed/displayed.
    Reference: http://rasbt.github.io/mlxtend/user_guide/frequent_patterns/apriori/

    Parameters
    ----------
    cluster_list : iterable
        Cluster labels to process (values of `data[cluster_alg]`).
    cluster_alg : str
        Name of the column that holds the cluster labels.
    data : pandas.DataFrame, optional
        One-hot encoded table containing `cluster_alg` plus the item columns.
        When omitted, the notebook-level `dbdf` is used so that existing
        two-argument calls keep working.

    Returns
    -------
    None
        Results are only printed / displayed.
    """
    from mlxtend.frequent_patterns import apriori, association_rules

    if data is None:
        # Backward compatibility: earlier callers prepared a global `dbdf`.
        data = dbdf

    # Iterate the labels that were actually passed in, not a global.
    for i in cluster_list:
        temp_basket = data[data[cluster_alg] == i].drop(columns=[cluster_alg])
        frq_items = apriori(temp_basket, min_support=0.6, use_colnames=True)  # 60% support threshold

        if frq_items.empty:
            # association_rules rejects an empty itemset frame; report and
            # move on instead of aborting the remaining clusters.
            print("\nINTERESTING PATTERNS IN CLUSTER#", i, ":")
            print("No frequent itemsets at the 60% support threshold.")
            continue

        rules = association_rules(frq_items, metric="lift", min_threshold=1)
        rules = rules.sort_values(['confidence', 'lift'], ascending=[False, False])
        print("\nINTERESTING PATTERNS IN CLUSTER#", i, ":")

        # Show only the rules with lift strictly greater than 1
        display(rules[rules["lift"] > 1].head())

        # Print how many mined rules each antecedent itemset appears in
        print(rules["antecedents"].value_counts())

### (1) DBSCAN Clusters

In [5]:
# Keep only the DBSCAN labels alongside the one-hot item columns.
# FreqMine looks up `dbdf` in the notebook namespace, so the name is kept.
dbdf = df.drop(columns=["Agglomerative", "Spectral", "OPTICS", "K_means"])

# Cluster sizes, largest first; the index gives the labels in that order.
dbscan_sizes = dbdf["DBSCAN"].value_counts()
print(dbscan_sizes)

clusters = dbscan_sizes.index
FreqMine(clusters, "DBSCAN")

 8     548
 2     470
 3     370
 4     359
-1     357
 1     268
 0     233
 7     197
 11    110
 5     105
 9      90
 10     61
 6      56
Name: DBSCAN, dtype: int64

INTERESTING PATTERNS IN CLUSTER# 8 :


Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(CD_Breast cancer)                                      15
(R_White)                                               15
(CTP_No)                                                15
(TU_Non Smoker)                                         15
(G_Female)                                              15
(R_White, G_Female)                                      7
(CD_Breast cancer, G_Female)                             7
(TU_Non Smoker, R_White)                                 7
(R_White, CD_Breast cancer)                              7
(CTP_No, CD_Breast cancer)                               7
(CTP_No, G_Female)                                       7
(R_White, CTP_No)                                        7
(TU_Non Smoker, G_Female)                                7
(TU_Non Smoker, CD_Breast cancer)                        7
(TU_Non Smoker, CTP_No)                                  7
(R_White, CTP_No, G_Female)                              3
(R_White, CTP_No, CD_Breast cancer)                     

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(CD_Breast cancer)                                         15
(TU_Former Smoker)                                         15
(G_Female)                                                 15
(CTP_No)                                                   15
(R_White)                                                  15
(TU_Former Smoker, R_White)                                 7
(R_White, G_Female)                                         7
(CD_Breast cancer, G_Female)                                7
(TU_Former Smoker, G_Female)                                7
(R_White, CD_Breast cancer)                                 7
(CTP_No, CD_Breast cancer)                                  7
(CTP_No, G_Female)                                          7
(TU_Former Smoker, CD_Breast cancer)                        7
(R_White, CTP_No)                                           7
(TU_Former Smoker, CTP_No)                                  7
(TU_Former Smoker, R_White, CD_Breast cancer)               3
(CD_Brea

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(G_Male)                                                      15
(CD_Respiratory cancer)                                       15
(TU_Former Smoker)                                            15
(R_White)                                                     15
(CTP_No)                                                      15
(TU_Former Smoker, R_White)                                    7
(TU_Former Smoker, CD_Respiratory cancer)                      7
(CD_Respiratory cancer, G_Male)                                7
(CD_Respiratory cancer, R_White)                               7
(R_White, G_Male)                                              7
(G_Male, CTP_No)                                               7
(R_White, CTP_No)                                              7
(TU_Former Smoker, CTP_No)                                     7
(CD_Respiratory cancer, CTP_No)                                7
(TU_Former Smoker, G_Male)                                     7
(TU_Former Smoker, CD_Res

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(CD_GU cancer)                                       15
(R_White)                                            15
(CTP_No)                                             15
(TU_Former Smoker)                                   15
(G_Male)                                             15
(CD_GU cancer, CTP_No)                                7
(TU_Former Smoker, CTP_No)                            7
(TU_Former Smoker, R_White)                           7
(TU_Former Smoker, CD_GU cancer)                      7
(R_White, G_Male)                                     7
(G_Male, CTP_No)                                      7
(R_White, CD_GU cancer)                               7
(TU_Former Smoker, G_Male)                            7
(G_Male, CD_GU cancer)                                7
(R_White, CTP_No)                                     7
(R_White, G_Male, CD_GU cancer)                       3
(R_White, G_Male, CTP_No)                             3
(TU_Former Smoker, R_White, CD_GU cancer)       

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction
0,(CTP_Yes),(R_White),0.633053,0.77591,0.610644,0.964602,1.243187,0.119452,6.330532
1,(R_White),(CTP_Yes),0.77591,0.633053,0.610644,0.787004,1.243187,0.119452,1.722784


(CTP_Yes)    1
(R_White)    1
Name: antecedents, dtype: int64

INTERESTING PATTERNS IN CLUSTER# 1 :


Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(R_White)                                                       15
(G_Female)                                                      15
(TU_Former Smoker)                                              15
(CTP_No)                                                        15
(CD_Respiratory cancer)                                         15
(CD_Respiratory cancer, G_Female)                                7
(R_White, G_Female)                                              7
(CD_Respiratory cancer, CTP_No)                                  7
(CTP_No, G_Female)                                               7
(TU_Former Smoker, G_Female)                                     7
(TU_Former Smoker, CTP_No)                                       7
(R_White, CTP_No)                                                7
(TU_Former Smoker, R_White)                                      7
(CD_Respiratory cancer, R_White)                                 7
(TU_Former Smoker, CD_Respiratory cancer)                     

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(CD_GU cancer)                                    15
(R_White)                                         15
(CTP_No)                                          15
(TU_Non Smoker)                                   15
(G_Male)                                          15
(R_White, G_Male)                                  7
(G_Male, CD_GU cancer)                             7
(TU_Non Smoker, R_White)                           7
(R_White, CTP_No)                                  7
(TU_Non Smoker, CTP_No)                            7
(G_Male, CTP_No)                                   7
(TU_Non Smoker, G_Male)                            7
(R_White, CD_GU cancer)                            7
(TU_Non Smoker, CD_GU cancer)                      7
(CD_GU cancer, CTP_No)                             7
(TU_Non Smoker, G_Male, CD_GU cancer)              3
(G_Male, CD_GU cancer, CTP_No)                     3
(R_White, G_Male, CTP_No)                          3
(TU_Non Smoker, G_Male, CTP_No)               

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(G_Male)                                             15
(CTP_No)                                             15
(TU_Former Smoker)                                   15
(CD_GI cancer)                                       15
(R_White)                                            15
(TU_Former Smoker, CTP_No)                            7
(CD_GI cancer, R_White)                               7
(TU_Former Smoker, R_White)                           7
(CD_GI cancer, CTP_No)                                7
(TU_Former Smoker, CD_GI cancer)                      7
(CD_GI cancer, G_Male)                                7
(TU_Former Smoker, G_Male)                            7
(G_Male, CTP_No)                                      7
(R_White, G_Male)                                     7
(R_White, CTP_No)                                     7
(TU_Former Smoker, CD_GI cancer, CTP_No)              3
(TU_Former Smoker, CD_GI cancer, G_Male)              3
(R_White, G_Male, CTP_No)                       

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(G_Female)                                             15
(TU_Former Smoker)                                     15
(CTP_No)                                               15
(R_White)                                              15
(CD_GI cancer)                                         15
(CD_GI cancer, R_White)                                 7
(R_White, G_Female)                                     7
(TU_Former Smoker, G_Female)                            7
(CTP_No, G_Female)                                      7
(TU_Former Smoker, CTP_No)                              7
(TU_Former Smoker, CD_GI cancer)                        7
(TU_Former Smoker, R_White)                             7
(R_White, CTP_No)                                       7
(CD_GI cancer, CTP_No)                                  7
(CD_GI cancer, G_Female)                                7
(TU_Former Smoker, CD_GI cancer, R_White)               3
(TU_Former Smoker, R_White, CTP_No)                     3
(CD_GI cancer,

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(R_White)                                                     31
(TU_Non Smoker)                                               31
(G_Male)                                                      31
(CTP_No)                                                      31
(A_18 to 65)                                                  31
                                                              ..
(TU_Non Smoker, A_18 to 65, R_White, CTP_No, CD_GI cancer)     1
(A_18 to 65, R_White, CTP_No, CD_GI cancer, G_Male)            1
(TU_Non Smoker, A_18 to 65, CTP_No, CD_GI cancer, G_Male)      1
(TU_Non Smoker, A_18 to 65, R_White, CD_GI cancer, G_Male)     1
(TU_Non Smoker, R_White, CTP_No, CD_GI cancer, G_Male)         1
Name: antecedents, Length: 62, dtype: int64

INTERESTING PATTERNS IN CLUSTER# 9 :


Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(CTP_No)                                            15
(G_Female)                                          15
(TU_Non Smoker)                                     15
(R_White)                                           15
(CD_GI cancer)                                      15
(CTP_No, G_Female)                                   7
(TU_Non Smoker, CTP_No)                              7
(TU_Non Smoker, CD_GI cancer)                        7
(TU_Non Smoker, R_White)                             7
(R_White, CD_GI cancer)                              7
(R_White, G_Female)                                  7
(CD_GI cancer, G_Female)                             7
(R_White, CTP_No)                                    7
(CD_GI cancer, CTP_No)                               7
(TU_Non Smoker, G_Female)                            7
(TU_Non Smoker, R_White, G_Female)                   3
(CD_GI cancer, CTP_No, G_Female)                     3
(CD_GI cancer, R_White, CTP_No)                      3
(CD_GI can

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(R_White)                                                  15
(CD_Respiratory cancer)                                    15
(CTP_No)                                                   15
(TU_Non Smoker)                                            15
(G_Male)                                                   15
(R_White, G_Male)                                           7
(CD_Respiratory cancer, R_White)                            7
(CD_Respiratory cancer, CTP_No)                             7
(G_Male, CTP_No)                                            7
(TU_Non Smoker, R_White)                                    7
(CD_Respiratory cancer, TU_Non Smoker)                      7
(TU_Non Smoker, G_Male)                                     7
(CD_Respiratory cancer, G_Male)                             7
(TU_Non Smoker, CTP_No)                                     7
(R_White, CTP_No)                                           7
(CD_Respiratory cancer, TU_Non Smoker, CTP_No)              3
(CD_Resp

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(CTP_No)                                                     15
(G_Female)                                                   15
(TU_Non Smoker)                                              15
(R_White)                                                    15
(CD_Respiratory cancer)                                      15
(CTP_No, G_Female)                                            7
(CD_Respiratory cancer, R_White)                              7
(CD_Respiratory cancer, G_Female)                             7
(CD_Respiratory cancer, CTP_No)                               7
(TU_Non Smoker, R_White)                                      7
(TU_Non Smoker, CTP_No)                                       7
(R_White, CTP_No)                                             7
(R_White, G_Female)                                           7
(TU_Non Smoker, G_Female)                                     7
(CD_Respiratory cancer, TU_Non Smoker)                        7
(CD_Respiratory cancer, R_White, CTP_No)

### (2) Agglomerative Clusters

In [6]:
# Keep only the Agglomerative labels alongside the one-hot item columns.
# FreqMine looks up `dbdf` in the notebook namespace, so the name is kept.
dbdf = df.drop(columns=["DBSCAN", "Spectral", "OPTICS", "K_means"])

# Cluster sizes, largest first; the index gives the labels in that order.
agglomerative_sizes = dbdf["Agglomerative"].value_counts()
print(agglomerative_sizes)

clusters = agglomerative_sizes.index
FreqMine(clusters, "Agglomerative")

3    548
9    470
6    412
5    370
1    314
0    312
7    268
8    233
2    217
4     80
Name: Agglomerative, dtype: int64

INTERESTING PATTERNS IN CLUSTER# 3 :


Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(CD_Breast cancer)                                      15
(R_White)                                               15
(CTP_No)                                                15
(TU_Non Smoker)                                         15
(G_Female)                                              15
(R_White, G_Female)                                      7
(CD_Breast cancer, G_Female)                             7
(TU_Non Smoker, R_White)                                 7
(R_White, CD_Breast cancer)                              7
(CTP_No, CD_Breast cancer)                               7
(CTP_No, G_Female)                                       7
(R_White, CTP_No)                                        7
(TU_Non Smoker, G_Female)                                7
(TU_Non Smoker, CD_Breast cancer)                        7
(TU_Non Smoker, CTP_No)                                  7
(R_White, CTP_No, G_Female)                              3
(R_White, CTP_No, CD_Breast cancer)                     

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(CD_Breast cancer)                                         15
(TU_Former Smoker)                                         15
(G_Female)                                                 15
(CTP_No)                                                   15
(R_White)                                                  15
(TU_Former Smoker, R_White)                                 7
(R_White, G_Female)                                         7
(CD_Breast cancer, G_Female)                                7
(TU_Former Smoker, G_Female)                                7
(R_White, CD_Breast cancer)                                 7
(CTP_No, CD_Breast cancer)                                  7
(CTP_No, G_Female)                                          7
(TU_Former Smoker, CD_Breast cancer)                        7
(R_White, CTP_No)                                           7
(TU_Former Smoker, CTP_No)                                  7
(TU_Former Smoker, R_White, CD_Breast cancer)               3
(CD_Brea

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction
0,(TU_Former Smoker),(CD_GU cancer),0.90534,0.961165,0.90534,1.0,1.040404,0.035159,inf
18,"(TU_Former Smoker, G_Male)",(CD_GU cancer),0.871359,0.961165,0.871359,1.0,1.040404,0.033839,inf
24,"(TU_Former Smoker, R_White)",(CD_GU cancer),0.90534,0.961165,0.90534,1.0,1.040404,0.035159,inf
27,(TU_Former Smoker),"(R_White, CD_GU cancer)",0.90534,0.961165,0.90534,1.0,1.040404,0.035159,inf
31,"(TU_Former Smoker, CTP_No)",(CD_GU cancer),0.90534,0.961165,0.90534,1.0,1.040404,0.035159,inf


(CD_GU cancer)                                       15
(TU_Former Smoker)                                   15
(R_White)                                            15
(CTP_No)                                             13
(G_Male)                                             13
(CD_GU cancer, CTP_No)                                7
(TU_Former Smoker, G_Male)                            7
(TU_Former Smoker, R_White)                           7
(TU_Former Smoker, CD_GU cancer)                      7
(G_Male, CTP_No)                                      7
(TU_Former Smoker, CTP_No)                            7
(R_White, CD_GU cancer)                               7
(G_Male, CD_GU cancer)                                7
(R_White, G_Male)                                     6
(R_White, CTP_No)                                     6
(TU_Former Smoker, G_Male, CD_GU cancer)              3
(G_Male, CD_GU cancer, CTP_No)                        3
(R_White, G_Male, CTP_No)                       

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(G_Male)                                                      15
(CD_Respiratory cancer)                                       15
(TU_Former Smoker)                                            15
(R_White)                                                     15
(CTP_No)                                                      15
(TU_Former Smoker, R_White)                                    7
(TU_Former Smoker, CD_Respiratory cancer)                      7
(CD_Respiratory cancer, G_Male)                                7
(CD_Respiratory cancer, R_White)                               7
(R_White, G_Male)                                              7
(G_Male, CTP_No)                                               7
(R_White, CTP_No)                                              7
(TU_Former Smoker, CTP_No)                                     7
(CD_Respiratory cancer, CTP_No)                                7
(TU_Former Smoker, G_Male)                                     7
(TU_Former Smoker, CD_Res

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction
1,(CD_GI cancer),(TU_Former Smoker),0.977707,0.993631,0.977707,1.0,1.00641,0.006227,inf
16,"(CD_GI cancer, G_Male)",(TU_Former Smoker),0.627389,0.993631,0.627389,1.0,1.00641,0.003996,inf
20,"(CD_GI cancer, R_White)",(TU_Former Smoker),0.977707,0.993631,0.977707,1.0,1.00641,0.006227,inf
22,(CD_GI cancer),"(TU_Former Smoker, R_White)",0.977707,0.993631,0.977707,1.0,1.00641,0.006227,inf
26,"(CD_GI cancer, CTP_No)",(TU_Former Smoker),0.977707,0.993631,0.977707,1.0,1.00641,0.006227,inf


(R_White)                                            15
(CTP_No)                                             15
(TU_Former Smoker)                                   11
(CD_GI cancer, G_Male)                                7
(CD_GI cancer)                                        7
(R_White, CTP_No)                                     7
(TU_Former Smoker, R_White)                           5
(TU_Former Smoker, CTP_No)                            5
(TU_Former Smoker, G_Male)                            3
(CD_GI cancer, CTP_No)                                3
(TU_Former Smoker, CD_GI cancer, G_Male)              3
(G_Male)                                              3
(CD_GI cancer, G_Male, CTP_No)                        3
(TU_Former Smoker, CD_GI cancer)                      3
(CD_GI cancer, G_Male, R_White)                       3
(CD_GI cancer, R_White)                               3
(TU_Former Smoker, R_White, CTP_No)                   2
(TU_Former Smoker, R_White, G_Male, CD_GI cancer

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(CD_GI cancer)                            7
(CTP_No)                                  7
(R_White)                                 7
(TU_Non Smoker)                           7
(TU_Non Smoker, R_White)                  3
(R_White, CTP_No)                         3
(CD_GI cancer, CTP_No)                    3
(TU_Non Smoker, CTP_No)                   3
(TU_Non Smoker, CD_GI cancer)             3
(R_White, CD_GI cancer)                   3
(TU_Non Smoker, CTP_No, CD_GI cancer)     1
(CD_GI cancer, R_White, CTP_No)           1
(TU_Non Smoker, R_White, CD_GI cancer)    1
(TU_Non Smoker, R_White, CTP_No)          1
Name: antecedents, dtype: int64

INTERESTING PATTERNS IN CLUSTER# 7 :


Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(R_White)                                                       15
(G_Female)                                                      15
(TU_Former Smoker)                                              15
(CTP_No)                                                        15
(CD_Respiratory cancer)                                         15
(CD_Respiratory cancer, G_Female)                                7
(R_White, G_Female)                                              7
(CD_Respiratory cancer, CTP_No)                                  7
(CTP_No, G_Female)                                               7
(TU_Former Smoker, G_Female)                                     7
(TU_Former Smoker, CTP_No)                                       7
(R_White, CTP_No)                                                7
(TU_Former Smoker, R_White)                                      7
(CD_Respiratory cancer, R_White)                                 7
(TU_Former Smoker, CD_Respiratory cancer)                     

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(CD_GU cancer)                                    15
(R_White)                                         15
(CTP_No)                                          15
(TU_Non Smoker)                                   15
(G_Male)                                          15
(R_White, G_Male)                                  7
(G_Male, CD_GU cancer)                             7
(TU_Non Smoker, R_White)                           7
(R_White, CTP_No)                                  7
(TU_Non Smoker, CTP_No)                            7
(G_Male, CTP_No)                                   7
(TU_Non Smoker, G_Male)                            7
(R_White, CD_GU cancer)                            7
(TU_Non Smoker, CD_GU cancer)                      7
(CD_GU cancer, CTP_No)                             7
(TU_Non Smoker, G_Male, CD_GU cancer)              3
(G_Male, CD_GU cancer, CTP_No)                     3
(R_White, G_Male, CTP_No)                          3
(TU_Non Smoker, G_Male, CTP_No)               

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(CTP_Yes)    1
(R_White)    1
Name: antecedents, dtype: int64

INTERESTING PATTERNS IN CLUSTER# 4 :


Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(R_Nonwhite)          2
(CTP_No)              1
(TU_Former Smoker)    1
Name: antecedents, dtype: int64


### (3) Spectral Clusters

In [7]:
# Keep only the Spectral labels alongside the one-hot item columns.
# FreqMine looks up `dbdf` in the notebook namespace, so the name is kept.
dbdf = df.drop(columns=["DBSCAN", "Agglomerative", "OPTICS", "K_means"])

# Cluster sizes, largest first; the index gives the labels in that order.
spectral_sizes = dbdf["Spectral"].value_counts()
print(spectral_sizes)

clusters = spectral_sizes.index
FreqMine(clusters, "Spectral")

2    605
6    507
3    409
9    373
7    361
4    271
0    239
8    210
5    171
1     78
Name: Spectral, dtype: int64

INTERESTING PATTERNS IN CLUSTER# 2 :


Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction
15,(CTP_No),(R_White),0.943802,0.975207,0.920661,0.975482,1.000282,0.00026,1.011216
39,"(TU_Non Smoker, CTP_No)",(R_White),0.943802,0.975207,0.920661,0.975482,1.000282,0.00026,1.011216
43,(CTP_No),"(TU_Non Smoker, R_White)",0.943802,0.975207,0.920661,0.975482,1.000282,0.00026,1.011216
50,"(CTP_No, G_Female)",(R_White),0.943802,0.975207,0.920661,0.975482,1.000282,0.00026,1.011216
53,(CTP_No),"(R_White, G_Female)",0.943802,0.975207,0.920661,0.975482,1.000282,0.00026,1.011216


(G_Female)                                            15
(TU_Non Smoker)                                       15
(CTP_No)                                               7
(R_White)                                              7
(TU_Non Smoker, G_Female)                              7
(CTP_No, G_Female)                                     3
(CTP_No, CD_Breast cancer)                             3
(CD_Breast cancer)                                     3
(R_White, G_Female)                                    3
(R_White, CTP_No, CD_Breast cancer)                    3
(TU_Non Smoker, R_White)                               3
(R_White, CD_Breast cancer)                            3
(TU_Non Smoker, CTP_No)                                3
(R_White, CTP_No)                                      3
(CD_Breast cancer, R_White, G_Female)                  1
(TU_Non Smoker, R_White, CTP_No)                       1
(TU_Non Smoker, CTP_No, G_Female)                      1
(TU_Non Smoker, R_White, G_Fema

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(CD_Breast cancer)                               15
(CTP_No, G_Female)                                1
(TU_Former Smoker, R_White, CTP_No, G_Female)     1
(TU_Former Smoker, CTP_No, G_Female)              1
(TU_Former Smoker)                                1
(G_Female)                                        1
(TU_Former Smoker, R_White, CTP_No)               1
(R_White, CTP_No, G_Female)                       1
(TU_Former Smoker, R_White, G_Female)             1
(R_White, CTP_No)                                 1
(TU_Former Smoker, G_Female)                      1
(CTP_No)                                          1
(TU_Former Smoker, CTP_No)                        1
(R_White, G_Female)                               1
(TU_Former Smoker, R_White)                       1
(R_White)                                         1
Name: antecedents, dtype: int64

INTERESTING PATTERNS IN CLUSTER# 3 :


Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(G_Male)                                                      15
(CD_Respiratory cancer)                                       15
(CD_Respiratory cancer, G_Male)                                7
(TU_Former Smoker, R_White, CTP_No)                            3
(TU_Former Smoker, CTP_No)                                     3
(R_White)                                                      3
(TU_Former Smoker, R_White)                                    3
(R_White, CTP_No)                                              3
(CTP_No)                                                       3
(TU_Former Smoker)                                             3
(TU_Former Smoker, G_Male, CTP_No)                             1
(G_Male, CTP_No)                                               1
(TU_Former Smoker, CD_Respiratory cancer, CTP_No)              1
(CD_Respiratory cancer, R_White)                               1
(TU_Former Smoker, CD_Respiratory cancer, R_White, CTP_No)     1
(CD_Respiratory cancer, C

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(CD_GU cancer)                                       15
(R_White)                                            15
(CTP_No)                                             15
(TU_Former Smoker)                                   15
(G_Male)                                             15
(CD_GU cancer, CTP_No)                                7
(TU_Former Smoker, CTP_No)                            7
(TU_Former Smoker, R_White)                           7
(TU_Former Smoker, CD_GU cancer)                      7
(R_White, G_Male)                                     7
(G_Male, CTP_No)                                      7
(R_White, CD_GU cancer)                               7
(TU_Former Smoker, G_Male)                            7
(G_Male, CD_GU cancer)                                7
(R_White, CTP_No)                                     7
(R_White, G_Male, CD_GU cancer)                       3
(R_White, G_Male, CTP_No)                             3
(TU_Former Smoker, R_White, CD_GU cancer)       

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction
9,(CTP_No),(R_White),0.958449,0.980609,0.944598,0.985549,1.005037,0.004734,1.341828
30,"(CTP_No, G_Female)",(R_White),0.958449,0.980609,0.944598,0.985549,1.005037,0.004734,1.341828
33,(CTP_No),"(R_White, G_Female)",0.958449,0.980609,0.944598,0.985549,1.005037,0.004734,1.341828
25,"(CD_Respiratory cancer, CTP_No)",(R_White),0.919668,0.980609,0.905817,0.98494,1.004416,0.003982,1.287535
52,"(CD_Respiratory cancer, CTP_No, G_Female)",(R_White),0.919668,0.980609,0.905817,0.98494,1.004416,0.003982,1.287535


(G_Female)                                                     15
(R_White)                                                       9
(CTP_No)                                                        7
(R_White, G_Female)                                             4
(TU_Former Smoker, CD_Respiratory cancer, CTP_No)               3
(TU_Former Smoker, R_White)                                     3
(CD_Respiratory cancer, R_White)                                3
(CD_Respiratory cancer, CTP_No)                                 3
(TU_Former Smoker, CTP_No)                                      3
(CTP_No, G_Female)                                              3
(TU_Former Smoker, CD_Respiratory cancer, CTP_No, G_Female)     1
(CD_Respiratory cancer, R_White, G_Female)                      1
(TU_Former Smoker, CD_Respiratory cancer, R_White)              1
(CD_Respiratory cancer, R_White, CTP_No)                        1
(TU_Former Smoker)                                              1
(CD_Respir

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction
15,(CTP_No),(R_White),0.929889,0.97048,0.907749,0.97619,1.005884,0.00531,1.239852
48,"(CD_GU cancer, CTP_No)",(R_White),0.929889,0.97048,0.907749,0.97619,1.005884,0.00531,1.239852
51,(CTP_No),"(R_White, CD_GU cancer)",0.929889,0.97048,0.907749,0.97619,1.005884,0.00531,1.239852
54,"(G_Male, CTP_No)",(R_White),0.929889,0.97048,0.907749,0.97619,1.005884,0.00531,1.239852
57,(CTP_No),"(R_White, G_Male)",0.929889,0.97048,0.907749,0.97619,1.005884,0.00531,1.239852


(G_Male)                                          15
(CD_GU cancer)                                    15
(CTP_No)                                          11
(R_White)                                         11
(TU_Non Smoker, R_White)                           7
(G_Male, CD_GU cancer)                             7
(TU_Non Smoker, CTP_No)                            7
(CD_GU cancer, CTP_No)                             5
(R_White, G_Male)                                  5
(R_White, CD_GU cancer)                            5
(G_Male, CTP_No)                                   5
(G_Male, TU_Non Smoker, R_White)                   3
(R_White, CTP_No)                                  3
(TU_Non Smoker, R_White, CTP_No)                   3
(TU_Non Smoker, R_White, CD_GU cancer)             3
(TU_Non Smoker, G_Male, CTP_No)                    3
(TU_Non Smoker, CD_GU cancer, CTP_No)              3
(TU_Non Smoker)                                    3
(G_Male, CD_GU cancer, CTP_No)                

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction
7,(CTP_No),(R_White),0.870293,0.958159,0.841004,0.966346,1.008545,0.007125,1.243276
18,"(CTP_No, G_Female)",(R_White),0.870293,0.958159,0.841004,0.966346,1.008545,0.007125,1.243276
21,(CTP_No),"(R_White, G_Female)",0.870293,0.958159,0.841004,0.966346,1.008545,0.007125,1.243276
13,"(CD_GI cancer, CTP_No)",(R_White),0.866109,0.958159,0.83682,0.966184,1.008375,0.00695,1.237298
23,"(CD_GI cancer, CTP_No, G_Female)",(R_White),0.866109,0.958159,0.83682,0.966184,1.008375,0.00695,1.237298


(G_Female)                           7
(CTP_No)                             5
(R_White)                            5
(CD_GI cancer, CTP_No)               3
(CD_GI cancer, R_White)              3
(R_White, G_Female)                  2
(CTP_No, G_Female)                   2
(R_White, CTP_No)                    1
(CD_GI cancer)                       1
(CD_GI cancer, R_White, CTP_No)      1
(CD_GI cancer, R_White, G_Female)    1
(CD_GI cancer, CTP_No, G_Female)     1
Name: antecedents, dtype: int64

INTERESTING PATTERNS IN CLUSTER# 8 :


Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(G_Male)                                             15
(CTP_No)                                             15
(CD_GI cancer)                                       15
(CD_GI cancer, G_Male)                                7
(R_White)                                             7
(TU_Former Smoker, R_White)                           7
(G_Male, CTP_No)                                      7
(CD_GI cancer, CTP_No)                                7
(TU_Former Smoker)                                    7
(TU_Former Smoker, R_White, G_Male)                   3
(TU_Former Smoker, CD_GI cancer, R_White)             3
(TU_Former Smoker, CTP_No)                            3
(CD_GI cancer, R_White)                               3
(CD_GI cancer, G_Male, CTP_No)                        3
(TU_Former Smoker, G_Male)                            3
(R_White, CTP_No)                                     3
(TU_Former Smoker, R_White, CTP_No)                   3
(R_White, G_Male)                               

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(G_Male)                                          15
(CTP_No)                                          15
(G_Male, CTP_No)                                   7
(CD_GI cancer)                                     3
(TU_Non Smoker)                                    3
(R_White)                                          3
(TU_Non Smoker, R_White)                           3
(TU_Non Smoker, R_White, CD_GI cancer)             3
(CD_GI cancer, R_White)                            3
(TU_Non Smoker, CD_GI cancer)                      3
(TU_Non Smoker, G_Male)                            1
(TU_Non Smoker, CTP_No)                            1
(G_Male, CD_GI cancer, R_White)                    1
(TU_Non Smoker, CD_GI cancer, R_White, CTP_No)     1
(CD_GI cancer, CTP_No)                             1
(TU_Non Smoker, CTP_No, CD_GI cancer)              1
(R_White, CTP_No)                                  1
(TU_Non Smoker, G_Male, CD_GI cancer)              1
(CD_GI cancer, R_White, CTP_No)               

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction
0,(TU_Former Smoker),(G_Male),0.628205,0.935897,0.628205,1.0,1.068493,0.04027,inf
12,"(TU_Former Smoker, R_White)",(G_Male),0.628205,0.935897,0.628205,1.0,1.068493,0.04027,inf
15,(TU_Former Smoker),"(R_White, G_Male)",0.628205,0.935897,0.628205,1.0,1.068493,0.04027,inf
18,"(TU_Former Smoker, CTP_Yes)",(G_Male),0.628205,0.935897,0.628205,1.0,1.068493,0.04027,inf
21,(TU_Former Smoker),"(CTP_Yes, G_Male)",0.628205,0.935897,0.628205,1.0,1.068493,0.04027,inf


(CTP_Yes)                               7
(G_Male)                                7
(TU_Former Smoker)                      7
(R_White)                               7
(R_White, G_Male)                       3
(TU_Former Smoker, G_Male)              3
(TU_Former Smoker, CTP_Yes)             3
(CTP_Yes, G_Male)                       3
(TU_Former Smoker, R_White)             3
(CTP_Yes, R_White)                      3
(TU_Former Smoker, CTP_Yes, R_White)    1
(TU_Former Smoker, CTP_Yes, G_Male)     1
(TU_Former Smoker, R_White, G_Male)     1
(CTP_Yes, R_White, G_Male)              1
Name: antecedents, dtype: int64


### (4) OPTICS

In [8]:
# Drop the label columns produced by the other clustering algorithms so that
# only the OPTICS labels remain alongside the one-hot encoded columns.
# NOTE: FreqMine (as defined near the top of the notebook) reads the
# module-level names `dbdf` and `clusters`, so those names must be kept.
other_label_cols = ["DBSCAN", "Agglomerative", "Spectral", "K_means"]
dbdf = df.drop(columns=other_label_cols)

# Cluster sizes, largest first; computed once and reused for both the
# printout and the iteration order handed to FreqMine.
# NOTE(review): label -1 is presumably the OPTICS noise bucket (scikit-learn
# convention) and is mined like a regular cluster here -- confirm intended.
optics_sizes = dbdf["OPTICS"].value_counts()
print(optics_sizes)

clusters = optics_sizes.index
FreqMine(clusters, "OPTICS")

-1    779
 6    548
 5    470
 2    370
 1    359
 4    268
 0    233
 3    197
Name: OPTICS, dtype: int64

INTERESTING PATTERNS IN CLUSTER# -1 :


Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


Series([], Name: antecedents, dtype: int64)

INTERESTING PATTERNS IN CLUSTER# 6 :


Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(CD_Breast cancer)                                      15
(R_White)                                               15
(CTP_No)                                                15
(TU_Non Smoker)                                         15
(G_Female)                                              15
(R_White, G_Female)                                      7
(CD_Breast cancer, G_Female)                             7
(TU_Non Smoker, R_White)                                 7
(R_White, CD_Breast cancer)                              7
(CTP_No, CD_Breast cancer)                               7
(CTP_No, G_Female)                                       7
(R_White, CTP_No)                                        7
(TU_Non Smoker, G_Female)                                7
(TU_Non Smoker, CD_Breast cancer)                        7
(TU_Non Smoker, CTP_No)                                  7
(R_White, CTP_No, G_Female)                              3
(R_White, CTP_No, CD_Breast cancer)                     

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(CD_Breast cancer)                                         15
(TU_Former Smoker)                                         15
(G_Female)                                                 15
(CTP_No)                                                   15
(R_White)                                                  15
(TU_Former Smoker, R_White)                                 7
(R_White, G_Female)                                         7
(CD_Breast cancer, G_Female)                                7
(TU_Former Smoker, G_Female)                                7
(R_White, CD_Breast cancer)                                 7
(CTP_No, CD_Breast cancer)                                  7
(CTP_No, G_Female)                                          7
(TU_Former Smoker, CD_Breast cancer)                        7
(R_White, CTP_No)                                           7
(TU_Former Smoker, CTP_No)                                  7
(TU_Former Smoker, R_White, CD_Breast cancer)               3
(CD_Brea

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(G_Male)                                                      15
(CD_Respiratory cancer)                                       15
(TU_Former Smoker)                                            15
(R_White)                                                     15
(CTP_No)                                                      15
(TU_Former Smoker, R_White)                                    7
(TU_Former Smoker, CD_Respiratory cancer)                      7
(CD_Respiratory cancer, G_Male)                                7
(CD_Respiratory cancer, R_White)                               7
(R_White, G_Male)                                              7
(G_Male, CTP_No)                                               7
(R_White, CTP_No)                                              7
(TU_Former Smoker, CTP_No)                                     7
(CD_Respiratory cancer, CTP_No)                                7
(TU_Former Smoker, G_Male)                                     7
(TU_Former Smoker, CD_Res

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(CD_GU cancer)                                       15
(R_White)                                            15
(CTP_No)                                             15
(TU_Former Smoker)                                   15
(G_Male)                                             15
(CD_GU cancer, CTP_No)                                7
(TU_Former Smoker, CTP_No)                            7
(TU_Former Smoker, R_White)                           7
(TU_Former Smoker, CD_GU cancer)                      7
(R_White, G_Male)                                     7
(G_Male, CTP_No)                                      7
(R_White, CD_GU cancer)                               7
(TU_Former Smoker, G_Male)                            7
(G_Male, CD_GU cancer)                                7
(R_White, CTP_No)                                     7
(R_White, G_Male, CD_GU cancer)                       3
(R_White, G_Male, CTP_No)                             3
(TU_Former Smoker, R_White, CD_GU cancer)       

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(R_White)                                                       15
(G_Female)                                                      15
(TU_Former Smoker)                                              15
(CTP_No)                                                        15
(CD_Respiratory cancer)                                         15
(CD_Respiratory cancer, G_Female)                                7
(R_White, G_Female)                                              7
(CD_Respiratory cancer, CTP_No)                                  7
(CTP_No, G_Female)                                               7
(TU_Former Smoker, G_Female)                                     7
(TU_Former Smoker, CTP_No)                                       7
(R_White, CTP_No)                                                7
(TU_Former Smoker, R_White)                                      7
(CD_Respiratory cancer, R_White)                                 7
(TU_Former Smoker, CD_Respiratory cancer)                     

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(CD_GU cancer)                                    15
(R_White)                                         15
(CTP_No)                                          15
(TU_Non Smoker)                                   15
(G_Male)                                          15
(R_White, G_Male)                                  7
(G_Male, CD_GU cancer)                             7
(TU_Non Smoker, R_White)                           7
(R_White, CTP_No)                                  7
(TU_Non Smoker, CTP_No)                            7
(G_Male, CTP_No)                                   7
(TU_Non Smoker, G_Male)                            7
(R_White, CD_GU cancer)                            7
(TU_Non Smoker, CD_GU cancer)                      7
(CD_GU cancer, CTP_No)                             7
(TU_Non Smoker, G_Male, CD_GU cancer)              3
(G_Male, CD_GU cancer, CTP_No)                     3
(R_White, G_Male, CTP_No)                          3
(TU_Non Smoker, G_Male, CTP_No)               

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(G_Male)                                             15
(CTP_No)                                             15
(TU_Former Smoker)                                   15
(CD_GI cancer)                                       15
(R_White)                                            15
(TU_Former Smoker, CTP_No)                            7
(CD_GI cancer, R_White)                               7
(TU_Former Smoker, R_White)                           7
(CD_GI cancer, CTP_No)                                7
(TU_Former Smoker, CD_GI cancer)                      7
(CD_GI cancer, G_Male)                                7
(TU_Former Smoker, G_Male)                            7
(G_Male, CTP_No)                                      7
(R_White, G_Male)                                     7
(R_White, CTP_No)                                     7
(TU_Former Smoker, CD_GI cancer, CTP_No)              3
(TU_Former Smoker, CD_GI cancer, G_Male)              3
(R_White, G_Male, CTP_No)                       

### (5) K-Means

In [9]:
# Drop the label columns produced by the other clustering algorithms so that
# only the K-Means labels remain alongside the one-hot encoded columns.
# NOTE: FreqMine (as defined near the top of the notebook) reads the
# module-level names `dbdf` and `clusters`, so those names must be kept.
other_label_cols = ["DBSCAN", "Agglomerative", "Spectral", "OPTICS"]
dbdf = df.drop(columns=other_label_cols)

# Cluster sizes, largest first; computed once and reused for both the
# printout and the iteration order handed to FreqMine.
kmeans_sizes = dbdf["K_means"].value_counts()
print(kmeans_sizes)

clusters = kmeans_sizes.index
FreqMine(clusters, "K_means")

2    608
0    515
6    451
1    412
4    410
7    350
5    239
3    239
Name: K_means, dtype: int64

INTERESTING PATTERNS IN CLUSTER# 2 :


Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction
5,(CTP_No),(CD_Breast cancer),0.940789,0.981908,0.925987,0.984266,1.002401,0.002218,1.149854
30,"(CTP_No, G_Female)",(CD_Breast cancer),0.940789,0.981908,0.925987,0.984266,1.002401,0.002218,1.149854
33,(CTP_No),"(G_Female, CD_Breast cancer)",0.940789,0.981908,0.925987,0.984266,1.002401,0.002218,1.149854
15,"(TU_Non Smoker, CTP_No)",(CD_Breast cancer),0.939145,0.981908,0.924342,0.984238,1.002373,0.002188,1.147844
48,"(TU_Non Smoker, CTP_No, G_Female)",(CD_Breast cancer),0.939145,0.981908,0.924342,0.984238,1.002373,0.002188,1.147844


(G_Female)                                              15
(CTP_No)                                                13
(CD_Breast cancer)                                       9
(TU_Non Smoker, CTP_No)                                  7
(CTP_No, G_Female)                                       6
(R_White, CD_Breast cancer)                              5
(TU_Non Smoker, CD_Breast cancer)                        5
(R_White)                                                5
(R_White, CTP_No)                                        5
(G_Female, CD_Breast cancer)                             4
(TU_Non Smoker, R_White)                                 3
(TU_Non Smoker, R_White, CD_Breast cancer)               3
(TU_Non Smoker, CTP_No, G_Female)                        3
(TU_Non Smoker, R_White, CTP_No)                         3
(R_White, G_Female, CD_Breast cancer)                    2
(TU_Non Smoker, G_Female, CD_Breast cancer)              2
(R_White, G_Female)                                     

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(G_Female)                                               15
(TU_Former Smoker)                                       15
(TU_Former Smoker, G_Female)                              7
(CTP_No, CD_Breast cancer)                                3
(R_White, CTP_No, CD_Breast cancer)                       3
(R_White)                                                 3
(CD_Breast cancer)                                        3
(CTP_No)                                                  3
(R_White, CTP_No)                                         3
(R_White, CD_Breast cancer)                               3
(R_White, CTP_No, G_Female)                               1
(CTP_No, G_Female, CD_Breast cancer)                      1
(TU_Former Smoker, CD_Breast cancer, R_White, CTP_No)     1
(TU_Former Smoker, CTP_No)                                1
(TU_Former Smoker, CTP_No, CD_Breast cancer)              1
(CTP_No, G_Female)                                        1
(R_White, G_Female)                     

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction
11,(CTP_No),(R_White),0.906874,0.977827,0.889135,0.98044,1.002672,0.00237,1.133592
25,"(TU_Non Smoker, CTP_No)",(R_White),0.906874,0.977827,0.889135,0.98044,1.002672,0.00237,1.133592
29,(CTP_No),"(TU_Non Smoker, R_White)",0.906874,0.977827,0.889135,0.98044,1.002672,0.00237,1.133592
32,"(G_Male, CTP_No)",(R_White),0.906874,0.977827,0.889135,0.98044,1.002672,0.00237,1.133592
35,(CTP_No),"(R_White, G_Male)",0.906874,0.977827,0.889135,0.98044,1.002672,0.00237,1.133592


(G_Male)                            7
(CTP_No)                            7
(R_White)                           7
(TU_Non Smoker)                     7
(TU_Non Smoker, G_Male)             3
(R_White, CTP_No)                   3
(G_Male, CTP_No)                    3
(TU_Non Smoker, R_White)            3
(R_White, G_Male)                   3
(TU_Non Smoker, CTP_No)             3
(G_Male, TU_Non Smoker, R_White)    1
(TU_Non Smoker, G_Male, CTP_No)     1
(R_White, G_Male, CTP_No)           1
(TU_Non Smoker, R_White, CTP_No)    1
Name: antecedents, dtype: int64

INTERESTING PATTERNS IN CLUSTER# 1 :


Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(G_Male)                                             15
(TU_Former Smoker, R_White, CD_GU cancer, CTP_No)     1
(R_White, CD_GU cancer)                               1
(TU_Former Smoker)                                    1
(TU_Former Smoker, CD_GU cancer, CTP_No)              1
(CD_GU cancer, CTP_No)                                1
(TU_Former Smoker, R_White, CTP_No)                   1
(R_White, CTP_No)                                     1
(CTP_No)                                              1
(R_White, CD_GU cancer, CTP_No)                       1
(TU_Former Smoker, CTP_No)                            1
(TU_Former Smoker, CD_GU cancer)                      1
(TU_Former Smoker, R_White)                           1
(R_White)                                             1
(TU_Former Smoker, R_White, CD_GU cancer)             1
(CD_GU cancer)                                        1
Name: antecedents, dtype: int64

INTERESTING PATTERNS IN CLUSTER# 4 :


Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction


(G_Male)                                                      15
(TU_Former Smoker, CTP_No)                                     1
(R_White, CTP_No)                                              1
(TU_Former Smoker, R_White, CTP_No)                            1
(TU_Former Smoker, CD_Respiratory cancer)                      1
(TU_Former Smoker, CD_Respiratory cancer, R_White)             1
(TU_Former Smoker, CD_Respiratory cancer, CTP_No)              1
(CTP_No)                                                       1
(CD_Respiratory cancer, CTP_No)                                1
(CD_Respiratory cancer, R_White, CTP_No)                       1
(TU_Former Smoker)                                             1
(TU_Former Smoker, CD_Respiratory cancer, R_White, CTP_No)     1
(CD_Respiratory cancer, R_White)                               1
(CD_Respiratory cancer)                                        1
(TU_Former Smoker, R_White)                                    1
(R_White)                

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction
17,(CTP_No),(R_White),0.948571,0.98,0.934286,0.98494,1.005041,0.004686,1.328
57,"(CD_Respiratory cancer, CTP_No)",(R_White),0.948571,0.98,0.934286,0.98494,1.005041,0.004686,1.328
61,(CTP_No),"(CD_Respiratory cancer, R_White)",0.948571,0.98,0.934286,0.98494,1.005041,0.004686,1.328
64,"(CTP_No, G_Female)",(R_White),0.948571,0.98,0.934286,0.98494,1.005041,0.004686,1.328
67,(CTP_No),"(R_White, G_Female)",0.948571,0.98,0.934286,0.98494,1.005041,0.004686,1.328


(G_Female)                                                      15
(CD_Respiratory cancer)                                         15
(CTP_No)                                                        15
(R_White)                                                       11
(CTP_No, G_Female)                                               7
(CD_Respiratory cancer, CTP_No)                                  7
(TU_Former Smoker)                                               7
(TU_Former Smoker, CTP_No)                                       7
(TU_Former Smoker, R_White)                                      7
(CD_Respiratory cancer, G_Female)                                7
(CD_Respiratory cancer, R_White)                                 5
(R_White, G_Female)                                              5
(TU_Former Smoker, CD_Respiratory cancer, CTP_No)                3
(TU_Former Smoker, CD_Respiratory cancer)                        3
(CD_Respiratory cancer, CTP_No, G_Female)                     

Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction
7,(CTP_No),(R_White),0.870293,0.958159,0.841004,0.966346,1.008545,0.007125,1.243276
18,"(CTP_No, G_Female)",(R_White),0.870293,0.958159,0.841004,0.966346,1.008545,0.007125,1.243276
21,(CTP_No),"(R_White, G_Female)",0.870293,0.958159,0.841004,0.966346,1.008545,0.007125,1.243276
13,"(CD_GI cancer, CTP_No)",(R_White),0.866109,0.958159,0.83682,0.966184,1.008375,0.00695,1.237298
23,"(CD_GI cancer, CTP_No, G_Female)",(R_White),0.866109,0.958159,0.83682,0.966184,1.008375,0.00695,1.237298


(G_Female)                           7
(CTP_No)                             5
(R_White)                            5
(CD_GI cancer, CTP_No)               3
(CD_GI cancer, R_White)              3
(R_White, G_Female)                  2
(CTP_No, G_Female)                   2
(R_White, CTP_No)                    1
(CD_GI cancer)                       1
(CD_GI cancer, R_White, CTP_No)      1
(CD_GI cancer, R_White, G_Female)    1
(CD_GI cancer, CTP_No, G_Female)     1
Name: antecedents, dtype: int64

INTERESTING PATTERNS IN CLUSTER# 3 :


Unnamed: 0,antecedents,consequents,antecedent support,consequent support,support,confidence,lift,leverage,conviction
5,(CTP_No),(TU_Former Smoker),0.882845,0.979079,0.866109,0.981043,1.002005,0.001733,1.103556
26,"(CD_GI cancer, CTP_No)",(TU_Former Smoker),0.882845,0.979079,0.866109,0.981043,1.002005,0.001733,1.103556
29,(CTP_No),"(TU_Former Smoker, CD_GI cancer)",0.882845,0.979079,0.866109,0.981043,1.002005,0.001733,1.103556
34,"(G_Male, CTP_No)",(TU_Former Smoker),0.882845,0.979079,0.866109,0.981043,1.002005,0.001733,1.103556
37,(CTP_No),"(TU_Former Smoker, G_Male)",0.882845,0.979079,0.866109,0.981043,1.002005,0.001733,1.103556


(G_Male)                                             15
(CD_GI cancer)                                       15
(TU_Former Smoker)                                   11
(R_White, CTP_No)                                     7
(CTP_No)                                              7
(CD_GI cancer, G_Male)                                7
(TU_Former Smoker, CD_GI cancer)                      5
(TU_Former Smoker, G_Male)                            5
(TU_Former Smoker, R_White)                           3
(R_White, G_Male, CTP_No)                             3
(CD_GI cancer, R_White, CTP_No)                       3
(TU_Former Smoker, CTP_No)                            3
(R_White)                                             3
(CD_GI cancer, CTP_No)                                3
(TU_Former Smoker, R_White, CTP_No)                   3
(G_Male, CTP_No)                                      3
(TU_Former Smoker, CD_GI cancer, G_Male)              2
(TU_Former Smoker, R_White, G_Male, CTP_No)     