In [109]:
import pandas as pd
import ast
import re

from sklearn.metrics import precision_recall_fscore_support, f1_score
from sklearn.preprocessing import MultiLabelBinarizer

import plotly.graph_objects as go

The dessi dataset can be downloaded from   
https://www.kaggle.com/datasets/sensitivedetection/dessi-dataset-for-structured-sensitive-information  
where the only the DeSSI_v2 folder is necessary

# Evaluation - Presidio Confusion Matrix on Dessi Data

Use a Presidio Confusion Matrx to find label errors for Dessi Data  
Use all Predictions of Presidio without any thresholds so that no wrong predictions are ignored

In [110]:
dessi_train_labels = pd.read_csv("DeSSI_v2/train_labels.csv")
dessi_train = pd.read_csv("DeSSI_v2/train.csv")

dessi_dev_labels = pd.read_csv("DeSSI_v2/dev_labels.csv")
dessi_dev = pd.read_csv("DeSSI_v2/dev.csv")

dessi_test_labels = pd.read_csv("DeSSI_v2/test_labels.csv")
dessi_test = pd.read_csv("DeSSI_v2/test.csv")

dessi_all = pd.concat([dessi_train, dessi_dev, dessi_test], axis=1)
dataset_split = ["train"] * dessi_train.shape[1] + ["validation"] * dessi_dev.shape[1] + ["test"] * dessi_test.shape[1]
dataset_split_df = pd.DataFrame(dataset_split).T
dataset_split_df.columns = dessi_all.columns
dessi_all = pd.concat([dessi_all, dataset_split_df]).reset_index(drop=True)

dessi_all_labels = pd.concat([dessi_train_labels, dessi_dev_labels, dessi_test_labels], axis=0).reset_index(drop=True)
dataset_split_df = pd.DataFrame(dataset_split)
dataset_split_df.columns = ["split_type"]
dessi_all_labels = pd.concat([dessi_all_labels, dataset_split_df], axis=1).reset_index(drop=True)


Columns (62,107,161,241,255,324,449,503,686,720,807,812,889,934,1073,1113,1133,1154,1158,1242,1317,1333,1394,1408,1470,1553,1577,1674,1729,1762,1872,1913,1940,2045,2131,2139,2209,2288,2404,2436,2601,2627,2663,2779,2841,2960,2994,3061,3063,3080,3129,3136,3250,3319,3439,3464,3499,3520,3596,3637,3649,3748,3778,3787,3808,3902,3907,3917,3951,4009,4034,4037,4069,4129,4210,4218,4252,4325,4359,4386,4479,4646,4649,4652,4710,4936,4939,5013,5065,5069,5348,5352,5356,5399,5476,5702,5736,5889,5962,6072,6094,6107,6140,6159,6337,6360,6383,6407,6415,6423,6507,6555,6567,6590,6593,6689,6809,6815,6920,6995,7042,7127,7163,7229,7295,7301,7319,7321,7354,7399,7403,7465,7474,7593,7594,7694,7719,7798,7872,7979,8179,8298,8308,8473,8542,8565,8568,8570,8579,8633,8662,8707,8835,8846,8859,8899,8933,9024,9084,9126,9170,9184,9198,9251,9329,9412,9505,9588,9592,9610,9652,9803,9818,9907,9908,9952,9975,10073,10099,10136,10161,10359,10369,10407,10427,10515,10589,10694,10748,10778,10787,10830,10839,10898,11026,11068,11201,

In [111]:
def read_files(method):
    train = pd.read_csv(f"../../Presidio/old_predictions/dessi_results/train/results_{method}.csv")
    val = pd.read_csv(f"../../Presidio/old_predictions/dessi_results/val/results_{method}.csv")
    test = pd.read_csv(f"../../Presidio/old_predictions/dessi_results/test/results_{method}.csv")
    return train, val, test

def concat_results(train, val, test):
    all_results = pd.concat([train, val, test], axis=1)
    dataset_split = ["train"] * dessi_train.shape[1] + ["validation"] * dessi_dev.shape[1] + ["test"] * dessi_test.shape[1]
    dataset_split_df = pd.DataFrame(dataset_split).T
    dataset_split_df.columns = all_results.columns
    return pd.concat([all_results, dataset_split_df]).reset_index(drop=True).T.reset_index(drop=True).T     #reset index and column names

results_method3_train, results_method3_val, results_method3_test = read_files("columnwise")

results_method_3_all = concat_results(results_method3_train, results_method3_val, results_method3_test)

The Classes of Presidio must be mapped to the classes of dessi to compare both

In [112]:
# Mapping dictionary
# IN_VEHICLE_REGISTRATION, IP_ADDRESS, MEDICAL_LICENSE, URL, US_BANK_NUMBER are matched to "Other_data"
CATEGORY_MAP = {
    "AU_TFN": "NIN",
    "AU_MEDICARE": "NIN",
    "IN_AADHAAR": "NIN",
    "IN_PAN": "NIN",
    "IN_PASSPORT": "Passport",
    "UK_NHS": "NIN",
    "US_ITIN": "NIN",
    "US_SSN": "NIN",
    "AU_ABN": "Organization",
    "AU_ACN": "Organization",
    "CREDIT_CARD": "CCN",
    "DATE_TIME": "Date",
    "shared DATE_TIME": "Date",
    "EMAIL_ADDRESS": "Email",
    "IBAN_CODE": "IBAN",
    "LOCATION": ["Geolocation", "Address", "GPE"],
    "shared LOCATION": ["Geolocation", "Address", "GPE"],
    "NRP": ["Nationality", "Religion"],  
    "shared NRP": ["Nationality", "Religion"],
    "PERSON": "Person",
    "shared PERSON": "Person",
    "PHONE_NUMBER": "Phone_number",
    "shared PHONE_NUMBER": "Phone_number",
    "US_DRIVER_LICENSE": "ID_Card",
    "shared US_DRIVER_LICENSE": "ID_Card",
    "US_PASSPORT": "Passport",
    "shared IN_PAN": "NIN",
}

In [113]:
def get_categories(strings):
    if strings == []:
        return ["Other_data"]
    results = []
    for s in strings:
        category = CATEGORY_MAP.get(s, "Other_data")
        if isinstance(category, list):
            results.extend(category) 
        else:
            results.append(category)  
    return results

def convert_labels(label_str):
    return [label.strip() for label in label_str.replace('{', '').replace('}', '').replace("'", "").split(',')]

def build_dataframe(results_df, threshold_score, threshold_count):
    height, width = results_df.shape
    results_copy = results_df.copy()
    print(f"Threshold score: {threshold_score}\nThreshold count: {threshold_count}")
    empty_row1 = [[] for _ in range(width)]
    empty_row2 = [[] for _ in range(width)]
    empty_row3 = [[] for _ in range(width)]
    results_copy.loc[height] = empty_row1.copy()
    results_copy.loc[height+1] = empty_row2.copy()
    results_copy.loc[height+2] = empty_row3.copy()
    for i in range(width):
        series = pd.Series([item for sublist in results_copy.iloc[2:height:2, i]
                        for item in ast.literal_eval(sublist)], dtype="object").value_counts()
        for a, b in series.items():
            if b > threshold_count:
                results_copy.iloc[height, i].append(a)
                results_copy.iloc[height+1, i].append(b)
    for i in range(width):
        entities = [re.sub(r'_\d+(\.\d+)?$', '', item)
                    for item in results_copy.iloc[height, i] if float(re.search(r'(\d+\.\d+)', item).group(1)) >= threshold_score]
        mapped_entities = get_categories(entities)
        results_copy.iloc[height+2, i] = str(set(mapped_entities))

    results_copy.loc[0] = results_copy.loc[0].apply(convert_labels)
    results_copy.loc[height+2] = results_copy.loc[height+2].apply(convert_labels)
    return results_copy

def compute_performance(results, confusion = False):
    results_copy = results.copy()
    mlb = MultiLabelBinarizer()
    y_true = mlb.fit_transform(results_copy.loc[0])
    y_pred = mlb.transform(results_copy.loc[results_copy.shape[0]-1])
    precision, recall, f1, support = precision_recall_fscore_support(
        y_true, y_pred, average=None, zero_division=0)
    f1_micro = f1_score(y_true, y_pred, average='micro')
    f1_macro = f1_score(y_true, y_pred, average='macro')
    f1_weighted = f1_score(y_true, y_pred, average='weighted')
    evaluation = pd.DataFrame({
        'Class': mlb.classes_,
        'P': precision,
        'R': recall,
        'F1': f1,
        'S': support
    }).sort_values("S", ascending=False).reset_index(drop=True)
    print(f'Micro F1 Score: {f1_micro:.4f}')
    print(f'Macro F1 Score: {f1_macro:.4f}')
    print(f'Weighted F1 Score: {f1_weighted:.4f}')
    
    if confusion == True:
        y_true_df = pd.DataFrame(y_true)
        y_pred_df = pd.DataFrame(y_pred)

        confusion_matrix = []
        for i in range(20):
            pred_true_compare = y_pred_df.loc[y_pred_df.index.isin(y_true_df.loc[y_true_df[i] == 1].index)]
            arr_label = []
            for j in range(20):
                val = pred_true_compare.loc[:, j].value_counts(normalize=True).get(1)
                arr_label.append(val.item() if val != None else 0)
            confusion_matrix.append(arr_label)
        fig = go.Figure(go.Heatmap(z=confusion_matrix, x=mlb.classes_, y=mlb.classes_, colorscale='Blues'))
        fig.update_layout(title_text='Confusion Matrix', height=800, width=800)
        fig.update_xaxes(title="Predicted Label")
        fig.update_yaxes(title="True Label")
        fig.show()
    return evaluation

# Analyze Presidio Confusion Matrix Part 1

Get a confusion matrix without thresholds to compare all Presidio predictions with the real labels  
Try to find label errors in Dessi  
Use columnwise approach as it is similar to CASSED approach and all three approaches perform similar for no thresholds so the approach does not matter

In [114]:
dessi_cleaned = dessi_all
dessi_labels_cleaned = dessi_all_labels
wrong_columns = []

In [115]:
results_method3_thresholds = build_dataframe(results_method_3_all, 0, 0)
evaluation_method3 = compute_performance(results_method3_thresholds, confusion = True) # Best threshold_score and threshold_count

print(evaluation_method3)

Threshold score: 0
Threshold count: 0
Micro F1 Score: 0.2469
Macro F1 Score: 0.2354
Weighted F1 Score: 0.3321


           Class         P         R        F1     S
0     Other_data  0.137213  0.242951  0.175377  6561
1   Phone_number  0.377567  0.990493  0.546727  4418
2        Address  0.169818  0.843240  0.282704  3802
3         Person  0.204139  0.999721  0.339046  3582
4            NIN  0.219195  0.651773  0.328062  3469
5          Email  1.000000  0.995926  0.997959  3191
6           Date  0.153270  0.985622  0.265286  2782
7            GPE  0.104825  0.911142  0.188020  2172
8   Organization  0.001077  0.001445  0.001234  2076
9    Geolocation  0.035701  0.327502  0.064384  2058
10     SWIFT/BIC  0.000000  0.000000  0.000000   240
11          IBAN  0.892019  0.892019  0.892019   213
12           CCN  0.345098  0.807339  0.483516   109
13      Passport  0.046512  0.388889  0.083086   108
14        Gender  0.000000  0.000000  0.000000    94
15      Religion  0.012819  1.000000  0.025313    93
16     Sexuality  0.000000  0.000000  0.000000    92
17   Nationality  0.012543  1.000000  0.024775

The classes gender, organization, Race, SWIFT/BIC and sexuality can't be predicted by Presidio, as a result P/R/F1 is zero for these classes

Analyse Presidio mistakes  
First focus on the false negatives for every class, so look at the predictions which predicted other classes than the actual groundtruth

In [116]:
def analyse_class(class_label, focus="false negatives"):
    reduced_columns = results_method3_thresholds.iloc[:,dessi_all_labels.loc[dessi_all_labels["label"].str.contains(class_label)].index].T
    indi = []
    if focus == "false negatives":
        for i, a in zip(reduced_columns.index, reduced_columns[204]):
            if class_label not in a:
                indi.append(i)
    elif focus == "true positives":
        for i, a in zip(reduced_columns.index, reduced_columns[204]):
            if class_label in a:
                indi.append(i)
    else:
        raise ValueError("Focus should be either 'false negatives' or 'true positives'")
    d = dessi_all.iloc[:,[int(a) for a in reduced_columns.T[indi].columns.values]]
    add_info = reduced_columns.T[indi].iloc[[0,204],:]
    add_info.columns = d.columns
    df = pd.concat([add_info, d]).reset_index(drop=True)
    return df

'analyse_class' returns the false negative if the parameter 'focus' is not change  
first row display the groundtruth label and the second row of the dataframe the predictions, the other rows are the column values

In [117]:
df_address = analyse_class("Address")
pd.set_option('display.max_columns', 600)
df_address.head()

Unnamed: 0,aefoxiqjscpw,zip_code,vmwfwqqsnoic,country_code,zip,country_code.1,zip_code.1,zip_code.2,postc,rpxxiumyhlae,zip_code.3,zip_code.4,crxnjlldutum,zip.3,dwecggdbwnco,zipcode.1,pxltxbopsejw,postal_code.2,postal_code.5,jquonjkqmfiq,zip.4,mfeweqkheals,zip_code.6,zipcode.2,postal_code.6,lyydqikplrjv,zip_code.8,country_code.2,eamiqywoifjj,postc.1,zip_code.9,zipcode.3,zip_code.10,jwxpcokehrke,location.1,country_code.4,kilxuqjhkbxy,house_number,zip.6,zip_code.12,postc.2,gchzzbkofkvv,zip.7,kvdojtkwrsss,jkmdosfzqtok,postal_code.10,zip.8,pckfjubhvrso,zip_code.13,zipcode.4,postal_code.11,knoryrzdsoao,zip.9,qxcjviesqxrl,postcode.2,zipcode.5,postcode.3,zip.10,sktqitphfbls,postc.3,zipcode.6,zip_code.15,cbmpaziqnwzr,zip_code.16,zipcode.7,zipcode.8,saahfmplzdnr,postcode.7,zip_code.17,mrvwmvqphvio,zip_code.19,country_code.7,house_number.2,postal_code.14,tcqagfphmhfo,nujfmwqtchow,zipcode.9,zip_code.20,postal_code.15,zipcode.10,oelzemzggkla,cmosuftohfsj,ouhymyfutodh,zip.12,zip.13,postal_code.17,zip_code.21,vxcaynpxyvnc,zipcode.11,postal_code.18,xogafltwrqqc,zip.15,postal_code.19,zip_code.22,sxsymizrrnhf,zip.17,postal_code.20,oifjiggjllae,location_id.5,zip_code.23,jkzemsbeqhbo,zip_code.24,house_number.3,husndpjlsyxe,house_number.4,postc.4,nianjueahqym,house_number.5,postc.5,buijuelmzggf,zipcode.12,zipcode.13,osackobckpuq,quhkldkvphkt,zip_code.27,postcode.10,zipcode.14,house_number.6,ypkdexqrcfcb,zip.19,azjdgelpoejj,postal_code.24,iqzpkozzuzms,djfnkmahehsv,postc.7,zip_code.28,house_number.7,nhibyotdcxqs,zip.20,house_number.8,oeqorpqhverv,vksddewyefhq,zipcode.15,house_number.9,befuvvhxogwi,zip_code.29,rutydrpkxcxx,house_number.10,zlndfnlyrbzd,postc.8,tmvbpmfhhcwv,wswrqbbvsjfr,country_code.14,wxxwbnvuubbf,postc.9,zipcode.16,postcode.11,postal_code.25,zip_code.30,postc.10,house_number.11,xcecpnovxkxd,rufbblgjkafy,nwkohfhvgsfv,teohqlkbbsna,mvxdtldxlurh,country_code.15,zipcode.17,vbrwvaxhvmkg,jtltckqzxslc,zip_code.31,zipcode.18,iaaadyfzqzds,zip_code.32,zip.24,pflmllflggwn,lxbzxczfkrwf,house_number.12,zip_code.34,postc.12,zip_code.35,zip.26,sropxbmzbkbw,zip_code.36,zqwwsgrrcurx,zip_code.37,ssqrqhugrpva,zip_code.38,yigioqblrywx,postcode.12,zip.27,zvlughotfljl,zip_code.39,house_number.13,postcode.13,postc.13,yraplsrtxuwi,postal_code.29,postal_code.30,dtxttdthjbym,house_number.14,house_number.15,house_number.16,zip_code.42,house_number.17,house_number.18,postc.14,zipcode.19,zipcode.20,rdkytiyyfsba,pndocuqrbyuw,city.41,zipcode.21,postc.16,zzdijvkpnaoi,zip_code.43,kucvvtrossuf,mhyhcvwpryrh,zipcode.22,house_number.19,postal_code.34,postc.17,postcode.16,postcode.17,grktyboexsih,postcode.18,zjuvmwfuddoz,postal_code.35,rkfhjyojrqsh,odrrrxajhhez,postal_code.36,zryrhvpuzjml,postc.18,smqbxlhxqiej,zip.29,zipcode.23,zip.30,postc.19,postc.20,country_code.19,house_number.20,fekgmkmctxiy,country_code.20,latitude.32,zip_code.44,xybdpztfbvyq,zip.31,zip_code.45,postal_code.37,lkzjvygxsknf,sniugznsjnjn,zip_code.46,postc.21,xjiaxyqacwgq,gvfiwrgicheh,bccyikuaubbx,postc.22,zip_code.47,yyrxlnmsuzyv,postc.23,zip_code.48,zip.32,tsuoonieoxim,zip.33,postcode.20,jslsaftvdyjv,jfibufhqnhcf,house_number.21,jxyweotltnxt,evvcgfgmbuhv,postal_code.40,zip.34,tkhgvdzeizat,zipcode.25,zipcode.26,postcode.22,eldojcgatook,postcode.23,fapkauysacxt,zip.36,postc.25,country_code.22,zip_code.49,zipcode.27,zip_code.50,zip_code.51,ctupykepdjhj,zip_code.52,zip_code.54,zip_code.55,zipcode.28,zip.37,postal_code.43,zip.38,zip.39,zip.40,country_code.23,zip_code.57,euhfdbmkkgwy,postc.26,goipzzpplgos,zipcode.29,house_number.22,postcode.24,hehofiwojfvo,postc.27,kgurepuevnqv,zip_code.58,zip.42,house_number.23,house_number.24,zip_code.59,country_code.25,postc.28,zip_code.60,postal_code.46,mrxofygsyfip,zipcode.30,wzgweuwnhtfg,postc.29,zip.44,ndiduypjdrbm,zip.45,wktmmsdtqvfi,dejjnairpkhg,kgqlkkwbfeop,postc.30,zipcode.31,uhkirubvlktv,nhbcjglhmrim,euhyjvqtagbw,bfghzbikugme,country_code.29,postal_code.49,iepubepvmfzx,postcode.25,oaergyjxjwxc,zip_code.61,country_code.30,vivzytwkvrys,crgqwwowoaxt,zip_code.62,wzmvsenjjvht,aoyombisrkmp,wtgzpordibkc,rqxrglagsrkc,house_number.25,zip_code.63,postc.32,jrhfamsdtvba,zipcode.32,postc.33,zip_code.64,postal_code.50,postc.34,tumdhgktunme,postal_code.51,house_number.26,postal_code.52,qigwmzbfzyqi,zip_code.66,qjzlgztkgowa,postc.35,zip_code.67,zipcode.33,zip.49,kyypuxxfacqd,zipcode.34,rfrravymvvzj,pvruxnhtcdmw,house_number.27,zipcode.35,mdmjjiyavuwr,nwnpobkvguxz,postal_code.55,vrzoxztlhpcr,house_number.28,postcode,postc.24,cylaicnhfksr,country_code.3,bkxrgqxkwbja,zip_code.33,postal_code,postal_code.3,country_code.1.1,postal_code.4,zipcode.1.1,gipustqwoipo,zip.1,tbeeubladptp,zip_code.1.1,cporndogjgkw,ntjdcszxcpjn,postc.1.1,zip_code.2.1,postc.2.1,zip.2,house_number.1,idnzouwlhkyo,hkqxxaagrwzl,zip_code.4.1,zip.3.1,pkhcprscrosj,zip.4.1,zip_code.5,zipcode.2.1,house_number.2.1,azxozqiojdpo,zip_code.6.1,ojzupxjbzyjm,postc.4.1,pqikpvdckxts,odpeuygyvutb,house_number.3.1,ngcmhxruzbjo,zip_code.7,xkwtsxrmirfl,postal_code.7,zip.8.1,ijzmbosslusk,gzhkbkxhvzft,zip.9.1,xjvnvqymremp,postc.5.1,country_code.8,wdectshfqapy,djjoohqkxdly,tjogrfryyxgo,pusclmwcnfhu,zip_code.9.1,zipcode.3.1,zipcode.4.1,postal_code.10.1,postcode.2.1,postal_code.11.1,house_number.4.1,zip.10.1,postal_code.12,webjxtxauovu,country_code.9,bhizdeeflqct,postc.7.1,country_code.10,zip.12.1,zip.13.1,ewasuccsiigk,postcode.4,zipcode.5.1,zip.14,postc.8.1,zipcode.6.1,house_number.5.1,house_number.6.1,country_code.12,postcode.5,postal_code.15.1,house_number.7.1,postal_code.16,zipcode.7.1,zipcode.8.1,postcode.6,zip.16,msalfazgfluw,zipcode.9.1,sqvponwelwuk,postal_code.17.1,zip_code.11,rjbkmrgkbmzj,house_number.8.1,postc.9.1,zip.18,dkrfbkcteeyq,postal_code.18.1,postcode.8,zip_code.12.1,country_code.13,postal_code.19.1,zip_code.13.1,postal_code.20.1,zip.19.1,zip_code.14,postal_code.21,ccswupwfxqvj,pvskxtgyxgvi,house_number.9.1,country_code.15.1,uhoisnetfmol,zip.20.1,zipcode.10.1,postcode.14,zip.1.1,postc.2.2,wclnwtftdhsr,house_number.29,zip.3.2,house_number.1.1,zip_code.40,postal_code.1,house_number.2.2,postcode.1,postc.3.1,zip_code.1.2,unondxkmgapq,zip.4.2,zip.5,country_code.2.1,zip_code.2.2,zip_code.3.1,zip.6.1,postal_code.5.1,postcode.3.1,ifyikppdlliv,zip_code.4.2,postc.5.2,postc.6,house_number.3.2,postc.7.2,zipcode.1.2,zipcode.2.2,zip_code.5.1,postcode.5.1,house_number.4.2,postc.8.2,zip_code.6.2,postal_code.6.1,zip.9.2,postal_code.7.1,amkrdsyvykqc,xggjgimwkufi,postal_code.8,zip_code.10.1,xjpntebwcqiy,zlglikcvweeq,zip_code.12.2,house_number.5.2,postc.10.1,usvfxtslplnq,wsfzaeuiqcyb,house_number.6.2,addvogzxpanx,postc.11,postc.12.1,zip_code.13.2,postal_code.10.2,wrknvboktdjl,fojvzdadhwwo,postal_code.12.1,postcode.8.1,vdbavzsmqudy,house_number.7.2,postal_code.13,country_code.5,ihpnftohegeq,zip.12.2,zipcode.3.2,zip_code.14.1,qfehrnfgdjbe,zip_code.15.1,postcode.9,country_code.7.1,postc.14.1,zip_code.16.1,zip_code.17.1,browbblqwxbz,nnbjjizowywm,zip_code.18,kfaxknyooyvn,postal_code.14.1,fnahexxiljbl,vskzlmfpjhwf,wekgjdydctxi,zipcode.4.2,zip_code.19.1,zip_code.20.1,zip_code.21.1,zip.14.1,ejbswctgwghf,khycwawrifht,asudbxjqmonh,buvvvqwiqfup,zip_code.22.1,country_code.8.1,zip_code.23.1,house_number.8.2,iqjeolrqkvnl,zip_code.24.1,house_number.9.2,zip.16.1,wclctttzhvqf,zip_code.25,postc.15,xzuvpwvbyojt,zip.18.1,zip_code.26,zip_code.27.1,aaxczkifukkr,zip_code.28.1,zip_code.29.1,zip_code.30.1,omawoqigngbh,postc.16.1,zip_code.32.1,address_line1,house_number.10.1,mdlxqoyjfkos
0,[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],"[Address, Geolocation]",[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],"[Address, Geolocation]",[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],"[Geolocation, Address]",[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address],[Address]
1,"[ID_Card, Date]","[Phone_number, Date, NIN]","[Phone_number, Date, NIN]",[Person],[Date],[Person],"[Phone_number, ID_Card, Date, NIN]","[Phone_number, Date, NIN]","[ID_Card, Date]","[Phone_number, Person, ID_Card, NIN, Date]","[Phone_number, ID_Card, Date, NIN]","[Phone_number, Date, NIN]",[Person],[Date],"[Phone_number, Date, NIN]",[Date],[Person],"[Phone_number, ID_Card, Date, NIN]","[Phone_number, ID_Card, Date, NIN]","[Person, Date]",[Date],"[Phone_number, Person, ID_Card, NIN, Date]","[Phone_number, Date, NIN]",[Date],"[Phone_number, ID_Card, Date, NIN]",[Date],"[Phone_number, Date, NIN]",[Person],"[Phone_number, ID_Card, Date, NIN]","[ID_Card, Date]","[Phone_number, Date, NIN]",[Date],"[Phone_number, Date, NIN]","[Phone_number, ID_Card, Date, NIN]",[Other_data],[Person],"[ID_Card, Date]",[Date],[Date],"[Phone_number, Date, NIN]","[ID_Card, Date]","[Person, Date]",[Date],[Date],"[Person, Date]","[Phone_number, ID_Card, Date, NIN]",[Date],[Date],"[Phone_number, ID_Card, Date, NIN]",[Date],"[Phone_number, ID_Card, Date, NIN]",[Date],[Date],"[Phone_number, Date, NIN]","[Phone_number, Date, NIN]",[Date],"[ID_Card, Date, NIN]",[Date],[Date],"[ID_Card, Date]",[Date],"[Phone_number, Date, NIN]",[Date],"[Phone_number, ID_Card, Date, NIN]",[Date],[Date],"[Phone_number, Person, ID_Card, NIN, Date]","[ID_Card, Date, Other_data]","[Phone_number, ID_Card, Date, NIN]",[Date],"[Phone_number, ID_Card, Date, NIN]",[Person],[Date],"[Phone_number, Person, ID_Card, NIN, Date]","[Phone_number, Date, NIN]","[Phone_number, ID_Card, Date, NIN]",[Date],"[Phone_number, ID_Card, Date, NIN]","[Phone_number, ID_Card, Date, NIN]","[Person, Date]","[Phone_number, ID_Card, Date, NIN]",[Date],"[Phone_number, ID_Card, Date, NIN]",[Date],[Date],"[Phone_number, ID_Card, Date, NIN]","[Phone_number, ID_Card, Date, NIN]",[Date],[Date],"[Phone_number, ID_Card, Date, NIN]",[Date],[Date],"[Phone_number, ID_Card, Date, NIN]","[Phone_number, ID_Card, Date, NIN]",[Date],[Date],"[Phone_number, ID_Card, Date, NIN]","[Phone_number, ID_Card, Date, NIN]","[Phone_number, ID_Card]","[Phone_number, ID_Card, Date, NIN]","[Phone_number, Date, NIN]","[Phone_number, ID_Card, Date, NIN]",[Date],[Date],[Date],"[ID_Card, Date]","[Phone_number, Date, NIN]",[Date],"[ID_Card, Date]","[Person, Date]",[Date],"[Person, Date]",[Other_data],"[Phone_number, ID_Card, Date, NIN]","[Phone_number, ID_Card, Date, NIN]","[Phone_number, ID_Card, Date, NIN]",[Date],[Date],"[Phone_number, Person, Date, NIN]",[Date],[Date],"[Phone_number, ID_Card, Date, NIN]",[Person],[Date],"[ID_Card, Date]","[Phone_number, Date, NIN]",[Date],[Date],[Date],[Date],"[Phone_number, ID_Card, Date, NIN]",[Date],"[Person, Date]",[Date],[Date],"[Phone_number, Date, NIN]",[Date],[Date],"[Phone_number, Date, NIN]","[ID_Card, Date]","[Phone_number, Person, Date, NIN]","[ID_Card, Date]",[Person],"[ID_Card, Date]","[ID_Card, Date]",[Date],"[Phone_number, Other_data, ID_Card, NIN, Date]","[Phone_number, ID_Card, Date, NIN]","[Phone_number, Date, NIN]","[ID_Card, Date]",[Date],[Date],"[Person, Date]","[Phone_number, ID_Card, Date, NIN]",[Date],"[Phone_number, ID_Card, Date, NIN]",[Person],[Date],"[ID_Card, Date]","[Phone_number, Person, ID_Card, NIN, Date]","[Phone_number, Date, NIN]",[Date],[Date],"[ID_Card, Date]",[Date],"[Phone_number, Person, ID_Card, NIN, Date]",[Date],[Date],"[Phone_number, ID_Card, Date, NIN]","[ID_Card, Date]","[Phone_number, ID_Card, Date, NIN]",[Date],[Date],"[Phone_number, Date, NIN]","[Phone_number, Person, Date, NIN]","[Phone_number, ID_Card, Date, NIN]",[Date],"[Phone_number, Date, NIN]",[Date],"[Phone_number, Other_data, ID_Card, NIN, Date]",[Date],"[Phone_number, Date, NIN]","[Phone_number, ID_Card, Date, NIN]",[Date],"[Phone_number, Other_data, Person, ID_Card, NI...","[ID_Card, Date]","[Phone_number, ID_Card, Date, NIN]","[Phone_number, ID_Card, Date, NIN]","[Phone_number, ID_Card, Date, NIN]","[Phone_number, ID_Card, Date, NIN]",[Date],[Date],[Date],"[Phone_number, ID_Card, Date, NIN]",[Date],[Date],"[ID_Card, Date]",[Date],[Date],"[Phone_number, Date, NIN]",[Person],"[Phone_number, ID_Card]","[Person, Date]","[ID_Card, Date]","[Phone_number, ID_Card, Date, NIN]","[Phone_number, Date, NIN]","[Phone_number, ID_Card, Date, NIN]",[Date],[Date],[Date],"[Phone_number, ID_Card, Date, NIN]","[ID_Card, Date]","[Phone_number, Date, NIN]","[Date, NIN]","[Person, Date, ID_Card]","[Phone_number, Person, Date, NIN]",[Person],"[Phone_number, ID_Card, Date, NIN]","[Phone_number, ID_Card, Date, NIN]","[ID_Card, Date, NIN, Person]","[Phone_number, ID_Card, Date, NIN]",[Date],"[ID_Card, Date]",[Date],[Date],[Date],[Date],"[ID_Card, Date]",[Date],[Person],[Date],[Date],[Person],"[Phone_number, Person, ID_Card]","[Phone_number, ID_Card, Date, NIN]","[Phone_number, Date, NIN]",[Date],"[Phone_number, Date, NIN]","[Phone_number, ID_Card, Date, NIN]",[Date],"[Person, Date]","[Phone_number, Date, NIN]","[ID_Card, Date]",[Person],[Date],[Date],"[ID_Card, Date]","[Phone_number, ID_Card, Date, NIN]","[Person, Date]","[ID_Card, Date]","[Phone_number, Date, NIN]",[Date],"[Person, Date]",[Date],[Date],"[ID_Card, Date]","[Phone_number, Date, NIN]",[Date],[Person],[Date],"[Phone_number, ID_Card, Date, NIN]",[Date],"[ID_Card, Date]",[Date],[Date],"[Phone_number, Date, NIN]","[ID_Card, Date]","[ID_Card, Date, NIN]",[Date],[Date],[Date],[Person],"[Phone_number, Date, NIN]","[Person, Date]","[Phone_number, Date, NIN]","[Phone_number, ID_Card, Date, NIN]",[Date],"[Phone_number, ID_Card, Date, NIN]",[Date],"[Phone_number, ID_Card, Date, NIN]","[Person, Date]",[Date],"[Phone_number, ID_Card, Date, NIN]",[Date],[Date],[Date],[Person],"[Phone_number, Date, NIN]","[Person, Date]","[ID_Card, Date]","[Phone_number, Other_data, Person, ID_Card, NI...",[Date],[Date],"[Phone_number, Date, NIN]","[Person, Date]","[ID_Card, Date]","[Phone_number, ID_Card, Date, NIN]","[Phone_number, ID_Card, Date, NIN]",[Date],[Date],"[Person, Date]","[Phone_number, Date, NIN]",[Person],"[ID_Card, Date]","[Phone_number, Date, NIN]","[Phone_number, ID_Card, Date, NIN]","[Person, Date]",[Date],[Date],"[ID_Card, Date]",[Date],"[Phone_number, ID_Card, Date, NIN]",[Date],"[Phone_number, ID_Card, Date, NIN]","[Phone_number, ID_Card, Date, NIN]","[Phone_number, Date, NIN]","[ID_Card, Date]",[Date],[Person],[Person],[Date],[Date],[Person],"[Phone_number, ID_Card, Date, NIN]",[Person],[Date],"[Phone_number, Date, NIN]","[Phone_number, ID_Card, Date, NIN]",[Person],[Date],"[ID_Card, Date]","[Phone_number, Date, NIN]","[Phone_number, Date, NIN]",[Date],"[Person, Date]",[Date],[Date],"[Phone_number, Date, NIN]","[ID_Card, Date]","[Person, Date]",[Date],"[ID_Card, Date]","[Phone_number, ID_Card, Date, NIN]","[Phone_number, ID_Card, Date, NIN]","[ID_Card, Date]","[Person, Date]","[Phone_number, ID_Card, Date, NIN]",[Date],"[Phone_number, ID_Card, Date, NIN]","[Phone_number, ID_Card, Date, NIN]",[Date],"[Phone_number, Date, NIN]","[ID_Card, Date]","[Phone_number, Date, NIN]",[Date],[Date],[Date],[Date],"[ID_Card, Date]","[Phone_number, Person, ID_Card, NIN, Date]",[Date],[Date],"[Phone_number, ID_Card, Date, NIN]","[ID_Card, Date, Person]","[Phone_number, ID_Card, Date, NIN]",[Date],[Date],"[Phone_number, Person, Date, NIN]",[Date],[Date],[Person],[Date],"[Phone_number, Date, NIN]","[Phone_number, ID_Card, Date, NIN]","[Phone_number, ID_Card, Date, NIN]",[Person],"[Phone_number, ID_Card, Date, NIN]",[Date],[Date],"[Person, Date]",[Date],"[Phone_number, ID_Card, Date, NIN]","[Phone_number, Date, NIN]",[Date],[Date],"[Phone_number, Date, NIN]","[ID_Card, Date]",[Date],[Date],[Date],[Date],"[Phone_number, ID_Card, Date, NIN]",[Date],"[ID_Card, Date]",[Date],[Date],[Date],[Date],[Date],"[Phone_number, ID_Card, Date, NIN]",[Date],"[ID_Card, Date]",[Person],[Date],[Date],[Date],"[Phone_number, ID_Card, Date, NIN]",[Date],"[Phone_number, ID_Card, Date, NIN]",[Date],"[Phone_number, ID_Card, Date, NIN]","[Person, Date]",[Date],[Date],"[ID_Card, Date]",[Person],[Date],[Date],[Date],"[Person, Date]","[Phone_number, ID_Card, Date, NIN]",[Date],[Date],"[Phone_number, Person, ID_Card, NIN, Date]","[Phone_number, Person, Date, NIN]","[Phone_number, ID_Card, Date, NIN]",[Date],[Date],"[Phone_number, ID_Card, Date, NIN]",[Date],[Person],[Date],"[ID_Card, Date]",[Person],[Date],[Date],"[Phone_number, ID_Card, Date, NIN]","[Phone_number, ID_Card, Date, NIN]",[Date],[Date],"[ID_Card, Date]",[Date],[Date],[Date],[Person],"[Phone_number, Other_data, ID_Card, NIN, Date]","[Phone_number, ID_Card, Date, NIN]",[Date],"[Phone_number, ID_Card, Date, NIN]",[Date],[Date],"[Other_data, Person, ID_Card, NIN, Date]",[Date],[Date],[Date],"[Phone_number, Date, NIN]","[Phone_number, ID_Card, Date, NIN]","[Phone_number, Person, Date, NIN]","[Phone_number, Date, NIN]",[Date],"[ID_Card, Date]",[Date],"[ID_Card, Date]","[Phone_number, ID_Card, Date, NIN]","[ID_Card, Date, NIN]","[Phone_number, Date, NIN]",[Person],"[Phone_number, ID_Card, Date, NIN]","[Phone_number, ID_Card, Date, NIN]","[Phone_number, ID_Card, Date, NIN]",[Date],"[Phone_number, Date, NIN]","[Phone_number, ID_Card, Date, NIN]",[Date],[Date],[Date],[Person],[Date],[Date],[Date],"[Phone_number, ID_Card, Date]","[Person, Date]","[ID_Card, Date]","[Person, Date]",[Date],[Date],[Date],"[Phone_number, Person, Date, NIN]","[Phone_number, Religion, ID_Card, Nationality,...",[Date],"[Phone_number, Person, Date, NIN]",[Date],"[Phone_number, ID_Card, Date, NIN]",[Date],[Date],[Date],[Person],"[Phone_number, Date, NIN]","[Phone_number, Date, NIN]",[Date],"[Phone_number, ID_Card, Date, NIN]","[Date, NIN]","[Phone_number, ID_Card, Date, NIN]","[Phone_number, Date, NIN]","[ID_Card, Date]","[ID_Card, Date]",[Date],"[ID_Card, Date]",[Date],[Date],"[Phone_number, ID_Card, Date, NIN]","[Phone_number, Person, Date, NIN]",[Date],"[ID_Card, Date]","[Phone_number, Date, NIN]","[Phone_number, ID_Card, Date, NIN]",[Date],"[Phone_number, ID_Card, Date, NIN]","[ID_Card, Date]",[Person],"[Phone_number, ID_Card, Date, NIN]","[Phone_number, Date, NIN]","[Person, Date]","[Phone_number, Date, NIN]","[Phone_number, Date, NIN]",[Date],"[ID_Card, Date]","[Phone_number, ID_Card, Date, NIN]",[Date],[Date],[Date],"[ID_Card, Date]","[ID_Card, Date]","[Phone_number, ID_Card, Date, NIN]","[Phone_number, ID_Card, Date, NIN]","[Phone_number, Date, NIN]",[Date],"[Phone_number, ID_Card, Date, NIN]","[Date, NIN]",[Date],[Date],"[Phone_number, ID_Card, Date, NIN]",[Person],[Date],[Date],[Date],"[Phone_number, Date, NIN]","[Person, Date]","[Phone_number, Date, NIN]","[Phone_number, Date, NIN]",[Person],"[ID_Card, Date]","[Phone_number, ID_Card, Date, NIN]","[Phone_number, ID_Card, Date, NIN]","[Phone_number, ID_Card, Date, NIN]","[Phone_number, Date, NIN]",[Date],"[ID_Card, Date]","[Phone_number, ID_Card, Date, NIN]",[Date],[Date],[Date],[Date],"[Phone_number, ID_Card, Date, NIN]",[Date],"[Phone_number, Date, NIN]",[Date],[Date],"[Person, Date]","[Phone_number, Person, Date, NIN]","[Phone_number, ID_Card, Date, NIN]","[Phone_number, Date, NIN]",[Person],"[Phone_number, ID_Card, Date, NIN]",[Date],[Date],"[Phone_number, Date, NIN]",[Date],[Date],[Date],"[Phone_number, Date, NIN]","[ID_Card, Date]",[Person],[Date],"[Phone_number, Date, NIN]","[Phone_number, Date, NIN]",[Date],"[Phone_number, Date, NIN]","[Phone_number, Date, NIN]","[Phone_number, Date, NIN]","[ID_Card, Date]","[ID_Card, Date]","[Phone_number, ID_Card, Date, NIN]",[Date],[Date],[Date]
2,05304,47832,05156,us,55-330,se,06850,02539,2410-503,100576,01527,07869,de,06779,14621,07017,it,99444,08043-4719,24,74629,05060,77-300,1050,37126,57/A,2300,se,46025,6890,07201,62480,07201,80011,ROOM 56J,fi,03303,92,02113,12033,3400,3600,06779,133 38,2753,99444,68152,10,3206PM,3600,13591,2753,14701,14621,1130,02909,44121,23036,4600,80011,42289,07201,01606,100576,02842,14616,02842,100392,48413,03285,08638,us,90,02137,1030,07029,55132,80011,05443,49824,01527,02882,08096,07461,39049,03052,3260,24,1083,011675,164,68152,11100,47922,03031,83-300,100045,08053-1161,-74.45834,13900,50122,20022,31,20029,5547,6443,3830,2822,05340,12,07017,07010,us,82300,07930,03052,05035,21,2373,03872,690,25039,us,9,72474,681 31,4,1080,02113,2718,46025,10040,576 35,35,10049,47832,06320,25,03054,3303,28-230,80011,de,1040,06111,1080,03833,100045,28-230,22071,236,02703,02032,13900,23036,03588,se,05-532,2663,14149,14621,62480,06239,15065,2661VB,08721,46,238,3206PM,6890,02451,74629,38,06415,07869,03846,162 62,07869,10049,26852,10040,46149,08638,21,80011,49824,02465-2003,05060,03588,07029,22,22,8,13900,99,1,6447,62480,07010,03054,at,28.356452,3600,01056,02465-2003,681 31,14201,24,02912,41B,14127,23864,60320,6793,6111,8660,de,011675,48413,06705,37126,1,05340,23036,55-330,07739,57-511,3400,23864,pl,8,10040,fi,-75.032029,2373,1030,55-330,06415,14149,11,162 62,05647,1022,us,1294,14904,01022,80011,06239,2410-503,7362,08294,3343,39049,47877,21048,13900,6-8,us,42035,100045,39243,39013,LV-1024,72241,02322,40126,64-020,24,02113,2410-503,it,5650,1110,12033,48413,70504,02532-3223,05156,49847,07010,07461,02816,20029,2753,55-330,se,39018,02113,22071,07032,08204,95,02910,35432,2906,2373,41747,06515,18,166,28-230,de,2871,06415,80011,02703,62480,09526,80011,4600,01527,2065-311,08701,12405,38006,44124,03285,de,it,07040,23036,it,02816,us,07111,42026,06-440,us,73,1150,08003-1341,2300,23898,03031,24,16,26-333,2879,16,62480,02906,20022,011675,6606,25,1210,48,08096,06-440,01702,03466,8640,05440,LV-1024,6095,02184,62-300,1606,80011,2718,576 35,5650,40126,11100,02909,10,37121,02871,945,us,UNIT 139 C,03466,13433,14149,si,03052,42035,3343,7452,41B,3206PM,50122,06515,05340,44151,13811,39049,6,57-511,10040,13900,14701,40126,83-300,03031,51109,6-8,03285,47922,3343,06413,us,1294,136,21,14569,03266,05778,47826,24025,6095,68152,69,01056,us,06074,1294,09526,72241,1030,39011,07739,13591,05478,05443,25,55-330,100533,7452,it,47826,22071,us,47826,7452,14569,6580,02914,23036,5533,02909,5547,160,pl,03253,06320,13,06492,39011,02912,14617,08294,67,07010,01702,1070,07869,02816,28,2151,23036,21048,100045,082 75,03102,de,1210,02451,13433,55-330,14201,31400,51109,2065-311,90,at,1110,03285,35432,15819,26-300,01040,38840,5,06779,4,03102,02465-2003,97,05060,02871,06082,14904,1294,133 38,it,14621,13900,06515,08096,30200,48413,01702,80011,47011,41,13905,39011,02155,14569,7531,112,02871,07201,80011,74629,80011,44124,us,14149,7362,03060,21-013,02539,238,80011,01420,42035,98,07040,47011,39013,20022,80011,02816,14904,05443,5318,06239,90,1150,it,62480,06239,10044,01702,6095,3830,394 70,de,13905,06811,49847,15065,05647,38006,21048,06320,08294,62480,06779,06002,05-123,03102,02451,2661VB,9543,02912,7362,26-333,12033,lv,49847,4,07001,12033,18,133 38,06515,02816,02151,us,6095,13900,21077,4,02539,47832,13900,06447,2879,5650,20,69,26
3,72474,13900,7362,us,74629,us,3260,06415,02879,03846,80011,51109,se,7452,77-300,05-532,us,08721,1070,5,55-330,05060,03102,02703,02842,10,06415,it,26-333,06443,08003-1341,02912,02816,13433,ROOM 64J,us,03303,120,07001,05033,01056,1083,26-300,39049,2753,08043-4719,38840,26,46025,16031,1070,57-511,38840,14214,02919,576 35,02860,2753,68152,6890,05-532,99-418,03303,08053-1161,02842,08204,08721,23833,14201,2065-311,3260,si,46,42016,02816,100576,70504,03846,06492,72241,05401,1080,42016,133 38,02879,13433,20022,95,62480,05443,8,07040,11100,100576,06074,2661VB,42016,48413,28.953317,03846,02539,13900,2,07040,4,6447,51109,45B,14075,8,39011,08001,us,25039,2373,1004,05035,5,80011,57-511,1,1150,us,3343,2879,7362,120,02703,03060,2368,06057,9543,02920,54,06239,99-418,51109,88,06074,1022,05440,21048,es,6111,2410-503,46042,01475,02137,02539,02879,2,60437,06109,41747,23036,11100,be,02912,3588,1150,99-418,08001,02113,20022,23036,80011,153,30,46025,5472,20022,23898,8,7362,21077,1000,1080,1030,20862,03062-2258,02879,7362,07930,557,03244,21048,100045,12405,05778,05-123,6-8,24,2368,46025,108,136,13811,14904,55132,681 31,de,28.508385,14904,06606,13433,14214,08638,192,14616,5,100533,100560,55-095,1301,13905,03561,us,37126,06082,01930-3540,12405,26,13811,20029,08294,10044,4600,6890,14075,be,30/A,06515,es,39.484618,06-440,14214,55-330,01702,02137,28,49824,12033,14075,es,2065-311,60437,2410-503,05495,07461,14075,28-230,55-330,10,23036,02885,72474,14569,55,us,62-300,03588,7452,80011,08204,23865,06226,06413,23876,236,06239,72474,ro,03848,26845,01702,07029,LV-1024,1000,14621,07029,LV-1024,06779,26861,133 38,2661VB,2065-311,us,38006,14611,2151,96-130,02184,8,14006,06320,6443,57001,13900,6095,164,98,05440,us,6447,05033,99444,72241,02882,1083,01056,07461,6890,83-300,02879,100533,441 65,39013,02842,us,it,23898,2661VB,us,100533,de,99869,50670,07029,be,57/A,03102,03266,03466,02113,47832,97,1,06811,13905,5,07010,8640,08638,42016,21048,3,1150,6,1150,3260,99-418,39018,2871,06074,02914,03060,LV-1024,1083,6606,31400,90,576 35,03846,8640,24025,07739,10,212 36,06413,7/A,us,UNIT 199 C,03266,05443,06614,us,12405,07010,28,2753,164,01527,05647,47826,02906,681 31,80011,38840,67,20862,83-300,08638,02113,100560,06239,07869,70504,9,20862,15065,22,100560,it,06779,7a,112,3206PM,50122,02879,74629,02879,9543,08294,19,02871,be,07869,14611,39011,06066,05-123,14904,39011,02816,03819,02663,1103,31523,14127,74629,es,1294,8640,se,4600,4600,5650,23500,02909,6181,02879,23865,24,23,lt,37137,03588,4A,82300,02842,02184,05156,57-511,118,23865,06074,37126,13900,3830,138,100560,133 38,39013,99444,9223,06610,us,03588,02532-3223,08721,4600,06057,80011,02909,38840,11,us,02155,39243,02920,65-001,20862,06606,03285,8,02879,16,07869,80011,1872,03818,05472,5650,162 62,20862,38840,us,07201,14226,2065-311,12405,06010,02892,46149,07712,22071,17,21048,162 62,02920,13900,05655,179,47011,06610,05060,20029,06614,02871,it,82300,3830,39243,03253,03266,24,02151,05304,07010,98,06239,47011,22071,05-123,80011,38006,05-532,03052,05859,02113,73,08701,de,06320,02113,02184,99-418,07001,2300,42123,us,23864,24310,01527,47922,06415,12033,40126,05-074,6181,06851,2753,10044,6890,47832,14569,07040,6095,02912,13900,06850,07869,it,100576,65,01952,51109,25,74629,23036,05647,40126,it,10049,38006,03266,45B,01702,47832,06074,2410-503,7712,3206PM,64,43,16
4,02893,51109,02816,se,23898,us,41053,03466,13811,07029,24310,02169,it,2065-311,441 65,162 62,be,05443,14149,24,26-300,08721,05440,08742,14127,26,08003-1341,us,47922,44124,99-418,14904,50122,05443,ROOM 11J,us,23864,228,68152,03466,05340,03285,2753,4600,07001,08721,39243,228,07029,1083,25039,01952,02879,51109,2630-328,02842,02919,2753,06239,7712,1110,06074,22071,05-123,08204,08742,06320,39016,48413,54930,80011,be,593,02465-2003,681 31,01527,333 31,6890,08701,1080,3206PM,LV-1024,80011,25032,14611,03588,1000,179,02909,13591,29,06779,02816,6890,07201,23036,80011,06850,28.863564,14201,14621,3260,98,02113,277,5340,06610,65,5533,277,3600,05035,us,12405,5650,01605,576 35,113,13900,07040,164,06320,us,166,8640,7362,100;102,162 62,25032,128,6890,68152,02912,28,10049,06415,06851,300,08003-1341,6111,03054,2879,fi,2871,6890,02703,02072,100533,46149,02879,268,02882,06106,24310,07001,05778,us,576 35,13433,05-074,40131,02909,02879,08638,06779,08701,24,46,47922,49824,1000,25032,236,21077,77-300,48413,55132,03102,9543,06831,83-300,681 31,05495,10,47-370,6443,03588,03102,03102,14201,35,35,17,2373,354,290,21048,09526,09526,51109,cz,-75.226822,09526,02151,1150,06074,26-333,41B,23865,21,02842,13811,12569,02478,23864,03077,us,02904,05401,4452,24025,88,03303,38840,10040,10044,54930,6443,1056,us,45B,07461,es,27.921389,01527,05033,47826,51109,100533,5547,162 62,38006,1040,us,57-511,70504,39013,06850,26-300,05472,441 65,47826,42,08294,48529,2151,06850,75,it,05-532,03102,38840,06443,06002,39011,75321,3400,03275,153,55-330,72474,ro,1030,08742,77-300,5650,03285,02892,06074,02892,55132,2753,12405,39049,7452,133 38,us,02169,10040,21048,03076,576 35,113,38-430,02920,2893,48413,49847,39243,26,55,681 31,us,13811,05033,06614,16031,1050,02155,21048,7452,5650,03872,42016,1150,05647,21048,1080,us,us,20029,01952,us,24025,us,40010,99867,20022,it,67,02137,46149,03031,39049,44151,4A,90,46025,47011,38,02882,14075,1090,11100,7712,49,25039,91,37126,06-440,07201,38006,47011,681 31,46042,08294,14616,08204,6447,03052,279,62480,80011,40126,02465-2003,1080,16,05655,23864,502,us,UNIT 82 C,07869,06492,24025,pl,03052,1050,194,05743,5,07930,03102,20029,21048,06415,01056,01952,33,23898,31523,3206PM,9543,13811,06239,99-418,06320,97,2753,41053,20,02893,us,01952,516,50,03848,46149,1070,74629,02663,6181,03060,57/A,44124,us,05156,4408,23865,06320,1030,16031,LV-1024,100045,07849,08096,25,20862,42016,6181,us,1294,3400,us,74629,01952,07029,49846,42035,08294,05304,55132,22,11,us,99869,011675,749,80011,02155,08742,02780,02879,68D,333 31,03054,02842,47832,14214,593,47011,23036,2151,02816,01852,02539,us,06614,20022,37126,2661VB,48413,05-074,07739,133 38,54,it,60437,07001,10044,26-300,14611,06606,20862,1,54930,5,02539,24025,5,49824,80011,80011,07010,06239,03872,fi,3830,47922,6095,02879,05819,14569,03102,02893,49824,300,100560,02912,42035,26-333,14481,2,49824,13900,31400,68152,12405,44124,de,12405,77-300,38840,05156,06610,10,01040,02345,42289,20,03060,39013,06413,08053-1161,02465-2003,03102,51109,80011,02889,2661VB,900,03102,it,49824,6095,9620,03266,2065-311,01702,06606,us,03303,57001,06-440,07930,3830,03031,49824,100533,07461,46042,39049,9620,48413,05647,49847,20029,7452,55132,07869,03846,39018,fi,47922,11,6095,46149,354,2661VB,06779,3830,14075,pl,74629,03031,51109,10,03031,14214,77-300,01056,47011,06082,167,35,95


Presidio can't detect addresses, only Locations (cities, regions, mountains)   
It has problems to detect zip codes, house numbers or region abbreviations     
Cassed even detects house numbers as address

In [118]:
# Filter zip_code and house numbers
indi=[]
for i in range(df_address.shape[1]):
    for s in df_address.iloc[2:-1, i].values:
        s = str(s)
        if bool(re.fullmatch(r"\b(\d{5}|\d{2})\b", s)) or  bool(re.search(r"(?:[a-z].*?){2}", s)):      #check if its five or two digit number or it contains two letters ()
            break
    else:
        indi.append(i)
df_address.iloc[:,indi]

Unnamed: 0,location.1,location_id.5,city.41
0,[Address],"[Address, Geolocation]","[Address, Geolocation]"
1,[Other_data],"[Phone_number, ID_Card]","[Phone_number, ID_Card]"
2,ROOM 56J,-74.45834,28.356452
3,ROOM 64J,28.953317,28.508385
4,ROOM 11J,28.863564,-75.226822
...,...,...,...
98,ROOM 19J,-74.622737,28.012891
99,ROOM 146J,-75.22466,29.000363
100,ROOM 163J,-74.452212,-74.926844
101,ROOM 194J,-74.402687,28.007002


The column with room still can be an address, but the two lattitudes should only belong to geolocation

In [119]:
dessi_train[df_address.iloc[:,indi[1:]].columns]

Unnamed: 0,location_id.5,city.41
0,-74.458340,28.356452
1,28.953317,28.508385
2,28.863564,-75.226822
3,39.125028,27.700147
4,-15.471050,28.415501
...,...,...
95,-16.378117,-61.512690
96,-74.622737,28.012891
97,-75.224660,29.000363
98,-74.452212,-74.926844


In [120]:
# find indices of these two columns
indis = []
for e,i in enumerate(dessi_train.columns):
    if i == "location_id.5" or i == "city.41":
        indis.append(e)
dessi_labels_cleaned.loc[indis,:]

Unnamed: 0,label,split_type
4702,"Address,Geolocation",train
10660,"Address,Geolocation",train


In [121]:
dessi_labels_cleaned.loc[indis,"label"] = "Geolocation"
for ind in indis:
    wrong_columns.append(ind)

Credit Card Number

In [122]:
#Missed to credit card numbers
df_ccn = analyse_class("CCN")
df_ccn.head()

Unnamed: 0,uarrdsyjqvpz,client vat number,wnzigdnbecdl,voxhfyecngvb,cash card id,smetka nerezidenti.1,nxdqhzmftion,bank card number.3,danbroj,dmhloniyxwtn,alfa1,card number.1,debit card id,id.34,seller account,ebmkwmyqjjbq,card id,payment card number,intf cntpr id,intf ri tp orig code.1,xbygscenrlac
0,[CCN],[CCN],[CCN],[CCN],[CCN],[CCN],[CCN],[CCN],[CCN],[CCN],[CCN],[CCN],[CCN],[CCN],[CCN],[CCN],[CCN],[CCN],[CCN],[CCN],[CCN]
1,"[Date, Other_data]","[Date, Other_data]","[Person, Date, Other_data]","[Date, Other_data]","[Date, Other_data]","[Date, Other_data]","[Date, Other_data]","[Person, Date, Other_data]","[Other_data, GPE, Address, Geolocation, Date]","[Date, Other_data]","[Person, Date, Other_data]","[Date, Other_data]","[Date, Other_data]","[Other_data, GPE, Address, Geolocation, Date]","[Date, Other_data]","[Date, Other_data]","[Person, Date, Other_data]","[Other_data, GPE, Address, Geolocation, Date]","[Other_data, GPE, Address, Geolocation, Date]","[Date, Other_data]","[Date, Other_data]"
2,869935454005056,869978842033190,869954510277112,869917706008401,869917745689492,869937522787046,869909996521938,869992590710644,869999770894155,869906442518633,869926161502386,869955763776577,869936406252655,869948667169262,869920944848042,869917027855688,869996524200721,869983163659805,869908602155784,869919480696260,869905163418684
3,869927810021083,869916829359790,869945050845656,869966368641462,869985659355574,869945156266260,869987133504033,869933511717144,869946237729680,869950855879512,869932730150459,869984885835053,869950640363012,869914040967988,869939128683108,869967753283381,869914356540296,869983338012054,869920518192496,869931903137368,869908224514491
4,869951262014347,869986221162308,869993494327659,869980432148438,869948755528189,869909996521938,869919760677048,869908038761387,869947403973482,869936586342029,869999457534033,869997439269181,869960769888855,869990921797280,869930181943190,869924694553448,869912886830807,869992386049470,869909712494576,869935571040465,869922066186367


In [123]:
def luhn_check(card_number):
    """Check if a credit card number is valid using the Luhn algorithm. Implementation inspired by https://www.geeksforgeeks.org/luhn-algorithm/"""
    card_number = card_number.replace(" ", "")  # Remove spaces if any
    if not card_number.isdigit():
        return False  # Return False if it contains non-digit characters
    
    total = 0
    reverse_digits = card_number[::-1]
    
    for i, digit in enumerate(reverse_digits):
        n = int(digit)
        
        # Double every second digit from the right (1-indexed)
        if i % 2 == 1:
            n *= 2
            if n > 9:
                n -= 9  # Subtract 9 if doubling results in a number > 9
        
        total += n
    
    # Valid if total is a multiple of 10
    return total % 10 == 0

def contains_valid_credit_card(numbers):
    """Check if an array contains at least one valid credit card number."""
    for number in numbers:
        if luhn_check(number):
            return True
    return False


for i in range(df_ccn.shape[1]):
    if not contains_valid_credit_card([str(a) for a in df_ccn.iloc[2:-1,i].values]):
        print(i)
        


All columns contain valid credit card numbers due to the check sum algorithm, it is hard to figure out if presidio considered other options if the credit card is valid or not, presidio is wrong in not detecting them

In [124]:
df_date = analyse_class("Date")
df_date.iloc[[0,1,2,3,-1],:]

Unnamed: 0,date_account_closed,ncjfynkznere,date_account_opened,yonfgrhhcipw,activefrom.4,date_account_opened.1,hire_date.4,nfzndqloacsd,end_date.1,sdclbhqvzwiq,jlmqizcxwfvs,date_time_activated.12,deleted_date.17,fidyvxbcivtj,cxqucvgmdepk,ishufsvhndaf,txtimwgaxxmm,xqkwyqdhmoyg,jamwjeoijukj,call_start_datetime.13,rccvvsliuwnf,active_to,disconnected_at.2,lastpasswordchangeddate.2,hxtxqprtidjl,deleted_date.12,deleted_date.13,date_started_employment.3,created_date.13,nsodjjjkzgpd,birthday_id,date_employed_to,lastlogindateb,date.4,start_date.3,lastlogindate.1,order_date.1,db_tvr_cls_dt,wvaloveqccdo,hire_date.4.1
0,[Date],[Date],[Date],[Date],[Date],[Date],[Date],[Date],[Date],[Date],[Date],[Date],[Date],[Date],[Date],[Date],[Date],[Date],[Date],[Date],"[Date, NIN]",[Date],[Date],"[Date, NIN]",[Date],[Date],[Date],[Date],[Date],[Date],[Date],[Date],[Date],[Date],[Date],[Date],[Date],[Date],[Date],[Date]
1,[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Person],[Person],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],"[Phone_number, GPE, NIN, Address, Geolocation,...",[Other_data],[Other_data],"[Phone_number, Person, NIN]",[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data]
2,18.05.,08.09.,19.01.,08.04.,14.11.,23.12.,9.05.,24.06.,24.10.,27.05.,8.03.,17.03.,07.03.,10.08.,2.02.,22.08.,20.02.,24.07.,20.05.,22.05.,038 658 225,23.08.,28.05.,057-11-5612,28.12.,26.05.,5.02.,25.06.,08.03.,19.11.,07.11.,26.02.,30.08.,30.12.,02.09.,5.06.,25.12.,11.06.,01.06.,03.05.
3,9.07.,15.04.,8.02.,06.01.,04.12.,24.08.,5.03.,08.03.,25.03.,07.05.,6.12.,21.02.,05.08.,25.01.,4.06.,24.03.,23.08.,28.07.,4.10.,02.02.,660 217 712,24.12.,31.03.,654-41-1027,31.07.,15.07.,16.01.,10.12.,28.10.,07.01.,16.12.,17.11.,22.07.,16.02.,21.01.,16.11.,1.06.,3.10.,06.10.,02.04.
102,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,validation,validation,validation,validation,validation,validation,validation,validation,validation,test,test,test,test,test,test,test,test,test,test


Presidio can't detect specific date formats like dd.mm.

In [125]:
for c in ["rccvvsliuwnf", "lastpasswordchangeddate.2"]:
    print(df_date[c].values)

[list(['Date', 'NIN'])
 list(['Phone_number', 'GPE', 'NIN', 'Address', 'Geolocation', 'Organization'])
 '038 658 225' '660 217 712' '176 620 748' '645 116 021' '586 416 208'
 '354 774 606' '250 847 837' '825 861 164' '885 260 265' '522 316 801'
 '752 283 564' '118 347 301' '285 644 605' '315 388 058' '261 054 720'
 '266 580 778' '617 412 374' '658 147 764' '476 670 856' '602 534 521'
 '347 217 200' '317 465 524' '405 465 261' '276 586 724' '380 781 625'
 '527 433 254' '356 277 814' '776 082 356' '285 540 647' '016 216 889'
 '832 670 178' '026 685 776' '347 501 538' '142 762 764' '265 508 622'
 '611 854 464' '538 235 086' '832 852 057' '685 440 166' '265 073 452'
 '220 834 675' '083 582 270' '645 622 101' '665 441 754' '430 881 557'
 '884 520 339' '481 356 202' '016 812 869' '182 254 037' '471 188 060'
 '017 355 447' '260 812 532' '145 168 407' '035 672 146' '180 622 649'
 '674 106 851' '486 104 359' '486 116 809' '220 813 349' '482 035 870'
 '470 433 251' '168 023 729' '108 628 439' '1

In [126]:
# find indices of these two columns
indis = []
for e,i in enumerate(dessi_all.columns):
    if i == "rccvvsliuwnf" or i == "lastpasswordchangeddate.2":
        print(i)
        indis.append(e)
dessi_labels_cleaned.loc[indis,:]

lastpasswordchangeddate.2
rccvvsliuwnf
lastpasswordchangeddate.2
lastpasswordchangeddate.2


Unnamed: 0,label,split_type
4168,"Date,NIN",train
18592,"Date,NIN",train
20904,"Date,NIN",validation
27102,Other_data,test


In [127]:
indis = [18592, 20904]
dessi_labels_cleaned.loc[indis,"label"] = "NIN"
for ind in indis:
    wrong_columns.append(ind)
dessi_labels_cleaned.loc[indis,:]

Unnamed: 0,label,split_type
18592,NIN,train
20904,NIN,validation


In [128]:
df_email = analyse_class("Email")
df_email.iloc[[0,1,2,3,4,-1],:]

Unnamed: 0,email.8,whxwyaaclrhc,email_address_sid.8,city.32,personal_identity_number.19,email_sid.41,email_sid.51,ekszuwwqaaym,brtatrqkunkx,email.13,family_contact_email.24,ssnid.5,email_sid.21
0,"[Email, Person]","[Email, NIN]","[Email, NIN]","[Email, Address]","[Email, NIN]","[Email, Phone_number]","[Email, Phone_number]","[Email, Phone_number]","[Email, Person]","[Email, NIN]","[Email, Phone_number]","[Email, NIN]","[Email, Phone_number]"
1,"[Person, GPE, Nationality, Religion, Address, ...","[Phone_number, Date, NIN]","[Phone_number, Date, Organization, NIN]","[Phone_number, Person, GPE, Nationality, NIN, ...","[Phone_number, Date, NIN]","[Phone_number, Other_data, ID_Card, GPE, NIN, ...","[Phone_number, Other_data, ID_Card, GPE, NIN, ...","[Phone_number, Other_data, Religion, ID_Card, ...","[Person, GPE, Address, Geolocation]","[Phone_number, Other_data, ID_Card, NIN, Date,...","[Phone_number, Other_data, ID_Card, GPE, NIN, ...","[Phone_number, Person, ID_Card, Date]","[Phone_number, Other_data, ID_Card, GPE, NIN, ..."
2,Rodrigo Analise Merritt Felton,698-64-1806,714 083 557,"97 Via Giuseppe Garibaldi, Modigliana, Emilia-...",549-13-6384,146-8631308-7,71800942454,64 38 232 8978,Jairus Seth Knowlton,32146057897,84 6538 4523,ZZ221942T,1399 68837 3875
3,Janja,716-30-1313,508 145 380,"Pailakkatie, Sodankylä, Suomi",465-30-4015,+55 (061) 8999 6405,13165508378,7619608651,Riaan Angelique Meneses,49708352614,(061) 8558-6091,ZZ 526939 T,41 7391-5100
4,Ellison Ike Hall Fortune,354-21-3931,370 528 432,"20 Moulton Avenue, Greenland, New Hampshire 03...",140-11-0700,5124273569,106.378.4050x63511,+ 91 4351 040879,Margo,30469187522,13072658878,ZZ 11 66 63 T,(6482)958 535
102,train,train,train,train,train,train,train,train,test,test,test,test,test


In [129]:
for i in df_email.columns:
    for v in df_email[i].values:
        if "@" in str(v):
            print(i)

In [130]:
indis = []
for e, (i, t) in enumerate(zip(dessi_all.columns, dessi_all.iloc[-1,:])):
    if i in df_email.columns and df_email.loc[102,i] == t:
        print(i)
        indis.append(e)
dessi_labels_cleaned.loc[indis,:]

email.8
whxwyaaclrhc
email_address_sid.8
city.32
personal_identity_number.19
email_sid.41
email_sid.51
ekszuwwqaaym
brtatrqkunkx
email.13
family_contact_email.24
ssnid.5
email_sid.21


Unnamed: 0,label,split_type
1219,"Email,Person",train
1971,"Email,NIN",train
3609,"Email,NIN",train
7891,"Email,Address",train
9106,"Email,NIN",train
11289,"Email,Phone_number",train
13786,"Email,Phone_number",train
17582,"Email,Phone_number",train
26687,"Email,Person",test
28445,"Email,NIN",test


In [131]:
#None of them contains an Email so all are wrong
for i in [0,8]:
    dessi_labels_cleaned.loc[indis[i],"label"] = "Person"
for i in [1,2,4,9,11]:
    dessi_labels_cleaned.loc[indis[i],"label"] = "NIN"
dessi_labels_cleaned.loc[indis[3],"label"] = "Address"
for i in [5,6,7,10,12]:
    dessi_labels_cleaned.loc[indis[i],"label"] = "Phone_number"
for ind in indis:
    wrong_columns.append(ind)
dessi_labels_cleaned.loc[indis,:]

Unnamed: 0,label,split_type
1219,Person,train
1971,NIN,train
3609,NIN,train
7891,Address,train
9106,NIN,train
11289,Phone_number,train
13786,Phone_number,train
17582,Phone_number,train
26687,Person,test
28445,NIN,test


**All these columns are wrong labeled there is no email address in there!**

In [132]:
df_gpe = analyse_class("GPE")
df_gpe.iloc[[0,1,2,3,4,102],:]

Unnamed: 0,state_disctrict,district,vkqsrnnbfnct,placeregion,residence_region,region.2,statedistrict,vhbbuoqdfdwm,htetqgogyoum,regionname,region_name.1,state_or_region.1,district.1,region.3,region.4,residence_region.1,placeregion.1,fkgimpenuxin,saancoqrkvjn,ylpqczfrfjzi,state_or_region.3,partofstate,district.2,state_disctrict.1,czpfcocjvovz,partofstate.1,state_disctrict.2,regionname.1,state_disctrict.3,district.3,partofstate.2,znxnfdhikpam,district.4,state_or_region.4,state_disctrict.4,sclidhkxsgsj,uxedrlhoqwfs,partofstate.3,utibnmzdbbgk,district.5,rwvvpesxwycu,partofstate.4,state_or_region.5,district.6,region.14,partofstate.5,agvnpmgnasti,state_or_region.7,statedistrict.1,state_or_region.8,placeregion.2,partofstate.6,region.19,tucdeiyfguxg,residence_region.2,state_disctrict.5,residence_region.3,placeregion.3,region_name.3,placeregion.4,statedistrict.2,kyfbfndjhrbf,partofstate.7,statedistrict.3,iibapwayertc,state_disctrict.6,state_disctrict.7,region.25,partofstate.8,region.26,regionname.2,regionname.3,region_name.4,partofstate.9,state_or_region.9,state_or_region.10,statedistrict.4,state_disctrict.8,rrqrtqqijblq,cvcycjqeccwh,dvwbsqycdlts,partofstate.10,state_disctrict.9,azvlopulbmbn,region_name.5,region.31,region.32,region.33,ssbgcarxcjzm,partofstate.11,osuhnxlacmif,ysitxblngktq,mwemjsbdbpcc,partofstate.12,region_name.6,oyhgzeobpxmr,placeregion.5,state_disctrict.10,district.7,district.8,partofstate.13,district.9,ughdhomyuivv,region.40,evluxalwfodq,statedistrict.5,district.10,region_name.7,dybxwcdfgovq,vtfopfbqxurc,region.41,statedistrict.6,residence_region.4,zqnbjxksxueq,znmdtpzhbjek,zxleigjdgljj,zcztgkfbpyhd,rvxhnpxjiyjq,statedistrict.7,regionname.4,regionname.1.1,district.11,district.1.1,district.2.1,state_disctrict.11,partofstate.14,region_name,state_disctrict.1.1,region.5,state_or_region.1.1,pmylvyapjvhg,district.3.1,ntqwxrbyngnm,residence_region.5,region.10,region.12,statedistrict.1.1,region.13,statedistrict.2.1,partofstate.1.1,placeregion.6,bvnblrfyipdt,bqnfntwgndsc,district.4.1,partofstate.2.1,region.20,daqjlfabyezv,region.21,rbxdkgouwviz,state_disctrict.2.1,region.28,placeregion.1.1,itnrypxxujon,residence_region.1.1,state_disctrict.3.1,region,statedistrict.8,statedistrict.1.2,region.2.1,lnwpxxdkmwbk,cymnqgrxqldb,district.12,residence_region.6,psdzdiefiuaw,state_disctrict.12,regionname.5,ryzfiuutvjcb,state_or_region,district.1.2,state_disctrict.1.2,muaefqabibua,district.2.2,statedistrict.2.2,state_or_region.2,kvexqumfrago,region_name.2,statedistrict.3.1,district.3.2,xgtnrvnxpybu,state_disctrict.2.2,state_disctrict.3.2,yuhgdtdeltot,statedistrict.4.1,qvqdzjmvesez,district.4.2,statedistrict.5.1,region.21.1,state_disctrict.4.1,zhjuhnpmwiav,statedistrict.6.1,tremlgjueqiz,placeregion.7,state_disctrict.5.1
0,[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE]
1,[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Person],[Other_data],[Other_data],[Person],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Person],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Person],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Person],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Person],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],"[Religion, Nationality]",[Other_data],[Other_data],[Other_data],[Other_data],[Person],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Person],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Person],[Other_data],"[Religion, Nationality]",[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Other_data],[Person],[Other_data],[Other_data],[Other_data],[Other_data]
2,district,PartOfState,StateDistrict,residence_region,PlaceRegion,region_name,StateDistrict,PartOfState,RegionName,residence_region,residence_region,RegionName,state_disctrict,RegionName,region,PlaceRegion,Region,PlaceRegion,region,region,PlaceRegion,state_disctrict,StateDistrict,StateDistrict,PlaceRegion,PartOfState,district,region,StateDistrict,state_disctrict,district,PlaceRegion,PartOfState,Region,district,PartOfState,district,StateDistrict,region,state_disctrict,Region,StateDistrict,PlaceRegion,district,Region,PartOfState,PartOfState,region,StateDistrict,residence_region,state_or_region,district,residence_region,state_or_region,residence_region,StateDistrict,state_or_region,RegionName,Region,state_or_region,StateDistrict,region_name,StateDistrict,StateDistrict,Region,district,district,residence_region,StateDistrict,RegionName,Region,residence_region,region_name,StateDistrict,Region,Region,district,district,StateDistrict,PlaceRegion,Region,state_disctrict,state_disctrict,residence_region,residence_region,region_name,Region,region_name,PartOfState,PartOfState,district,state_or_region,state_disctrict,state_disctrict,residence_region,state_disctrict,state_or_region,StateDistrict,district,state_disctrict,state_disctrict,PartOfState,PartOfState,RegionName,PartOfState,StateDistrict,state_disctrict,Region,StateDistrict,residence_region,Region,district,RegionName,district,PartOfState,state_or_region,RegionName,PartOfState,state_disctrict,PlaceRegion,RegionName,district,PartOfState,StateDistrict,district,PartOfState,PlaceRegion,district,Region,region_name,district,state_disctrict,region_name,state_or_region,PlaceRegion,residence_region,state_disctrict,region_name,state_disctrict,district,state_or_region,district,PartOfState,StateDistrict,state_disctrict,region,PartOfState,Region,PlaceRegion,StateDistrict,residence_region,Region,district,residence_region,district,RegionName,district,state_disctrict,PlaceRegion,state_disctrict,StateDistrict,state_disctrict,Region,state_disctrict,PartOfState,state_or_region,PlaceRegion,PlaceRegion,state_disctrict,PartOfState,residence_region,state_disctrict,PartOfState,RegionName,PartOfState,region,state_disctrict,StateDistrict,district,StateDistrict,state_disctrict,residence_region,district,district,state_disctrict,PartOfState,RegionName,district,state_or_region,StateDistrict,StateDistrict,residence_region,state_disctrict
3,PartOfState,district,StateDistrict,Region,region_name,state_or_region,StateDistrict,state_disctrict,state_or_region,region,residence_region,state_or_region,district,region_name,PlaceRegion,residence_region,PlaceRegion,PlaceRegion,state_or_region,residence_region,residence_region,district,StateDistrict,district,RegionName,PartOfState,StateDistrict,RegionName,PartOfState,district,StateDistrict,PlaceRegion,PartOfState,residence_region,PartOfState,StateDistrict,district,StateDistrict,PlaceRegion,state_disctrict,residence_region,district,region,district,region,state_disctrict,PartOfState,region_name,StateDistrict,state_or_region,residence_region,StateDistrict,region,RegionName,residence_region,state_disctrict,PlaceRegion,region_name,residence_region,PlaceRegion,district,state_or_region,state_disctrict,district,residence_region,StateDistrict,PartOfState,PlaceRegion,state_disctrict,RegionName,state_or_region,residence_region,region,StateDistrict,state_or_region,region_name,state_disctrict,state_disctrict,PartOfState,region,region,StateDistrict,state_disctrict,state_or_region,RegionName,region,RegionName,residence_region,StateDistrict,district,state_disctrict,region_name,state_disctrict,district,PlaceRegion,PartOfState,region,district,district,district,StateDistrict,state_disctrict,district,residence_region,district,state_disctrict,district,state_or_region,PartOfState,Region,Region,StateDistrict,region_name,StateDistrict,StateDistrict,residence_region,region_name,district,PartOfState,PlaceRegion,RegionName,state_disctrict,district,PartOfState,StateDistrict,PartOfState,PlaceRegion,StateDistrict,region_name,residence_region,StateDistrict,PartOfState,region,region_name,residence_region,state_or_region,state_disctrict,region,StateDistrict,district,region,StateDistrict,StateDistrict,district,StateDistrict,region_name,PartOfState,region_name,region,PartOfState,region_name,RegionName,StateDistrict,state_or_region,state_disctrict,RegionName,district,state_disctrict,PlaceRegion,district,PartOfState,district,Region,district,PartOfState,region_name,Region,RegionName,district,StateDistrict,state_or_region,district,district,region_name,PartOfState,RegionName,PartOfState,StateDistrict,district,district,state_disctrict,Region,district,district,state_disctrict,PartOfState,region,state_disctrict,PlaceRegion,state_disctrict,PartOfState,Region,PartOfState
4,StateDistrict,StateDistrict,district,Region,residence_region,Region,state_disctrict,district,Region,residence_region,Region,region,StateDistrict,RegionName,Region,residence_region,region,PlaceRegion,region,Region,Region,PartOfState,district,PartOfState,residence_region,state_disctrict,StateDistrict,region,StateDistrict,district,StateDistrict,residence_region,district,region,StateDistrict,district,state_disctrict,StateDistrict,PlaceRegion,StateDistrict,RegionName,state_disctrict,residence_region,district,region,PartOfState,StateDistrict,RegionName,district,region,state_or_region,PartOfState,region_name,residence_region,PlaceRegion,PartOfState,state_or_region,region,PlaceRegion,residence_region,district,residence_region,StateDistrict,state_disctrict,Region,StateDistrict,StateDistrict,RegionName,state_disctrict,region_name,residence_region,region,region,PartOfState,residence_region,PlaceRegion,PartOfState,district,district,region_name,Region,StateDistrict,state_disctrict,residence_region,residence_region,RegionName,Region,state_or_region,StateDistrict,state_disctrict,state_disctrict,state_or_region,StateDistrict,StateDistrict,PlaceRegion,PartOfState,region,PartOfState,PartOfState,district,PartOfState,state_disctrict,PartOfState,RegionName,PartOfState,StateDistrict,state_disctrict,Region,district,PlaceRegion,state_or_region,PartOfState,Region,state_disctrict,PartOfState,residence_region,residence_region,PartOfState,PartOfState,Region,residence_region,state_disctrict,state_disctrict,PartOfState,district,PartOfState,Region,StateDistrict,state_or_region,state_or_region,state_disctrict,district,residence_region,residence_region,region,PlaceRegion,PartOfState,PlaceRegion,PartOfState,state_disctrict,RegionName,StateDistrict,district,StateDistrict,district,Region,district,state_or_region,residence_region,StateDistrict,residence_region,region,PartOfState,Region,district,Region,state_disctrict,state_disctrict,Region,district,district,PartOfState,RegionName,district,state_disctrict,RegionName,state_or_region,PlaceRegion,district,StateDistrict,Region,state_disctrict,state_disctrict,region_name,PartOfState,region_name,district,district,district,PartOfState,district,Region,state_disctrict,StateDistrict,StateDistrict,StateDistrict,state_or_region,district,region_name,state_disctrict,state_disctrict,state_or_region,StateDistrict
102,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,validation,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test


In [133]:
df_gpe = analyse_class("GPE", focus = "true positives")
df_gpe.iloc[[0,1,2,3,4,102],:]

Unnamed: 0,state,countyname,ywpjaeadqwwj,province,kwwjshqmkqyy,haupfnryhrgq,state.1,postal_code,fzcpjefhgmdt,gpo,at,state_name,postal_code.1,ansi,tiggjgnzixdn,cc3,ygomngppzuda,lgsqmkiqdxhb,dnekjzbhenls,lzabyfqxizwk,name_of_state,sfkfogktoawk,province_title,state_name.1,country_origin,countrycode,gpo.1,ansi.1,uxpphqphrcwv,provincename,gpo.2,qezzlqnunejw,iunpgnipuzgd,ansi.2,countymunicipalityregion,name_of_county,at.1,cc3.1,gpo.3,ansi_abbr,state.3,usps,municipality,county.3,sfihqkwdkgob,cc3.2,ansi_abbr.1,zip_code.5,countrycode.1,postal_code.3,ansi_abbr.2,postal_code.4,province_title.1,iso_code,country_iso,county_municipality_region,iso_code.1,iso,ycztqwzpiqxu,inqttnjgzuoj,country.6,at.2,nxowfjuzcwdn,ykzqwypbhxrs,municipality.1,provincename.1,qbrspwazmskx,iso.1,municipality.2,at.3,at.4,state.4,country_iso.1,province.2,zip_code.7,iso_code.2,wb_region,lnvbmrvxqejs,gipmbavomlkq,postal_code.7,ansi.3,cc3.3,wb_region.1,ansi.4,cc3.4,county.6,lwvssgnppicx,state_or_region,postal_code.8,country.8,country_code.3,cc3.5,county.8,nzjgqccdtllm,dwtwqbbeapcp,state_code,mevatxuxcenl,state.5,province_name,fgiwkydwgrnp,biclikgcugzy,zip_code.11,kchgrgvwqqzc,country_code.5,region_name,state_code.1,znjysnqyssbe,city.6,uwozdftuvisv,cc3.6,state.6,wkhmjaiivrqw,qpogavoprhap,nwmnodjfrece,state.7,ikyowjkgewfm,mdcchelmrejp,iwivpwydaqto,state_name.2,entzgyqrmlhm,state_name.3,country_origin.1,usps.1,iso.2,gpo.4,province.4,bliryjeokamg,xlcvdpiiopxf,jhegtuhkqtmk,placename,province.5,country_name,country_iso.2,cc3.7,cc3.8,smqgmtfpmhgp,gpo.5,iso_code.3,rusvixcepfgn,country_name.1,alneuzlfamyx,countrycode.2,fjiclhznzqon,province.6,wtarqldcfulg,state.8,county.9,ansi_abbr.3,anjawwaqvuaq,country.14,name_of_state.1,ansi_abbr.4,vmcvyjvbbylv,dhwhsjtrpaqi,lzcpxbtumsbk,municipality.5,hszlgepooukq,location.2,lzavtvygakvd,utwkquevjywc,usps.2,cc3.9,wkzoegaunrtv,state_name.4,ygjchphffzgy,postal_code.12,wjlhysslkfax,country_code.6,sqpufsrkibln,state_code.2,usps.3,state.9,lagljrllasyv,country.15,kbllvstkllhj,idiavootfluc,state.11,location.4,tvouguoduddn,country.17,country.18,gpo.6,countrycode.3,tajriqhabrdk,city_name,wsarolyudldo,ubnbojcbzsry,location.5,iso_code.4,rmtuymtuutzk,zip_code.14,country.24,mguylpoftywm,state_name.5,usps.4,sgyrrzprjlzb,at.5,country.26,fjcipzffzyhc,cc3.10,county_municipality_region.1,qiwyfskkpatw,kmzwvcxfzbsj,pygfjdkoycuj,state_code.3,state.12,hwpvouurkyck,ebdeuxsqecif,gpo.7,county.11,zrhldqifmptl,residence_province,dffqmpmmuawg,usps.5,wb_region.2,rdtpglgngqwg,usps.6,usps.7,county_municipality_region.2,origin,xpdckompdjem,country.30,postal_code.13,rqwaqryrkxvr,vtisbywnznma,province_title.2,hxexmtgnacnd,ansi_abbr.5,state_name.6,cc3.11,city.13,zip_code.18,name_of_state.2,residence_county,state_or_region.2,location_of_residence,ansi_abbr.6,trtplmoimyst,municipality.7,country_code.8,residence,iso_code.5,typsktsyedhf,ansi.5,gpo.8,county.12,qcledfhyrljt,cc3.12,mqwknyvxseyn,postal_code.16,municipality.8,icvtlzhmllvg,country_name.2,engcjzrcbkdn,state_name.7,county_municipality_region.3,cc3.13,ansi_abbr.7,country_origin.2,country_origin.3,uscg,state_name.8,state_name.9,name_of_municipality,at.6,vespacwhzccq,fdfgnumhzyba,country.36,yzofbawjgvnk,country_code.9,cc3.14,state.14,ansi_abbr.8,country.37,uyrzbvfefpqi,county_name,county_name.1,state_name.10,state.15,location_of_residence.1,sphfltezfqgh,location_of_residence.2,gpo.9,vwlhwwggjria,gpo.10,name_of_municipality.1,ansi.6,county_municipality_region.4,country_name.3,cc3.15,state.16,cc3.16,municipality.9,ansi.7,state_code.4,qdqrkivzahiu,country.38,county.13,iso.3,zhskpqmazhfz,...,uwmrjrsffdgn,gpo.2.1,municipality.1.1,uwnlklvfggig,xihixzlhqjny,state_code.1.1,name_of_state.1.1,gsjehpwhahpm,municipality.2.1,cityname,bbgpgbhbphup,name_of_state.2.1,wb_region.1.1,lpzjpwmarxhi,countrycode.2.1,countymunicipalityregion.2,location.3,name_of_state.3,zunzvkmmspys,residence_county.3,country_origin.1.1,country.8.1,country_iso.3,yzwczdcesydb,wb_region.2.1,gpo.3.1,rpyxrmvqczrb,state_code.2.1,deycveduudnr,countymunicipalityregion.1,xcengnonfrta,country.9,country.10,origin.2,wb_region.3,usps.2.1,county.5,state_name.3.1,at.1.1,dnshuqohejkw,state_name.4.1,usps.3.1,countrycode.3.1,origin.3,zip_code.7.1,state_or_region.1,uscg.3,kzvcypnsgfzd,place.1,state_code.3.1,nsrwxolssvwq,zip_code.8,agdexogokgyi,qjpsgbmytnia,county_municipality_region.1.1,iso.1.1,zip_code.9,state.11.1,trpbzdqsrjtl,ansi_abbr.1.1,iducavrufhap,country_name.4,state.12.1,ehupmfsqjcfq,rsmwlvlamuzq,nipkwivkuaji,molclcgnvnsa,zip_code.11.1,unwjykuqljhs,state_code.4.1,wgavpozowynr,zfsngvqbwtnl,lnxhafvzimaf,iso.2.1,location_of_residence.1.1,state.13,county_municipality_region.2.1,jjuvwfzcrdmb,state.14.1,gpo.4.1,state_name.5.1,name_of_state.4,hqcpbgmzearn,country.13,ansi.1.1,wb_region.4,country_origin.2.1,ztmpmqodjbes,wumtaptdekxv,uscg.4,emmolhrskthf,lhksunizninb,cc3.3.1,gixxqszqojoz,state_name.6.1,usps.4.1,trkgydtonfox,hwvtsrfksiea,postal_code.9,state.16.1,gpo.5.1,avqgxpnpmvua,location.6,place.2,at.2.1,state.17,gpo.6.1,iso.3.1,cdlnlebcwhyo,state_code.5,bnqitulxmhda,zkxzlqgqprqk,state.18,postal_code.11,county.6.1,gpo.7.1,origin.4,state.19,name_of_county.2,residence_county.1,iso.4,cc3.4.1,provincename.1.1,countyname.2,state_name.7.1,state_name.8.1,gpo.8.1,country.15.1,state_name.9.1,wmumjdtzubdo,countrycode.4,xrisbdkenknr,state.20,gpo.9.1,country_origin.3.1,state.21,county.9.1,state.22,oquagcrwvnxn,country_name.5,eqzknycejwkj,gpo.10.1,state_or_region.3,ansi_abbr.2.1,qoxbpedmovku,onjhfxteyord,county.11.1,iso.5,kpkyvgkdusrw,usps.5.1,urehouksaylr,state_name.10.1,wb_region.5,ndylnkybpjmy,state_code.6,residence_province.2,state_name.11,name_of_state.5,country_origin.4,municipality.7.1,kzemgyyxxtha,country_origin.5,yivecxlfualu,usps.6.1,countrycode.5,state.23,ilufwqkkixck,gpo.11,city_name.2,cc3.5.1,ansi_abbr.3.1,country_code.6.1,nvtcefykqnir,yaknxiihkusl,at.3.1,ansi.2.1,countrycode.6,ietnlvxyhfsk,country.21,country.22,ipyuxagrorhv,imuuuwdeueix,mgexucrrxnxz,residence_county.2,countrycode.7,uqmlzlbkcfkq,county.14,residence.1,ubqkewogbjoi,gpo.12,country_name.6,sdbrhrfujokv,jwpgzkwlnbil,onotzrztafxf,wb_region.6,from,country_name.7,from.1,gpo.13,kudywablynbe,pzwsktprpclk,xruklplsuxpk,at.4.1,origin.5,country_name.8,origin.6,country.24.1,location.11,gpo.14,country_origin.6,country_name.9,country_name.10,qhdjepghsioz,cc3.6.1,zjtxfpxncjfc,eznsrfzatdhr,ansi_abbr.4.1,xwubtlbwexay,cc3.7.1,postal_code.15,iso.6,name_of_municipality.2,xljwyidgkhsj,gpo.15,state_name.12,cc3.8.1,iso.7,gpo.16,yufgpgzswahu,country_name.11,country.27,thkqtmdovnpl,uscg.5,country_origin.7,wylqgykrhvhu,state.25,wb_region.7,utzqpobybqwm,gpo.17,province_title.1.1,copamukgobae,state_name.13,cpeyhifnsnnl,province.5.1,gnaacogcxlgu,iso_code.6,ansi_abbr.5.1,province.6.1,origin.7,iso_code.1.1,province.7,state_name.14,mercqhwjfzzp,state_name.15,aemlmtkssggb,ansi.3.1,iso_code.2.1,dbiyuywmzfwb,usps.7.1,country.30.1,placename.1,etlisuxozibn,name_of_state.6,name_of_county.1,state.27,ahywspbrnhfk,iso.8,twiwgnyjnrjw,ymkuamfdyosr,gpo.18,name_of_state.7,baecpkefszpw,name_of_municipality.1.1,sknybfkqoyuo,uhpoawsgqdfi,gpo.19,postal_code.16.1,state.28,provincename.2,country_name.12,state.29,gpo.20,zip_code.31,ystpzczpjclo,state_code.7,uscg.6,cc3.9.1,utqmmmikbkqx,tnxouedlieev,ojekqiaiuazj,countrycode.8,country.33,eswntqgksivd,kbrlqslcvorx,ansi.4.1,state_name.16,lvtdopxrsfbo,city_name.1,residence.2,vnpsaqxvggty
0,[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],...,[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE],[GPE]
1,"[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation, Date]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Religion, GPE, Nationality, Person, Address, ...","[Person, GPE, Address, Geolocation, Date]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[GPE, Address, Date, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation, Date]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Religion, GPE, Nationality, Address, Geolocat...","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation, Date]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation, Date]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation, Date]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Religion, GPE, Nationality, Person, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation, Date]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation, Date]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation, Date]","[Religion, GPE, Nationality, Person, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation, Date]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation, Date]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Religion, GPE, Nationality, Person, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation, Date]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Religion, GPE, Nationality, Address, Geolocat...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Religion, GPE, Nationality, Person, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Religion, GPE, Nationality, Person, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[GPE, Address, Date, Geolocation]","[Person, GPE, Address, Geolocation, Date]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation, Date]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]",...,"[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[GPE, Address, Geolocation]","[GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation, Date]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Religion, GPE, Nationality, Person, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation, Date]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Religion, GPE, Nationality, Address, Geolocat...","[Person, GPE, Address, Geolocation, Date]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Religion, GPE, Nationality, Person, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation, Date]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation, Date]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation, Date]","[GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation, Date]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation, Date]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Religion, GPE, Nationality, Address, Geolocat...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation, Date]","[Person, GPE, Address, Geolocation]","[GPE, Address, Date, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation, Date]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Religion, GPE, Nationality, Person, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation, Date]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Nationality, Religion, Address, ...","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]","[Person, GPE, Address, Geolocation]"
2,hungary,Jastrzębie-Zdrój,panama,Sondrio,"MELBOURNE, FL",gmina Kórnik,CMR,"BRUSSELS, IL",italy,"MILWAUKEE, WI",luxembourg,egypt,"EAST ELLIJAY, GA","DURAND, WI",guatemala,spain,"ALVARADO, TX",mozambique,Bergamo,"DANIELSON, CT","LITTLE FALLS, MN","ROSEBUD, TX",Bergamo,"GROVETON, NH",chile,south korea,"CHEYENNE, OK","TRACY CITY, TN",cr,Lugo,Netherlands,"LAS VEGAS, NV","PLAINFIELD, NJ","WOODBURY, MN",powiat oleski,Napoli,guatemala,"PINEVILLE, LA","OAKLAND PARK, FL",Germany,"CLARKSDALE, MO",papua new guinea,UTI delle Valli e delle Dolomiti Friulane,"JEFFERSON COUNTY, CO",EST,KHM,"SILVERTON, OR",jersey,"AURORA, MN",GNQ,algeria,"CHARLESTON, WV",Pavia,Ustukran,united arab emirates,gmina Biała Piska,"TRUMANN, AR",india,"BILOXI, MS",poland,canada,mx,"BEULAH, ND","MANTEO, NC",Town of Middletown,Huesca,Cremona,jersey,gmina Lutomiersk,"MARINA DEL RAY, CA",benin,cyprus,"WALNUT RIDGE, AR",Lecco,switzerland,greece,"CARROLLTON, MO",Slovensko,"FOUNTAIN, CO","PORT ST. LUCIE, FL",denmark,canada,greece,russia,morocco,"FORT DEPOSIT, AL",monaco,"LOS ALAMITOS, CA",Papua New Guinea,philippines,russia,"CROSS PLAINS, TN",jersey,Como,latvia,lithuania,portugal,"RENO, NV",Pavia,"MATTESON, IL",nh,Gerede,south korea,georgia,residence_region,costa rica,argentina,Wrocław,nigeria,"MELVIN, TX","HENDERSON, NV",Unione dei comuni Valle del Savio,Corinth,Ávila,"LOUISVILLE, CO",kz,"HITCHCOCK, SD",australia,"HUNTINGTON BEACH, CA",Windsor County,united states,Peru,"PFLUGERVILLE, TX",south africa,jersey,Lecco,turkey,argentina,"CHOKIO, MN",Peabody,Pavia,taiwan,nicaragua,"LIGNITE, ND",portugal,Bezirk Reutte,"BLACKBURN, MO",ukraine,KIR,france,bh,"COLOMA, WI",oman,Brescia,ukraine,"WAUKOMIS, OK",papua new guinea,hungary,ISR,cyprus,"ESTHERVILLE, IA",bulgaria,Helsingborgs kommun,cayman islands,slovenia,Vila Real,"IPSWICH, SD","CALABASAS, CA",slovakia,Philippines,"MONROE, LA",qatar,Sweden,venezuela,"LANTANA, FL",mx,japan,"ROSELAND, NE",jersey,"COPPERAS COVE, TX","LENOIR, NC",china,finland,ut,cu,"SANTA PAULA, CA",france,Gansu,"CORNING, AR","PENDLETON, OR","SAN RAFAEL, CA",sweden,sri lanka,PLW,Hartford,"DANBURY, CT","DECKER PRAIRIE, TX","WOOD DALE, IL",Flores Island,jamaica,egypt,"BAINBRIDGE ISLAND, WA",Pavia,ghana,"ANDOVER, SD","ANTIOCH, IL","GRANTVILLE, GA",hungary,"MARCO ISLAND, FL","DURHAM, NH",gmina Czersk,Tonga,kazakhstan,Olsztyn,"WEST CHESTER, OH",taiwan,"NORTH ZULCH, TX",namibia,"FARMERS BRANCH, TX",portugal,"SHOREWOOD, IL",Sondrio,"KENNESAW, GA",macedonia,colombia,South Africa,Australia,"LAWRENCE, NE",Rimini,"COLUMBUS, IN",Forlì-Cesena,"CEDAR HILL, TX",lebanon,Marktgemeinde Reutte,"PROVIDENCE, KY",Cremona,hong kong,Bulgaria,"VALENTINE, NE","CARLISLE, IA",Uppsala,"MERKEL, TX",australia,powiat ciechanowski,"LUTESVILLE, MO",okres Nové Zámky,"SOUTHAVEN, MS",São Tomé and Príncipe,gmina Długołęka,turkey,Stadt Kufstein,bosnia and herzegovina,md,"EAST PEORIA, IL","HODGENVILLE, KY",Kreis Kleve,germany,Uganda,south africa,poland,Malbork,"CEDAR RAPIDS, IA",md,"MILFORD, KS",lithuania,Castelo Branco,vietnam,benin,israel,"EMINGTON, IL",GHA,papua new guinea,cyprus,okres Klatovy,algeria,Rochester,MCO,canada,"RIFLE, CO","FROMBERG, MT","FORESTVILLE, WI",ETH,"RED BANK, NJ",Big Bear,mexico,powiat bielski,Ordes,"SARANAC LAKE, NY","CAMDEN, IL",Hamburg,nigeria,Saint Albans,"THOMASVILLE, GA","LAMBERTON, MN",venezuela,Menorca,egypt,Salten-Schlern - Salto-Sciliar,thailand,"ROCHELLE, IL","HEWITT, TX",latvia,Unione Reno Galliera,GRC,Croatia,cayman islands,"WESSINGTON SPRINGS, SD","NASSAU BAY, TX",taiwan,"RUSH SPRINGS, OK",...,"CHANUTE, KS",india,Raiguer,Marèo - Enneberg - Marebbe,Cayman Islands,algeria,cameroon,lebanon,gmina Góra,Worcester,italy,"LEOPOLIS, WI",mw,morocco,qatar,Oeiras,brazil,azerbaijan,"BRAMAN, OK",powiat piski,"MAYFIELD, KS",uruguay,"CHASEBURG, WI",Philippines,thailand,"SEALY, TX",croatia,ky,Forlì-Cesena,UTI del Friuli Centrale,"AFTON, OK",vietnam,mz,Myanmar,"SOUTH MIAMI, FL","BROCTON, NY",Otsego County,egypt,côte d’ivoire,"FORT COLLINS, CO",ghana,"LEESVILLE, LA","CUBA, AL",egypt,"TALLULAH, LA",Iraq,cyprus,"SAN JUAN CAPISTRA, CA",Fall River,lithuania,"WEST MONROE, LA",new zealand,"BLOOMFIELD, NJ",San Cristóbal de La Laguna,gmina Nowy Żmigród,bosnia and herzegovina,france,EGY,tunisia,cm,senegal,"ROBERTSDALE, AL",papua new guinea,Ávila,Rosport-Mompach,"GLASTONBURY, CT","OAK PARK, IL",Sierra Leone,"PLYMOUTH, MA","BELLEVIEW, FL",cayman islands,"DEL CITY, OK","SEVIERVILLE, TN","SAVANNAH, TN",Jyväskylä,malaysia,Riga,powiat trzebnicki,"MARLOW, OK","ST. ONGE, SD","MILFORD, NH",colombia,LTU,Hebei,Montenegro,"WEST ALLIS, WI",macedonia,Uganda,BTN,"ROSEBURG, OR","VAN NUYS, CA",UTI del Friuli Centrale,Iraq,"NORTH MIAMI BEACH, FL","CENTER, TX",netherlands,algeria,tx,QAT,jamaica,venezuela,Senegal,"LAFAYETTE, LA",Cagliari - Casteddu,Cayman Islands,"RANTOUL, IL",côte d’ivoire,morocco,greece,"CARRINGTON, ND","EXETER, PA","CECIL, PA",bosnia and herzegovina,"SNYDER, TX","BALLINGER, TX",Ancash,Faroe Islands,"TRENTON, NJ",Cortland County,powiat jędrzejowski,malta,australia,Lugo,Bezirk St. Pölten,senegal,senegal,"CRANSTON, RI","CLIFTON, TX","ANADARKO, OK","PORTLAND, ME","CHANDLER, AZ","LEHIGHTON, PA","PLYMOUTH, MA","CHEROKEE, IA",bangladesh,"ORANGE PARK, FL",poland,"OILTON, OK",Hillsborough County,jordan,Mittweida,Hungary,egypt,united states,uruguay,Sondrio,malta,taiwan,isle of man,"BETHEL SPRINGS, TN","DECATUR, GA","LA COSTE, TX",Sri Lanka,"DILWORTH, MN",namibia,Bergamo,portugal,"DRESHER, PA",colombia,Town of Lincoln,sri lanka,Jamaica,"LEBANON, SD",MNG,guatemala,"EDGERTON, WY","SHERMAN, TX","PARKSTON, SD",Albany,estonia,"CUERO, TX",chile,romania,"HERNDON, KS",costa rica,België - Belgique - Belgien,Mexico,MEX,"KINGFISHER, OK","PENSACOLA, FL",hungary,Djibouti,nigeria,Newport County,switzerland,switzerland,"EUGENE, MO",Wuppertal,RUS,georgia,"LIBERTY, TX","CLAXTON, GA",nicaragua,monaco,jordan,Albany,kenya,Linz,"PERRY, GA","CONYERS, GA","ALVARADO, TX",Huesca,benin,"KANSAS CITY, KS",morocco,uruguay,tn,Monaco,"MACKEY, IN","BAY ST. LOUIS, MS",austria,"TECUMSEH, OK","FT. SAM HOUSTON, TX","BERKELEY, IL",singapore,"GOLD CANYON, AZ","PANAMA CITY, FL",south korea,azerbaijan,india,benin,Upravna Enota Ljubljana,cayman islands,"KINGSLAND, TX","REIDSVILLE, GA",czechia,mw,"SEILING, OK",oman,bangladesh,kenya,iran,malaysia,Gibraltar,"WILLOW, OK","CAMDEN, NJ",GIN,Norway,denmark,Mantova,"PRAIRIE VILLAGE, KS","LIEBENTHAL, KS","GRAND SALINE, TX",Cremona,IRQ,Qatar,mozambique,Sondrio,"TUSKEGEE, AL",bulgaria,Bergamo,turkey,Burdur,"SIMI VALLEY, CA",Italy,"MT. ZION, KY","PASADENA, CA",powiat oleśnicki,papua new guinea,portugal,Salzburg,Peru,"MAZEPPA, MN",Rockingham County,bosnia and herzegovina,Libya,"BANDERA, TX",Brescia,Huesca,"BRITTON, SD",dk,KEN,Town of Hague,Windsor County,nigeria,Sudan,"BROWNSTOWN, IN",kenya,Lugo,japan,pakistan,"PLANTSVILLE, CT","ELMWOOD PARK, NJ",namibia,ISL,algeria,"EARTH, TX",serbia,tunisia,jamaica,San Francisco,turkey,"ENGLEWOOD, FL",turkey,"HYANNIS, MA",denmark,lithuania,Hamburg,Casnate con Bernate,lithuania
3,romania,Dukes County,"WILLIS, TX",Mantova,Yugoslavia,UTI Giuliana / Julijska MTU,cameroon,"IRVING, TX",panama,"MIDLOTHIAN, TX","MAYNARDVILLE, TN",morocco,cayman islands,philippines,oman,taiwan,"NORTHVILLE, MI",Eswatini,Lecco,"OCALA, FL",czechia,KOR,Como,romania,slovenia,"STAFFORD, TX","VIOLA, KS","PARAMOUNT, CA",South Sudan,Huesca,"HARDIN, MO",cyprus,"ALTUS, OK","LUDINGTON, MI",Västra Götalands län,Medina de Rioseco,no,nz,sweden,"PITTSFIELD, IL",italy,monaco,Aalborg Kommune,slovakia,denmark,Kenya,spain,benin,colombia,"SOUTH MIAMI, FL",belgium,"DRAPER, NC",Sondrio,south africa,"GREENSBORO, NC",Pustertal - Val Pusteria,morocco,costa rica,united kingdom,saudi arabia,denmark,zimbabwe,albania,ukraine,Unione della Romagna Faentina,Pavia,Lugo,"HAMILTON, OH",Österåkers kommun,lebanon,côte d’ivoire,"HIAWASSEE, GA",peru,Bergamo,vietnam,"FAIRFIELD, NE",Gerede,bangladesh,FSM,"GRAND PRAIRIE, TX",turkey,jordan,mg,monaco,spain,malaysia,panama,"ABILENE, TX",switzerland,bw,new zealand,"PARIS, TX",do,Huesca,zimbabwe,Malta,morocco,Armenia,Sondrio,"MACON, GA","FRANKLIN, PA",romania,"COMSTOCK, NE","COBDEN, IL",Region,"SILVERTON, OR",slovenia,Cambridge,kenya,china,bangladesh,gmina Udanin,Hradec Králové,Parma,"CUBA, AL",pl,az,"NOTASULGA, AL","SOUTHPORT, CT",Camden County,"TRENTON, TN",south africa,uruguay,"LANDER, WY",venezuela,Forlì-Cesena,germany,"CANTON, WI","ROGERS, TX",Salzburg,Huesca,saudi arabia,"ANDALUSIA, AL","ANCHORAGE, AK",mexico,Tarn,isle of man,"AUBURN, IA",france,"COUDERSPORT, PA",estonia,togo,"GRETNA, LA",Lecco,cambodia,iran,"AILEY, GA",qatar,pakistan,south korea,"GARDNERVILLE, NV","WESTFIELD, NY",Lahden seutukunta,sweden,romania,gmina Gorzków,japan,ecuador,"DANBURY, CT",Yokohama,italy,montenegro,"VALENTINE, NE","COSTA MESA, CA",Ancash,tn,"CORDELL, OK","BELLEVIEW, FL",algeria,côte d’ivoire,malta,Northeast,australia,"HOBOKEN, NJ",vietnam,"STRAFFORD, MO",senegal,"HAYESVILLE, IA",ua,"BRADLEY, IL",cambodia,"REDWATER, TX",namibia,sweden,New Bedford,az,tunisia,ga,Central African Republic,"CLARKESVILLE, GA","BLACK HAWK, CO",Sichuan,Huesca,ecuador,bulgaria,"BOISE, ID",Ukraine,jordan,"SHAWNEE, OK",Gibraltar,Vila Franca de Xira,germany,taiwan,Riga,"RAWLINS, WY","LACOMBE, LA","ELDORADO, OK",bulgaria,"PALM BEACH, FL","HAMMONTON, NJ",cyprus,Bergamo,tx,"FORT DEPOSIT, AL",ghana,"ZION, IL",rwanda,ecuador,powiat strzelecki,peru,Pavia,"ROCHESTER, TX",israel,Corteolona e Genzone,lebanon,Huesca,taiwan,"EAGLE, WI","HAYTI, MO","LOUISBURG, KS",Oliveto Lario,GMB,Samoa,powiat jasielski,Jordan,Portsmouth,Ecuador,singapore,UTI del Friuli Centrale,estonia,Gemeinde Roppen,"JOLIET, IL","HOBBS, NM",china,no,Rimini,georgia,vietnam,monaco,brazil,Town of Ramapo,"SALT LAKE COUNTY, UT",czechia,"PERTH AMBOY, NJ",lithuania,Jõgeva maakond,albania,"GREENWOOD, LA","URSA, IL",cz,ireland,russia,greece,Marki,chile,Stockholm,bangladesh,jordan,cameroon,"MACKEY, IN","WEATHERFORD, TX","SALT LAKE COUNTY, UT","BROWNWOOD, TX",indonesia,new zealand,powiat olsztyński,powiat rycki,syria,"BROOKFIELD, CT",Stadt Imst,"FORT DODGE, IA",Manchester,"BORDEN, IN","PORT ST. LUCIE, FL",Curaçao,Kungota,"PRAIRIE VILLAGE, KS",Comunità montana della valle Camonica,lithuania,"WELLSVILLE, MO",nv,"PANAMA CITY BEACH, FL",Wheatland,"ODESSA, TX",pl,"MARGATE CITY, NJ",australia,Philippines,"ROCHELLE, IL","KERMIT, TX",...,malaysia,"SPRINGFIELD, CO",Unione dei comuni Valle del Savio,Gemeinde Tulln an der Donau,panama,"MT. ZION, KY","FALLS CHURCH, VA","ALBA, MO",Dornburg-Camburg,Casnate con Bernate,"LEANDER, TX",Taiwan,"PORTSMOUTH, OH",United Kingdom of Great Britain and Northern I...,"BENTONVILLE, AR",gmina Żmigród,LIE,zimbabwe,GBR,powiat piski,Lesotho,togo,netherlands,guatemala,"FOUNTAIN VALLEY, CA",kazakhstan,ABW,"RALEIGH, NC",Mantova,Västerås kommun,bulgaria,estonia,"JOLIET, IL",Norway,"ATKINS, AR","KOSHKONONG, MO",Tompkins County,hungary,Makran Coast,ghana,"PLAINFIELD, NJ",AZE,"SISSETON, SD","SAN ANTONIO, TX",Kangra,senegal,egypt,"WHITE CLOUD, MI",Uppsala,"LONGMONT, CO","FRISCO, TX",iran,ir,Vilnius,Vila de Rei,"LAPORTE, TX",panama,Flores Island,austria,India-Nepal,senegal,"OAK PARK, IL","LIBERTY CITY, TX",Ordes,Grumello Cremonese ed Uniti,"CANTON, OK",cameroon,united kingdom,"PORTLAND, ME",zimbabwe,SWE,"SUWANNEE, GA",LSO,BHS,East Providence,"SAVANNAH, MO",Sävsjö kommun,Addison County,namibia,"MAYWOOD, IL",morocco,"GRANITE CITY, IL",spain,lithuania,"CLARKESVILLE, GA","EAGLE, WI","HAMPTON, VA","SOUTHAMPTON, PA",costa rica,"KIOWA, KS",lebanon,Oeiras,India,czechia,croatia,"HEMPSTEAD, NY",ct,"DANNEBROG, NE","SILVIS, IL","HATTIESBURG, MS",panama,Central,mozambique,Concord,Syrian Arab Republic,"WILMONT, MN",china,"WATSON, MN",isle of man,france,"NEW BRAUNFELS, TX","TONKAWA, OK",denmark,ghana,"AREDALE, IA",nigeria,"LEWISTON, IL",nepal,Firenze,Varese,cayman islands,BGR,Mantova,Belknap County,zimbabwe,slovenia,serbia,"LAGUNA BEACH, CA","PORT SAINT LUCIE, FL",finland,isle of man,pakistan,"SANTA BARBARA, CA",Cameroon,france,monaco,hungary,"CULLOM, IL",Landkreis Gotha,"HILTON HEAD ISLAND, SC",Nacka kommun,belgium,nepal,ecuador,canada,Como,poland,"EL RENO, OK",panama,albania,"PAWLEYS ISLAND, SC",austria,"ACWORTH, GA","SOUTHAMPTON, PA",South Africa,Forlì-Cesena,cambodia,"AURELIA, IA","CLINTON TOWNSHIP, NJ",Vinschgau - Val Venosta,serbia,qatar,"ALBIA, IA","DYER, IN",romania,"MELBOURNE, FL","SOLDOTNA, AK",belgium,Millville,"CANTON, OK",canada,india,sweden,lebanon,"POWERS LAKE, ND",il,philippines,"EL RENO, OK",cyprus,india,ukraine,"WILLOWS, CA","BUCKEYE, AZ",powiat dąbrowski,australia,mexico,"ARCADIA, KS",Köln,iran,Ecuador,"BEREA, KY",finland,"BROWNSVILLE, IN","HAMILTON, MO",montenegro,Herne,russia,Nashua,"STONEHAM, MA",costa rica,ukraine,Forlì-Cesena,italy,jo,Miao-Li,norway,taiwan,"KEMPTON, IL","BIWABIK, MN","LESLIE, GA","MONROEVILLE, PA",tunisia,"FOUNTAIN VALLEY, CA",Albania,"WOODMAN, WI",SLE,GRC,"ANDALUSIA, AL","RAWLINS, WY",Iran (Islamic Republic of),united arab emirates,Unione Terre d'Acqua,"LUTHER, OK",vietnam,new zealand,jersey,"LEWISTON, ME",ghana,"MESQUITE, TX",morocco,"SILSBEE, TX",Dominican Republic,south korea,peru,al,india,Romania,Lietuva,côte d’ivoire,Forlì-Cesena,taiwan,"KAYSVILLE, UT","INA, IL",Lugo,"SPARTA, KY","BOCA RATON, FL","RAHWAY, NJ",Mantova,"SELDEN, KS","MIAMI, OK",Forlì-Cesena,Viet Nam,"BURR OAK, KS",taiwan,georgia,Albania,serbia,Windham County,bangladesh,Chile,Madrid,namibia,"STAMFORD, CT",Madison County,"PARKSTON, SD","GIBBON, MN","ELLIJAY, GA",Cremona,Pavia,"BUNA, TX",Somalia,denmark,Vila Franca de Xira,powiat poznański,philippines,south korea,"HALTOM CITY, TX",côte d’ivoire,Lugo,jamaica,Jordan,united kingdom,monaco,"BROWNSVILLE, IN","PLACENTIA, CA",georgia,"MOUNT PLEASANT, IA",dz,austria,North,"ST LOUIS, MO","CAVE JUNCTION, OR",india,"EASTON, PA",india,china,"BARRON, WI",Herne,"Alhandra, São João dos Montes e Calhandriz",azerbaijan
4,"BRASELTON, GA",powiat brzozowski,Uganda,Como,poland,Lancaster,united states,georgia,new zealand,slovenia,argentina,bangladesh,"FARGO, ND",philippines,"PARSONS, TN",ISL,pakistan,"BURNS, OR",Lugo,nicaragua,"AVONDALE, AZ","TUCKERMAN, AR",Como,co,Montserrat,"ESCONDIDO, CA","LUCEDALE, MS",portugal,côte d’ivoire,Pavia,belgium,"DANIELSON, CT",qatar,argentina,Terni,powiat niżański,belgium,"OAK LAWN, IL",Monaco,vietnam,"ROCK ISLAND, IL",jordan,gmina Warta,"KNOXVILLE, TN",lebanon,"MICHIGAN CITY, IN",brazil,cyprus,"BISHOP, CA","JERSEY VILLAGE, TX","WOBURN, MA",kazakhstan,Mantova,pakistan,"FAIRFIELD, NJ",gmina Nowy Żmigród,nicaragua,India,"MARYVILLE, MO","BAINBRIDGE ISLAND, WA",china,ZAF,hong kong,"TRACY CITY, TN",Tallinn,Forlì-Cesena,Brescia,macedonia,Åboland,"DALLAS, OR",peru,slovenia,singapore,Mantova,"CLAREMONT, NH","OZARK, MO","CENTER, ND",senegal,jersey,"ROWLETT, TX","WAUKEGAN, IL","WEST CHICAGO, IL",lt,syria,"GOLD CANYON, AZ","SAN MARINO, CA","SUMMERVILLE, GA","BRONSON, KS",syria,Andorra,"ARLINGTON, WA","BLUEFIELD, WV",ghana,Pavia,czechia,Egypt,Spain,"DIERKS, AR",Lecco,united states,south africa,hong kong,hungary,argentina,PlaceRegion,"LAKE CHARLES, LA",monaco,Burlington,"WOBURN, MA","DEERFIELD BEACH, FL",monaco,gmina Żmigród,Claremont,Genova,hong kong,brazil,cayman islands,"LORETTO, TN",latvia,Västra Götalands län,papua new guinea,"MT. PLEASANT, TX","BRANFORD, CT","ENVILLE, TN","MARLIN, TX",Forlì-Cesena,"HARPER, TX",south africa,"LINDEN, WI",Plattsburgh,Sondrio,papua new guinea,brazil,uruguay,"BURLINGTON, IA",Bezirk Landeck,"RIDGEWOOD, NJ","SCHULENBERG, TX",argentina,Zimbabwe,malta,"JONESBORO, AR",russia,Cremona,brazil,romania,cayman islands,"LAS VEGAS, NM",mozambique,ukraine,"RED HILL, PA",canada,Rauman seutukunta,poland,"MILES, TX",Marki,benin,"PASCAGOULA, MS",IND,West Bank and Gaza,"BRIGHTON, CO",united arab emirates,serbia,"GLASTONBURY, CT",MNG,"TENAHA, TX",Ecuador,switzerland,panama,"TAYLOR, TX","MAYWOOD, IL",france,"ROCHESTER, TX",nicaragua,"LAMBERTON, MN",venezuela,oman,"LA PLACE, LA","FRANKLIN, TN",morocco,albania,"PAWTUCKET, MA","JUPITER, FL",saudi arabia,Marktgemeinde Reutte,"EL RENO, OK",THA,"PLAINFIELD, NJ",ghana,cambodia,"BRAMAN, OK",united kingdom,Forlì-Cesena,"WILLOW, OK","MT. CARMEL, PA",benin,sweden,finland,Malaysia,Fiji,Pianura Reggiana,côte d’ivoire,"OAKDALE, MN",Unione dei comuni Isola Mantovana,namibia,ukraine,"WHITMAN, MA",zimbabwe,lithuania,bulgaria,Chad,Mantova,colombia,"FORT MYERS, FL",DEU,"CROMWELL, IA","TOMS RIVER, NJ",cameroon,Plymouth County,united arab emirates,Bergamo,singapore,"MASSILON, OH",Madrid,mexico,Cremona,kazakhstan,"HILLSBOROUGH TWNS, NJ","LIBERTY CITY, TX",ps,okres Vranov nad Topľou,"CASSVILLE, WI","FOUNTAIN VALLEY, CA",Bezirk Horn,guatemala,Gemeinde Erl,georgia,"BLUFFTON, SC",Gribskov Kommune,saudi arabia,Marèo - Enneberg - Marebbe,nicaragua,"MALONE, FL",canada,"QUINCY, IL",Greene County,"MARGATE CITY, NJ","PONCA CITY, OK",united states,ukraine,gmina Jasienica Rosielna,"OSTEGO, MN","CHAMPAIGN, IL","LOCKESBURG, AR",Norway,Středočeský kraj,Republic of Moldova,"HUTCHINSON, KS","SCRANTON, ND","JENA, LA","China, Hong Kong Special Administrative Region",tg,switzerland,Vestal Town,austria,Gemeinde Meiningen,zimbabwe,Syrian Arab Republic,philippines,russia,china,San Fernando Valley,"NAVASOTA, TX",Tottori,costa rica,Cumberland County,powiat jasielski,denmark,"STOCKTON, CA",Hamburg,"PITTSBURG, CA",Warwick,"BREMEN, KS",finland,Japan,okres Klatovy,monaco,Esbjerg Kommune,zimbabwe,"EMMAUS, PA","KIHEI, HI",south korea,Town of Hague,gb,"VENICE, FL","BLANCHARD, LA","WARRENTON, VA",malta,"AMARILLO, TX",nicaragua,...,TTO,"CHERRY HILL, NJ",Uppsala kommun,Castiraga Vidardo,egypt,"CUMMING, GA",denmark,Romania,Mittweida,Pawtucket,monaco,united kingdom,chile,El Salvador,"KEARNY, NJ",Turun seutukunta,"GALENA PARK, TX","WESTON, OH","MILFORD, MA",Robleda,venezuela,"ROYSTON, GA","COLUMBIA CITY, IN",nepal,GBR,tunisia,south korea,"WENATCHEE, WA",Lecco,gmina Kolno,togo,guatemala,slovenia,"ABBEVILLE, LA",ireland,"EUGENE, MO",Ferrara,nepal,"CONCORD, NH",Northwest,"TUCUMCARI, NM",Colombia,estonia,united arab emirates,China,"MORRICE, MI",vietnam,vn,Köln,tunisia,singapore,"MCKINNEY, TX",Barbados,Stamford,gmina Góra,"FROST, MN","HEREFORD, CO",ukraine,iran,"CORINTH, MS",kr,"LAYTON, UT",algeria,Morris County,Gemeinde Meiningen,"CLIFTON, TX",CAF,morocco,"SPRINGFIELD, IL",syria,chile,LBR,czechia,"FORT LANDERDALE, FL",Ferrara,austria,Österåkers kommun,Ponferrada,MDG,bo,montenegro,"RATON, NM","MARKHAM, IL","CARTHAGE, MS","LUEDERS, TX",nicaragua,estonia,Lietuva,china,chile,"PARAMOUNT, CA",UTI Riviera - Bassa Friulana,oman,egypt,"NORTH BERGEN, NJ","CRANFORD, NJ",saudi arabia,Russian Federation,Argentina,finland,jersey,nepal,namibia,Stadt Kufstein,"GERING, NE",Argentina,"NEWPORT, CA",Indonesia,netherlands,"WENATCHEE, WA","TWENTYNINE PALMS, CA","HENDERSON, KY","HAMMOND, LA","BLACKWELL, OK",togo,mexico,united states,costa rica,Bahía de Cádiz,Lodi,estonia,Guinea-Bissau,Mantova,Berkshire County,"LONGVIEW, WA",syria,azerbaijan,monaco,bosnia and herzegovina,oman,"KENOSHA, WI",slovakia,albania,"CHAMPAIGN, IL","BROWNSVILLE, IN","HENDERSON, KY",senegal,"MAYWOOD, NE",Carroll County,"FAIR OAKS, CA",Jämsä,ghana,south korea,"RYE, NY",costa rica,Cremona,"KEYSTONE, WV",colombia,"TUCKERTON, NJ","VENTURA, CA","GHENT, KY",chile,saudi arabia,"MILFORD, NH",indonesia,Forlì-Cesena,"RIVERHEAD, NY","GERMANTOWN, MD","PALM BEACH, FL",UTI delle Valli e delle Dolomiti Friulane,"ANDOVER, MN",Algeria,"MEEKER, CO","OAK FOREST, IL",hungary,panama,canada,LBR,Peekskill,cayman islands,egypt,czechia,KIR,mozambique,nicaragua,argentina,"REDMOND, OR","MARINA DEL RAY, CA",al,côte d’ivoire,ecuador,"FAIRBANKS, AK",united states,Greene County,estonia,Bosnia and Herzegovina,cm,Ferrara,sri lanka,"YORK, NE","HUNTINGTON, CA","COLE CAMP, MO",georgia,"PERRY, GA",ireland,White Plains,"WESTPORT, CT",Oliveto Lario,turkey,singapore,albania,Mantova,"SPRINGFIELD, MN",bulgaria,"MORGANTON, NC","BROWNSVILLE, IN",ghana,"BROOKSVILLE, FL",Lithuania,"THE DALLES, OR","MARTINSBURG, WV",poland,taiwan,"MIDWEST CITY, OK",lebanon,British Virgin Islands,SLE,croatia,bulgaria,Mongolia,jamaica,gmina Kolno,bulgaria,"CASTLE ROCK, CO",Makran Coast,sweden,"NAPLES, FL",south africa,poland,"GRAND PRAIRIE, TX",turkey,"HILLSBORO, IL","FORESTVILLE, WI",macedonia,"WESTFIELD, NJ",portugal,"VIDALIA, GA",ireland,"MELBOURNE, FL",Forlì-Cesena,jp,macedonia,"LIBERTY, TX",Lecco,"WIMBERLEY, TX","MANTEO, NC",af,Como,cyprus,china,Forlì-Cesena,"HARVEY, IL","DURHAM, MO",W Arabian Peninsula,portugal,"FAIRVIEW, OK",qatar,Medina de Rioseco,ecuador,MDA,Parma,Colombia,hong kong,Lisboa,mx,thailand,spain,Lugo,Bergamo,new zealand,BEL,"WARNER ROBINS, GA",Marki,Varsinais-Suomi,ALB,"BERTHOLD, ND","SONOMA, CA",austria,Brescia,"MORGAN CITY, LA",cambodia,"TAKOMA PARK, MD","CHANUTE, KS",india,georgia,"MIAMI, FL",Saudi Arabia,Hindu Kush,"YUKON, OK",colombia,venezuela,slovakia,philippines,malaysia,"ALEXANDRIA, NE",bosnia and herzegovina,"RANCHO CUCAMONGA, CA",Jefferson Township,Växjö,guatemala
102,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,train,...,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test,test


**I think Presidio can't detect that, these column values, they are not personal-related**  
 It can only detect cities or county names

In [134]:
df_gpe = analyse_class("GPE")
indis = []
for e, (i, t) in enumerate(zip(dessi_all.columns, dessi_all.iloc[-1,:])):
    try:
        if (i in df_gpe.columns) and (t in df_gpe.loc[102,i].values):
            indis.append(e)
    except:
        if (i in df_gpe.columns) and (t in df_gpe.loc[102,i]):
            indis.append(e)
for ind in indis:
    wrong_columns.append(ind)
    dessi_labels_cleaned.loc[ind,"label"] = "Other_data"

In [135]:
pd.DataFrame(wrong_columns).to_csv("dessi_cleaned/wrong_columns.csv", index=False)
dessi_labels_cleaned.to_csv("dessi_cleaned/all_labels_cleaned.csv", index=False)

Continuation in 'find_label_errors_2.ipynb'