In [8]:
# !pip install pip --upgrade
import numpy as np
from scipy import spatial
import matplotlib.pyplot as plt
from sklearn.manifold import TSNE

import pandas as pd
# !pip install pyopenssl --upgrade
# !pip install --upgrade smart_open
from nltk.corpus import stopwords
from nltk.tokenize import word_tokenize
import string

# for processing
import re
import nltk
from nltk.tokenize import word_tokenize


from IPython.display import display, HTML
display(HTML("<style>.container { width:100% !important; }</style>"))
pd.set_option('display.max_colwidth', None)

from datetime import datetime
from nltk.tokenize import RegexpTokenizer

In [2]:
%%time
embeddings_dict_6B_50D = {}
with open("glove.6B/glove.6B.50d.txt", 'r', encoding="utf-8") as f:
    for line in f:
        values = line.split()
        word = ' '.join(values[:-50]).lower().strip()
        vector = np.asarray(values[-50:], "float32")
        embeddings_dict_6B_50D[word] = vector
        
def vectorize_text(text):
    vectors = [embeddings_dict_6B_50D.get(word) for word in str(text).split() if word in embeddings_dict_6B_50D]
    vectors = [v for v in vectors if v is not None]  # remove any None values
    if vectors:
        vectorized = np.mean(vectors, axis=0)
    else:
        vectorized = np.zeros(50)  # if there are no vectors, return a zero-vector
    return vectorized

Wall time: 3.95 s


In [3]:
def text_normalizer(text):
    if text:
        # Use NLTK RegexpTokenizer for tokenization. 
        # This tokenizer splits the text by white space and also keeps tokens like "wasn't" and "don't".
        tokenizer = RegexpTokenizer(r'\b\w[\w\'-]*\w\b|\w')
        words = tokenizer.tokenize(text)

        # Clean up any token with repeating characters like '666', 'aaa', '!!!!!!', substitute them with empty string ''.
        # This includes 'XXXX' maskings in the text created by CFPB.
        words = [re.sub(r'(\w)\1{2,}', '', word) if re.search(r'(\w)\1{2,}', word) else word for word in words]

        # Convert to lowercase and remove punctuations.
        words = [word.lower().strip() for word in words]

        # Substitute the tokens with "" where they are just numbers.
        words = ['' if word.isdigit() else word for word in words]

        # Join the words back into a single string.
        text = ' '.join([word for word in words if word])
    
    return text

In [9]:
%%time
cfpb_df = pd.read_csv("CFPB RAW complaints 5.9.2023.csv")



Wall time: 18.1 s


In [10]:
%%time
# Convert the 'date' column to datetime format
print("Before droping nan narrative: ", len(cfpb_df))
cfpb_df.dropna(subset=['Consumer complaint narrative'], inplace=True)
cfpb_df['Date received'] = pd.to_datetime(cfpb_df['Date received'])
cfpb_df['narr_len'] = cfpb_df['Consumer complaint narrative'].apply(lambda x:len(str(x)))
cfpb_df['days_to_today'] = (datetime.now().date() - cfpb_df['Date received'].dt.date).dt.days

cfpb_df['narr_len'] = cfpb_df['narr_len'].astype(int)
cfpb_df['days_to_today'] = cfpb_df['days_to_today'].astype(int)

cfpb_df['days_to_today'] = (datetime.now().date() - cfpb_df['Date received'].dt.date).dt.days

cfpb_df['clean_narr'] = cfpb_df['Consumer complaint narrative'].apply(text_normalizer)
cfpb_df['narr_head_vec'] = cfpb_df['clean_narr'].apply(lambda x: vectorize_text(x[:500]))

print("After droping nan narrative: ", len(cfpb_df))

Before droping nan narrative:  3599657
After droping nan narrative:  1300361
Wall time: 5min 25s


In [41]:
# df = cfpb_df[cfpb_df['Complaint ID'].isin([5830282,5830057,5830027,5830056])].copy()#sample(15)
# df

In [42]:
# from scipy.spatial.distance import pdist, squareform
# vectors = df['narr_head_vec'].tolist()

# vectors_2d = np.vstack(vectors)
# dists = pdist(vectors_2d, metric='euclidean')
# dist_matrix = squareform(dists)
# pd.DataFrame(dist_matrix)

In [43]:
# point1 = df['narr_head_vec'].to_list()[0]
# point2 = df['narr_head_vec'].to_list()[1]
# point3 = df['narr_head_vec'].to_list()[2]
# point4 = df['narr_head_vec'].to_list()[3]
# point5 = cfpb_df['narr_head_vec'].sample().to_list()[0]

# print(np.linalg.norm(point1 - point2))
# print(np.linalg.norm(point1 - point3))
# print(np.linalg.norm(point1 - point5))

In [44]:
small_cfpb_df = cfpb_df[['State', 'ZIP code','Complaint ID','narr_len', 'days_to_today','narr_head_vec']].copy()
small_cfpb_df[['State', 'ZIP code']] = small_cfpb_df[['State', 'ZIP code']].fillna('')

In [45]:
# when running group by, the input is a mini dataframe with same ['Product', 'Issue', 'State', 'ZIP code']
def find_duplicate_narr(df):
    small_df = df[['Complaint ID','narr_len', 'days_to_today', 'narr_head_vec']].copy()
    
    def find_dupi_in_small_df(row_narr_len, row_to_day, row_narr_head_vec, small_df):
        tmp_df = small_df.query("narr_len <= @row_narr_len*1.2 & narr_len >= @row_narr_len*0.8 & days_to_today <= @row_to_day+5 & days_to_today >= @row_to_day-5").copy()    
        tmp_df['eclidean_dist'] = tmp_df['narr_head_vec'].apply(lambda x: np.linalg.norm(x - row_narr_head_vec))
        dupli_df = tmp_df[tmp_df['eclidean_dist']<0.25]
        dupli_id_list = sorted(dupli_df['Complaint ID'].to_list())
        return dupli_id_list
    
    df['dupi_id'] = small_df.apply(lambda row: find_dupi_in_small_df(row['narr_len'], int(row['days_to_today']), row['narr_head_vec'], small_df),axis=1)
    
    return df

In [46]:
%%time
small_cfpb_df = small_cfpb_df.groupby(['State', 'ZIP code']).apply(func=find_duplicate_narr)

Wall time: 42min 14s


In [47]:
small_cfpb_df['dupi_len'] = small_cfpb_df['dupi_id'].apply(lambda x: len(x))
small_cfpb_df['dupi_id'] = small_cfpb_df['dupi_id'].apply(lambda x: ";".join([str(y) for y in x]))

In [49]:
merged_df = cfpb_df.merge(small_cfpb_df[['Complaint ID', 'dupi_id', 'dupi_len']], on='Complaint ID', how='left').drop(['narr_head_vec'], axis=1)

In [59]:
dupli_df = merged_df[merged_df.dupi_len>1].sort_values('dupi_id').copy()
dupli_df

Unnamed: 0,Date received,Product,Sub-product,Issue,Sub-issue,Consumer complaint narrative,Company public response,Company,State,ZIP code,...,Date sent to company,Company response to consumer,Timely response?,Consumer disputed?,Complaint ID,narr_len,days_to_today,clean_narr,dupi_id,dupi_len
366585,2015-03-19,Credit reporting,,Incorrect information on credit report,Account status,"I have been disputing incorrect information on my Experian XXXX XXXX XXXX credit report but they are unwilling to allow me to dispute their "" investigation results ''. The creditors are XXXX XXXX and XXXX XXXX XXXX. The report reflects late payments and the information is inaccurate. XXXX creditors have agreed to have the items corrected on all XXXX credit bureaus but only XXXX made the correction.",Company chooses not to provide a public response,Experian Information Solutions Inc.,FL,33157,...,2015-03-19,Closed with explanation,Yes,No,1290842,401,3035,i have been disputing incorrect information on my experian credit report but they are unwilling to allow me to dispute their investigation results the creditors are and the report reflects late payments and the information is inaccurate creditors have agreed to have the items corrected on all credit bureaus but only made the correction,1290842;1290843,2
253477,2015-03-19,Credit reporting,,Incorrect information on credit report,Account status,"I have been disputing incorrect information on my XXXX & Trans Union credit report but they are unwilling to allow me to dispute their "" investigation results ''. The creditors are XXXX XXXX and XXXX XXXX XXXX. The report reflects late payments and the information is inaccurate. Both creditors have agreed to have the items corrected on all XXXX credit bureaus but only XXXX made the correction.",,"TRANSUNION INTERMEDIATE HOLDINGS, INC.",FL,33157,...,2015-03-19,Closed with explanation,Yes,No,1290843,396,3035,i have been disputing incorrect information on my trans union credit report but they are unwilling to allow me to dispute their investigation results the creditors are and the report reflects late payments and the information is inaccurate both creditors have agreed to have the items corrected on all credit bureaus but only made the correction,1290842;1290843,2
46863,2015-03-19,Credit reporting,,Incorrect information on credit report,Information is not mine,there is a XXXX XXXX account on my credit report that does not belong to me. I have attem have attempted to dispute several times to no avail.,,"TRANSUNION INTERMEDIATE HOLDINGS, INC.",FL,33157.0,...,2015-03-25,Closed with non-monetary relief,Yes,No,1290847,142,3035,there is a account on my credit report that does not belong to me i have attem have attempted to dispute several times to no avail,1290847;1290849,2
1122799,2015-03-19,Credit reporting,,Incorrect information on credit report,Information is not mine,there is a XXXX BP account on my credit report that does not belong to me. I have attem have attempted to dispute several times to no avail.,Company chooses not to provide a public response,Experian Information Solutions Inc.,FL,33157.0,...,2015-03-19,Closed with explanation,Yes,No,1290849,140,3035,there is a bp account on my credit report that does not belong to me i have attem have attempted to dispute several times to no avail,1290847;1290849,2
762120,2015-03-19,Debt collection,I do not know,Cont'd attempts collect debt not owed,Debt is not mine,"Call from XXXX XXXX XXXX XXXX XXXX XXXX seeking XXXX XXXX. XXXX purchased bad debt or bad contact information from Northland Group. Call from ( XXXX ) XXXX, I explained debt is not mine. Lady got rude when I refused to answer her questions about me. Told her do not call again. Subsequently received an automated call from ( XXXX ) XXXX seeking XXXX XXXX.",,Northland Group Inc,FL,32256.0,...,2015-03-19,Closed with explanation,Yes,No,1291079,355,3035,call from seeking purchased bad debt or bad contact information from northland group call from i explained debt is not mine lady got rude when i refused to answer her questions about me told her do not call again subsequently received an automated call from seeking,1291079;1292604,2
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
54804,2023-04-22,"Credit reporting, credit repair services, or other personal consumer reports",Credit reporting,Improper use of your report,Reporting company used your report improperly,"In accordance with the Fair Credit Report Act XXXX, XXXX, XXXX XXXX XXXX , has violated my rights. \n15 U.S.C 1681 Section 602 A, States I have the right to privacy.\n\n15 U.S.C 1681 Section 604 A, Section 2 : It also states a consumer reporting agency can not furnish an account without my written instructions. \nI do not owe this debt collector.",Company has responded to the consumer and the CFPB and chooses not to provide a public response,Experian Information Solutions Inc.,FL,33435.0,...,2023-04-22,Closed with explanation,Yes,,6876195,344,79,in accordance with the fair credit report act has violated my rights u s c section a states i have the right to privacy u s c section a section it also states a consumer reporting agency can not furnish an account without my written instructions i do not owe this debt collector,6876195;6876460,2
3466,2023-04-27,Debt collection,Other debt,Attempts to collect debt not owed,Debt was result of identity theft,TEK COLLECT INC ( XXXX XXXX XXXX XXXX XXXX ) is a result of identity theft. I recently discovered through my new monitoring service this account being reported I made efforts to remove this account from my file as the amount of {$240.00} does not belong to me. This account was fraudulently opened through this company in XXXX of 2020 an has been reported to the FTC and authorities as Identity theft. I have submitted all of my information needed to resolve this matter in this complaint and through the FTC report attached and do not feel comfortable giving any further information in any way to any others at this time due to the further possibilities of identity theft.,Company believes it acted appropriately as authorized by contract or law,TekCollect Inc.,TX,75040.0,...,2023-04-27,Closed with explanation,Yes,,6892933,673,74,tek collect inc is a result of identity theft i recently discovered through my new monitoring service this account being reported i made efforts to remove this account from my file as the amount of does not belong to me this account was fraudulently opened through this company in of an has been reported to the ftc and authorities as identity theft i have submitted all of my information needed to resolve this matter in this complaint and through the ftc report attached and do not feel comfortable giving any further information in any way to any others at this time due to the further possibilities of identity theft,6892933;6894971,2
134734,2023-04-26,Debt collection,Other debt,Attempts to collect debt not owed,Debt was result of identity theft,SUNRISE CREDIT SERVICES ( XXXX XXXXXXXX XXXX ) is a result of identity theft. I recently discovered through my Identity monitoring service this account being reported I made efforts to remove this account from my file as the amount of {$1900.00} does not belong to me. This account was fraudulently opened through this company in XXXX of 2022 an has been reported to the FTC and authorities as Identity theft. I have submitted all of my information needed to resolve this matter in this complaint and through the FTC report attached and do not feel comfortable giving any further information in any way to any others at this time due to the further possibilities of identity theft.,Company has responded to the consumer and the CFPB and chooses not to provide a public response,"SUNRISE CREDIT SERVICES, INC",TX,75040.0,...,2023-04-26,Closed with explanation,Yes,,6894971,681,75,sunrise credit services is a result of identity theft i recently discovered through my identity monitoring service this account being reported i made efforts to remove this account from my file as the amount of does not belong to me this account was fraudulently opened through this company in of an has been reported to the ftc and authorities as identity theft i have submitted all of my information needed to resolve this matter in this complaint and through the ftc report attached and do not feel comfortable giving any further information in any way to any others at this time due to the further possibilities of identity theft,6892933;6894971,2
115015,2023-04-26,Debt collection,Credit card debt,Attempts to collect debt not owed,Debt was result of identity theft,"The open dates for are not accurate and the account numbers are invalid. XXXX, never represents or corresponds to appropriate account informations. Its been more than 6 months and you have never given me any response to my request to validate the debt and of its origin. I have never given any approval or permission for you to report this account. \n\nThis is a violation of my rights as a consumer. I will be seeking legal assistance due to noncompliance with 15 U.S. Code 1681 ( e ) ( B ) and XXXX XXXX Compliance Standards, there are multiple deviations, deficiencies, inaccurate information, and unauthorized information listed on my credit report. Please remove these accounts referenced from my credit report.",Company believes it acted appropriately as authorized by contract or law,"CCS Financial Services, Inc.",NJ,08701,...,2023-04-26,Closed with explanation,Yes,,6895848,714,75,the open dates for are not accurate and the account numbers are invalid never represents or corresponds to appropriate account informations its been more than months and you have never given me any response to my request to validate the debt and of its origin i have never given any approval or permission for you to report this account this is a violation of my rights as a consumer i will be seeking legal assistance due to noncompliance with u s code e b and compliance standards there are multiple deviations deficiencies inaccurate information and unauthorized information listed on my credit report please remove these accounts referenced from my credit report,6895848;6895883,2


In [76]:
df = dupli_df.groupby(['Product','dupi_id']).sum().reset_index()
df['dupi_id_len'] = df['dupi_id'].apply(lambda x: len(x.split(";")))
df[df['dupi_id_len']!=np.sqrt(df['dupi_len'])].sort_values('days_to_today')

Unnamed: 0,Product,dupi_id,Complaint ID,narr_len,days_to_today,dupi_len,dupi_id_len
148374,"Credit reporting, credit repair services, or other personal consumer reports",6876195;6876460,6876195,300,79,2,2
148373,"Credit reporting, credit repair services, or other personal consumer reports",6876043;6876460,6876043,400,79,2,2
148372,"Credit reporting, credit repair services, or other personal consumer reports",6876043;6876195;6876460,6876460,400,79,3,3
148345,"Credit reporting, credit repair services, or other personal consumer reports",6803373;6803530,6803373,100,95,2,2
148341,"Credit reporting, credit repair services, or other personal consumer reports",6799272;6799484,6799484,400,96,2,2
...,...,...,...,...,...,...,...
36098,"Credit reporting, credit repair services, or other personal consumer reports",3594857;3594862;3594921;3594923;3594927;3594933;3594953;3594954;3594958;3594960;3594961;3594965;3595013;3595014;3595030;3595035;3595036;3595065;3595069;3595070;3595071;3595072;3595074;3595076;3595103;3595106;3595108;3595110;3595112;3595113;3595146;3595147;3595454;3595459;3595690;3595691,79091790,4400,26178,792,36
17964,"Credit reporting, credit repair services, or other personal consumer reports",3056242;3056257;3056267;3056285;3056286;3056325;3058078;3058081;3058082;3058084;3059126;3059171;3059275;3059298;3059310;3059359;3059360;3059382;3059392;3060236;3060301;3060310;3060336;3060425;3060435;3061514;3061529;3061530;3061534;3061539;3061541;3061544;3061546,55067805,14400,30877,594,33
2640,Credit reporting,1605520;1605526;1605527;1607824;1607826;1607827;1607828;1607830;1607832;1607834;1607836;1607842;1610146;1610148;1610150;1610151;1610153;1610154;1610156;1610161;1610165;1610170;1610171;1610177;1610178;1610180;1610183,28973582,16200,50836,486,27
2638,Credit reporting,1605519;1605521;1605522;1605523;1605524;1605525;1607811;1607825;1607829;1607831;1607837;1607838;1607840;1607841;1610147;1610149;1610152;1610155;1610157;1610158;1610159;1610160;1610162;1610163;1610164;1610166;1610167;1610168;1610169;1610172;1610173;1610174;1610175;1610176;1610179;1610181;1610182;1610184,37033808,20800,64952,874,38


In [78]:
x = "3594857;3594862;3594921;3594923;3594927;3594933;3594953;3594954;3594958;3594960;3594961;3594965;3595013;3595014;3595030;3595035;3595036;3595065;3595069;3595070;3595071;3595072;3595074;3595076;3595103;3595106;3595108;3595110;3595112;3595113;3595146;3595147;3595454;3595459;3595690;3595691"
len(x.split(";"))

36

In [60]:
pivot_table = pd.pivot_table(dupli_df, index='dupi_len', columns='Product', aggfunc=len, fill_value=0)
pivot_table

Unnamed: 0_level_0,Company,Company,Company,Company,Company,Company,Company,Company,Company,Company,...,narr_len,narr_len,narr_len,narr_len,narr_len,narr_len,narr_len,narr_len,narr_len,narr_len
Product,Bank account or service,Checking or savings account,Consumer Loan,Credit card,Credit card or prepaid card,Credit reporting,"Credit reporting, credit repair services, or other personal consumer reports",Debt collection,"Money transfer, virtual currency, or money service",Money transfers,...,"Money transfer, virtual currency, or money service",Money transfers,Mortgage,Other financial service,Payday loan,"Payday loan, title loan, or personal loan",Prepaid card,Student loan,Vehicle loan or lease,Virtual currency
dupi_len,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2,Unnamed: 9_level_2,Unnamed: 10_level_2,Unnamed: 11_level_2,Unnamed: 12_level_2,Unnamed: 13_level_2,Unnamed: 14_level_2,Unnamed: 15_level_2,Unnamed: 16_level_2,Unnamed: 17_level_2,Unnamed: 18_level_2,Unnamed: 19_level_2,Unnamed: 20_level_2,Unnamed: 21_level_2
2,82,333,45,263,1732,3280,191184,18263,305,2,...,305,2,625,2,25,200,5,275,331,0
3,13,49,29,56,516,961,98136,3772,49,0,...,49,0,79,0,2,58,0,63,107,3
4,5,21,14,27,250,196,16655,1847,12,0,...,12,0,35,0,2,21,0,24,52,0
5,2,3,0,4,115,87,8991,867,13,0,...,13,0,13,0,0,2,0,21,27,0
6,0,5,0,1,62,60,5598,686,3,0,...,3,0,0,0,0,10,0,7,7,0
7,0,3,3,11,45,8,3377,369,16,0,...,16,0,1,0,0,0,0,0,7,0
8,0,3,1,2,11,8,2669,206,3,0,...,3,0,0,0,0,0,0,0,0,0
9,0,0,0,0,8,31,2124,141,3,0,...,3,0,1,0,0,1,0,0,4,0
10,0,1,0,0,15,21,1549,135,9,0,...,9,0,2,0,0,2,0,0,12,0
11,0,0,1,0,4,7,1413,122,6,0,...,6,0,0,0,0,0,0,0,2,0


In [61]:
dupli_df['narr_len'] = dupli_df['narr_len'].apply(lambda x: round(x, -2))
pivot_table = pd.pivot_table(dupli_df, index='dupi_len', columns='narr_len', aggfunc=len, fill_value=0)
pivot_table

Unnamed: 0_level_0,Company,Company,Company,Company,Company,Company,Company,Company,Company,Company,...,dupi_id,dupi_id,dupi_id,dupi_id,dupi_id,dupi_id,dupi_id,dupi_id,dupi_id,dupi_id
narr_len,0,100,200,300,400,500,600,700,800,900,...,30700,30900,31100,31200,31300,31400,31600,31700,32400,32500
dupi_len,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2,Unnamed: 9_level_2,Unnamed: 10_level_2,Unnamed: 11_level_2,Unnamed: 12_level_2,Unnamed: 13_level_2,Unnamed: 14_level_2,Unnamed: 15_level_2,Unnamed: 16_level_2,Unnamed: 17_level_2,Unnamed: 18_level_2,Unnamed: 19_level_2,Unnamed: 20_level_2,Unnamed: 21_level_2
2,1899,14648,18273,23625,22948,19950,18045,16508,11134,9347,...,0,0,4,2,2,2,1,1,1,3
3,968,6338,8095,11907,11450,9603,8298,8021,5492,4302,...,2,3,0,0,0,0,0,0,0,0
4,88,873,1370,2655,1933,1543,1533,1403,928,703,...,0,0,0,0,0,0,0,0,0,0
5,59,458,789,1775,1013,767,739,817,425,318,...,0,0,0,0,0,0,0,0,0,0
6,50,323,401,1067,556,497,421,576,272,189,...,0,0,0,0,0,0,0,0,0,0
7,21,203,216,852,266,328,224,194,136,92,...,0,0,0,0,0,0,0,0,0,0
8,0,135,174,590,266,168,170,181,116,100,...,0,0,0,0,0,0,0,0,0,0
9,0,113,155,543,186,122,94,134,93,30,...,0,0,0,0,0,0,0,0,0,0
10,10,58,112,397,116,114,84,114,55,12,...,0,0,0,0,0,0,0,0,0,0
11,33,88,93,362,141,95,91,66,16,40,...,0,0,0,0,0,0,0,0,0,0


In [63]:
dupli_df[dupli_df.dupi_len>25]

Unnamed: 0,Date received,Product,Sub-product,Issue,Sub-issue,Consumer complaint narrative,Company public response,Company,State,ZIP code,...,Date sent to company,Company response to consumer,Timely response?,Consumer disputed?,Complaint ID,narr_len,days_to_today,clean_narr,dupi_id,dupi_len
379287,2015-08-08,Credit reporting,,Improper use of my credit report,Report improperly shared by CRC,"While checking my personal credit report, I noticed an unauthorized and fraudulent credit inquiry made by XXXX on or about XX/XX/XXXX on Transunion. I did not authorized anyone employed by this company to make any inquiry and view my credit report. XXXX has violated the Fair Credit Reporting Act Section 1681b ( c ). They were not legally entitled to make this fraudulent inquiry. This is a serious breach of my privacy rights. \nI have requested that they mail me a copy of my signed authorization form that gave them the right to view my credit within XXXX ( XXXX ) business days so that I can verify its validity and advised them that if they can not provide me with proof that I authorized them to view my credit report then I am demanding that they contact the credit bureaus immediately and have them remove the unauthorized and fraudulent hard inquiry immediately. I also requested that they remove my personal information from their records. My Social Security # is XXXX and my Date of Birth is XX/XX/XXXX in case it is needed to locate the fraudulent inquiry in their system.",Company chooses not to provide a public response,"TRANSUNION INTERMEDIATE HOLDINGS, INC.",CA,92563.0,...,2015-08-08,Closed with explanation,Yes,No,1509798,1100,2893,while checking my personal credit report i noticed an unauthorized and fraudulent credit inquiry made by on or about xx xx on transunion i did not authorized anyone employed by this company to make any inquiry and view my credit report has violated the fair credit reporting act section 1681b c they were not legally entitled to make this fraudulent inquiry this is a serious breach of my privacy rights i have requested that they mail me a copy of my signed authorization form that gave them the right to view my credit within business days so that i can verify its validity and advised them that if they can not provide me with proof that i authorized them to view my credit report then i am demanding that they contact the credit bureaus immediately and have them remove the unauthorized and fraudulent hard inquiry immediately i also requested that they remove my personal information from their records my social security is and my date of birth is xx xx in case it is needed to locate the fraudulent inquiry in their system,1509792;1509793;1509794;1509796;1509798;1509799;1509801;1509805;1509806;1509807;1509808;1509810;1509811;1509812;1509814;1509815;1509816;1509819;1509820;1510117;1510119;1510126;1510131;1510134;1510136;1510141;1510142;1510145;1510146;1510148;1510149;1510152;1510154;1510157,34
585415,2015-08-09,Credit reporting,,Improper use of my credit report,Report improperly shared by CRC,"While checking my personal credit report, I noticed an unauthorized and fraudulent credit inquiry made by XXXX XXXX XXXX XXXX CO on or about XX/XX/XXXX on Transunion. I did not authorized anyone employed by this company to make any inquiry and view my credit report. XXXX XXXX XXXX XXXX CO has violated the Fair Credit Reporting Act Section 1681b ( c ). They were not legally entitled to make this fraudulent inquiry. This is a serious breach of my privacy rights. \nI have requested that they mail me a copy of my signed authorization form that gave them the right to view my credit within five ( 5 ) business days so that I can verify its validity and advised them that if they can not provide me with proof that I authorized them to view my credit report then I am demanding that they contact the credit bureaus immediately and have them remove the unauthorized and fraudulent hard inquiry immediately. I also requested that they remove my personal information from their records. My Social Security # is XXXX and my Date of Birth is XX/XX/XXXX in case it is needed to locate the fraudulent inquiry in their system.",Company chooses not to provide a public response,"TRANSUNION INTERMEDIATE HOLDINGS, INC.",CA,92563.0,...,2015-08-10,Closed with explanation,Yes,No,1510119,1100,2892,while checking my personal credit report i noticed an unauthorized and fraudulent credit inquiry made by co on or about xx xx on transunion i did not authorized anyone employed by this company to make any inquiry and view my credit report co has violated the fair credit reporting act section 1681b c they were not legally entitled to make this fraudulent inquiry this is a serious breach of my privacy rights i have requested that they mail me a copy of my signed authorization form that gave them the right to view my credit within five business days so that i can verify its validity and advised them that if they can not provide me with proof that i authorized them to view my credit report then i am demanding that they contact the credit bureaus immediately and have them remove the unauthorized and fraudulent hard inquiry immediately i also requested that they remove my personal information from their records my social security is and my date of birth is xx xx in case it is needed to locate the fraudulent inquiry in their system,1509792;1509793;1509794;1509796;1509798;1509799;1509801;1509805;1509806;1509807;1509808;1509810;1509811;1509812;1509814;1509815;1509816;1509819;1509820;1510117;1510119;1510126;1510131;1510134;1510136;1510141;1510142;1510145;1510146;1510148;1510149;1510152;1510154;1510157,34
472019,2015-08-08,Credit reporting,,Improper use of my credit report,Report improperly shared by CRC,"While checking my personal credit report, I noticed an unauthorized and fraudulent credit inquiry made by XXXX on or about XX/XX/XXXX onTransunion. I did not authorized anyone employed by this company to make any inquiry and view my credit report. XXXX has violated the Fair Credit Reporting Act Section 1681b ( c ). They were not legally entitled to make this fraudulent inquiry. This is a serious breach of my privacy rights. \nI have requested that they mail me a copy of my signed authorization form that gave them the right to view my credit within five ( 5 ) business days so that I can verify its validity and advised them that if they can not provide me with proof that I authorized them to view my credit report then I am demanding that they contact the credit bureaus immediately and have them remove the unauthorized and fraudulent hard inquiry immediately. I also requested that they remove my personal information from their records. My Social Security # is XXXX and my Date of Birth is XX/XX/XXXX in case it is needed to locate the fraudulent inquiry in their system.",Company chooses not to provide a public response,"TRANSUNION INTERMEDIATE HOLDINGS, INC.",CA,92563.0,...,2015-08-10,Closed with explanation,Yes,No,1509816,1100,2893,while checking my personal credit report i noticed an unauthorized and fraudulent credit inquiry made by on or about xx xx ontransunion i did not authorized anyone employed by this company to make any inquiry and view my credit report has violated the fair credit reporting act section 1681b c they were not legally entitled to make this fraudulent inquiry this is a serious breach of my privacy rights i have requested that they mail me a copy of my signed authorization form that gave them the right to view my credit within five business days so that i can verify its validity and advised them that if they can not provide me with proof that i authorized them to view my credit report then i am demanding that they contact the credit bureaus immediately and have them remove the unauthorized and fraudulent hard inquiry immediately i also requested that they remove my personal information from their records my social security is and my date of birth is xx xx in case it is needed to locate the fraudulent inquiry in their system,1509792;1509793;1509794;1509796;1509798;1509799;1509801;1509805;1509806;1509807;1509808;1509810;1509811;1509812;1509814;1509815;1509816;1509819;1509820;1510117;1510119;1510126;1510131;1510134;1510136;1510141;1510142;1510145;1510146;1510148;1510149;1510152;1510154;1510157,34
1254374,2015-08-08,Credit reporting,,Improper use of my credit report,Report improperly shared by CRC,"While checking my personal credit report, I noticed an unauthorized and fraudulent credit inquiry made by XXXX XXXX on or about XX/XX/XXXX on Experian. I did not authothize anyone employed by this company to make any inquiry and view my credit report. XXXX XXXX has violated the Fair Credit Reporting Act Section 1681b ( c ). They were not legally entitled to make this fraudulent inquiry. This is a serious breach of my privacy rights. \nI have requested that they mail me a copy of my signed authorization form that gave them the right to view my credit within XXXX ( XXXX ) business days so that I can verify its validity and advised them that if they can not provide me with proof that I authorized them to viewmy credit report then I am demanding that they contact the credit bureaus immediately and have them remove the unauthorized and fraudulent hard inquiry immediately. I also requested that they remove my personal information from their records. My Social Security # is XXXX and my Date of Birth is XX/XX/XXXX in case it is needed to locate the fraudulent inquiry in their system.",Company chooses not to provide a public response,Experian Information Solutions Inc.,CA,92563.0,...,2015-08-08,Closed with non-monetary relief,Yes,No,1509792,1100,2893,while checking my personal credit report i noticed an unauthorized and fraudulent credit inquiry made by on or about xx xx on experian i did not authothize anyone employed by this company to make any inquiry and view my credit report has violated the fair credit reporting act section 1681b c they were not legally entitled to make this fraudulent inquiry this is a serious breach of my privacy rights i have requested that they mail me a copy of my signed authorization form that gave them the right to view my credit within business days so that i can verify its validity and advised them that if they can not provide me with proof that i authorized them to viewmy credit report then i am demanding that they contact the credit bureaus immediately and have them remove the unauthorized and fraudulent hard inquiry immediately i also requested that they remove my personal information from their records my social security is and my date of birth is xx xx in case it is needed to locate the fraudulent inquiry in their system,1509792;1509793;1509794;1509796;1509798;1509799;1509801;1509805;1509806;1509807;1509808;1509810;1509811;1509812;1509814;1509815;1509816;1509819;1509820;1510117;1510119;1510126;1510131;1510134;1510136;1510141;1510142;1510145;1510146;1510148;1510149;1510152;1510154;1510157,34
958667,2015-08-09,Credit reporting,,Improper use of my credit report,Report improperly shared by CRC,"While checking my personal credit report, I noticed an unauthorized and fraudulent credit inquiry made by XXXX on or about XX/XX/XXXX on Equifax. I did not authorized anyone employed by this company to make any inquiry and view my credit report. XXXX XXXX XXXX has violated the Fair Credit Reporting Act Section 1681b ( c ). They were not legally entitled to make this fraudulent inquiry. This is a serious breach of my privacy rights. \nI have requested that they mail me a copy of my signed authorization form that gave them the right to view my credit within five ( 5 ) business days so that I can verify its validity and advised them that if they can not provide me with proof that I authorized them to view my credit report then I am demanding that they contact the credit bureaus immediately and have them remove the unauthorized and fraudulent hard inquiry immediately. I also requested that they remove my personal information from their records. My Social Security # is XXXX and my Date of Birth is XX/XX/XXXX in case it is needed to locate the fraudulent inquiry in their system.",,"EQUIFAX, INC.",CA,92563.0,...,2015-08-10,Closed with explanation,Yes,No,1510145,1100,2892,while checking my personal credit report i noticed an unauthorized and fraudulent credit inquiry made by on or about xx xx on equifax i did not authorized anyone employed by this company to make any inquiry and view my credit report has violated the fair credit reporting act section 1681b c they were not legally entitled to make this fraudulent inquiry this is a serious breach of my privacy rights i have requested that they mail me a copy of my signed authorization form that gave them the right to view my credit within five business days so that i can verify its validity and advised them that if they can not provide me with proof that i authorized them to view my credit report then i am demanding that they contact the credit bureaus immediately and have them remove the unauthorized and fraudulent hard inquiry immediately i also requested that they remove my personal information from their records my social security is and my date of birth is xx xx in case it is needed to locate the fraudulent inquiry in their system,1509792;1509793;1509794;1509796;1509798;1509799;1509801;1509805;1509806;1509807;1509808;1509810;1509811;1509812;1509814;1509815;1509816;1509819;1509820;1510117;1510119;1510126;1510131;1510134;1510136;1510141;1510142;1510145;1510146;1510148;1510149;1510152;1510154;1510157,34
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
146804,2023-02-11,"Credit reporting, credit repair services, or other personal consumer reports",Credit reporting,Problem with a credit reporting company's investigation into an existing problem,Investigation took more than 30 days,My first letters to the credit bureaus regarding this account were in XX/XX/2022 and I have sent out letters each month since. This account is fraudulent and has been in dispute since I first seen it around XXXX XXXX last year but according to the credit bureaus they have it listed as not in dispute and remains unverified in the last several months. How is this possible if I have sent repeated letters to each bureau disputing this as well as letter to the alleged creditor. These are all violations of my rights under Title 15USC1681 and I demand that CFPB investigate this. Each bureau had 30 days to verify the account and not only did they send me letters stating it was verified but yet on their own report it states that there has been no verification and it is not in dispute. I have copied the XXXX FTC and the Attorney General for Florida.,,"EQUIFAX, INC.",FL,33030,...,2023-02-11,Closed with explanation,Yes,,6560867,900,149,my first letters to the credit bureaus regarding this account were in xx xx and i have sent out letters each month since this account is fraudulent and has been in dispute since i first seen it around last year but according to the credit bureaus they have it listed as not in dispute and remains unverified in the last several months how is this possible if i have sent repeated letters to each bureau disputing this as well as letter to the alleged creditor these are all violations of my rights under title 15usc1681 and i demand that cfpb investigate this each bureau had days to verify the account and not only did they send me letters stating it was verified but yet on their own report it states that there has been no verification and it is not in dispute i have copied the ftc and the attorney general for florida,6559636;6559641;6559650;6560617;6560618;6560627;6560648;6560691;6560692;6560693;6560697;6560700;6560728;6560742;6560745;6560756;6560760;6560770;6560773;6560776;6560777;6560780;6560804;6560808;6560811;6560815;6560820;6560823;6560867,29
205249,2023-02-11,"Credit reporting, credit repair services, or other personal consumer reports",Credit reporting,Problem with a credit reporting company's investigation into an existing problem,Investigation took more than 30 days,"My first letters to the credit bureaus regarding this account were in XX/XX/2022 and I have sent out letters each month since. This account is fraudulent and has been in dispute since I first seen it around labor day last year but according to the credit bureaus they have it listed as not in dispute and remains unverified in the last several months. How is this possible if I have sent repeated letters to each bureau disputing this as well as letter to the alleged creditor. These are all violations of my rights under Title 15USC1681 and I demand that CFPB investigate this. Each bureau had 30 days to verify the account and not only did they send me letters stating it was verified but yet on their own report it states that there has been no verification and it is not in dispute. I have copied the XXXX, FTC and the Attorney General for Florida.",Company has responded to the consumer and the CFPB and chooses not to provide a public response,Experian Information Solutions Inc.,FL,33030,...,2023-02-11,Closed with explanation,Yes,,6559641,900,149,my first letters to the credit bureaus regarding this account were in xx xx and i have sent out letters each month since this account is fraudulent and has been in dispute since i first seen it around labor day last year but according to the credit bureaus they have it listed as not in dispute and remains unverified in the last several months how is this possible if i have sent repeated letters to each bureau disputing this as well as letter to the alleged creditor these are all violations of my rights under title 15usc1681 and i demand that cfpb investigate this each bureau had days to verify the account and not only did they send me letters stating it was verified but yet on their own report it states that there has been no verification and it is not in dispute i have copied the ftc and the attorney general for florida,6559636;6559641;6559650;6560617;6560618;6560627;6560648;6560691;6560692;6560693;6560697;6560700;6560728;6560742;6560745;6560756;6560760;6560770;6560773;6560776;6560777;6560780;6560804;6560808;6560811;6560815;6560820;6560823;6560867,29
433442,2023-02-11,"Credit reporting, credit repair services, or other personal consumer reports",Credit reporting,Problem with a credit reporting company's investigation into an existing problem,Investigation took more than 30 days,"My first letters to the credit bureaus regarding this account were in XX/XX/2022 and I have sent out letters each month since. This account is fraudulent and has been in dispute since I first seen it around labor day last year but according to the credit bureaus they have it listed as not in dispute and remains unverified in the last several months. How is this possible if I have sent repeated letters to each bureau disputing this as well as letter to the alleged creditor. These are all violations of my rights under Title 15USC1681 and I demand that CFPB investigate this. Each bureau had 30 days to verify the account and not only did they send me letters stating it was verified but yet on their own report it states that there has been no verification and it is not in dispute. I have copied the XXXX, FTC and the Attorney General for Florida.",Company has responded to the consumer and the CFPB and chooses not to provide a public response,Experian Information Solutions Inc.,FL,33030,...,2023-02-11,Closed with explanation,Yes,,6560692,900,149,my first letters to the credit bureaus regarding this account were in xx xx and i have sent out letters each month since this account is fraudulent and has been in dispute since i first seen it around labor day last year but according to the credit bureaus they have it listed as not in dispute and remains unverified in the last several months how is this possible if i have sent repeated letters to each bureau disputing this as well as letter to the alleged creditor these are all violations of my rights under title 15usc1681 and i demand that cfpb investigate this each bureau had days to verify the account and not only did they send me letters stating it was verified but yet on their own report it states that there has been no verification and it is not in dispute i have copied the ftc and the attorney general for florida,6559636;6559641;6559650;6560617;6560618;6560627;6560648;6560691;6560692;6560693;6560697;6560700;6560728;6560742;6560745;6560756;6560760;6560770;6560773;6560776;6560777;6560780;6560804;6560808;6560811;6560815;6560820;6560823;6560867,29
146658,2023-02-11,"Credit reporting, credit repair services, or other personal consumer reports",Credit reporting,Problem with a credit reporting company's investigation into an existing problem,Investigation took more than 30 days,"My first letters to the credit bureaus regarding this account were in XX/XX/2022 and I have sent out letters each month since. This account is fraudulent and has been in dispute since I first seen it around labor day last year but according to the credit bureaus they have it listed as not in dispute and remains unverified in the last several months. How is this possible if I have sent repeated letters to each bureau disputing this as well as letter to the alleged creditor. These are all violations of my rights under Title 15USC1681 and I demand that CFPB investigate this. Each bureau had 30 days to verify the account and not only did they send me letters stating it was verified but yet on their own report it states that there has been no verification and it is not in dispute. I have copied the XXXX, FTC and the Attorney General for Florida.",Company has responded to the consumer and the CFPB and chooses not to provide a public response,"TRANSUNION INTERMEDIATE HOLDINGS, INC.",FL,33030,...,2023-02-11,Closed with non-monetary relief,Yes,,6560691,900,149,my first letters to the credit bureaus regarding this account were in xx xx and i have sent out letters each month since this account is fraudulent and has been in dispute since i first seen it around labor day last year but according to the credit bureaus they have it listed as not in dispute and remains unverified in the last several months how is this possible if i have sent repeated letters to each bureau disputing this as well as letter to the alleged creditor these are all violations of my rights under title 15usc1681 and i demand that cfpb investigate this each bureau had days to verify the account and not only did they send me letters stating it was verified but yet on their own report it states that there has been no verification and it is not in dispute i have copied the ftc and the attorney general for florida,6559636;6559641;6559650;6560617;6560618;6560627;6560648;6560691;6560692;6560693;6560697;6560700;6560728;6560742;6560745;6560756;6560760;6560770;6560773;6560776;6560777;6560780;6560804;6560808;6560811;6560815;6560820;6560823;6560867,29


In [77]:
merged_df.to_csv('CFPB with Duplicate Marked NEW.csv', index=False)