In [1]:
"""
Data-fetching module. The aim is to import all necessary fields up front, but if needed, you can define another function to be called here.

Usage:
    import src.cdutils.database
"""

import cdutils.database.connect # type: ignore
from sqlalchemy import text # type: ignore

def fetch_data():
    """
    Pull the household-to-account mapping from the database.

    Builds one query selecting HOUSEHOLDNBR and ACCTNBR from
    OSIEXTN.HOUSEHLDACCT, registers it under the key 'househldacct', and
    passes the query list to cdutils.database.connect.retrieve_data.

    Returns:
        Whatever retrieve_data returns for the submitted query list
        (presumably a mapping keyed by each query's 'key' -- confirm against
        cdutils.database.connect).
    """
    household_account_sql = text("""
    SELECT 
        a.HOUSEHOLDNBR, 
        a.ACCTNBR
    FROM 
        OSIEXTN.HOUSEHLDACCT a
    """)

    # 'engine': 1 is forwarded as-is; its meaning is defined by retrieve_data.
    query_specs = [
        dict(key='househldacct', sql=household_account_sql, engine=1),
    ]

    return cdutils.database.connect.retrieve_data(query_specs)

In [2]:
# Run the query set defined in fetch_data and keep the raw result.
data = fetch_data()

In [3]:
# Work on a copy of the 'househldacct' entry rather than the object held in `data`.
hh = data['househldacct'].copy()

In [4]:
import cdutils.deduplication

In [5]:
# Hand `hh` to the cdutils dedupe helper with 'acctnbr' as the field
# (presumably the key to deduplicate on -- confirm against cdutils.deduplication).
dedupe_list = [dict(df=hh, field='acctnbr')]
hh_cleaned = cdutils.deduplication.dedupe(dedupe_list)

In [7]:
# Guard for the merge further down: each acctnbr must appear on exactly one
# row of hh_cleaned, otherwise a left join on acctnbr would duplicate rows.
# The message is only evaluated when the assertion fails.
assert hh_cleaned['acctnbr'].is_unique, (
    f"hh_cleaned has {int(hh_cleaned['acctnbr'].duplicated().sum())} "
    "duplicate acctnbr value(s) after dedupe"
)

In [8]:
import pandas as pd

In [14]:
# Workbook holding the alerts detail; the path is resolved relative to the
# current working directory.
INPUT_FILE = 'Alerts2025_Q3_Detail_no_ELOC_ALPlumbing_Farland.xlsx'
df = pd.read_excel(io=INPUT_FILE)

In [10]:
# Display the frame read from INPUT_FILE (pandas truncates the rendering).
# NOTE(review): this cell's saved execution count (10) predates the load cell (14),
# so the stored output may be stale -- restart and run all before relying on it.
df

Unnamed: 0,acctnbr,effdate,ownername,product,loanofficer,inactivedate,Net Balance,Net Available,Net Collateral Reserve,cobal,...,Deposit Change Pct,ttm line utilization,cleanup_provision,riskratingcd,past_due_flag,ttm_overdrafts_flag,deposit_change_flag,ttm_utilization_flag,score_flag,passed_all_flag
0,4102783,2025-07-11,PIERCE PACKAGING PRODUCTS INC,FNB - SBA Line of Credit,SBLC LOAN OFFICER,2026-09-17,0.00,150000.00,0.0,0,...,-0.108228,0.000000,0,3P,0,0,0,0,0,1
1,151160167,2025-07-11,"TAUNTON ANTIQUES CENTER, INC.",Express Business LOC,EBL PROGRAM ADMIN,2026-04-18,0.00,19500.00,0.0,0,...,-0.398881,0.000000,0,3E,0,0,0,0,0,1
2,150664441,2025-07-11,"FERNANDES & CHAREST, P.C.",Express Business LOC,EBL PROGRAM ADMIN,2026-09-10,0.00,100000.00,0.0,0,...,0.313928,0.000000,0,3E,0,0,0,0,0,1
3,200191880989,2025-07-11,AOL PROPERTIES LLC,Line of Credit,SBLC LOAN OFFICER,2026-04-30,0.00,150000.00,0.0,0,...,-0.056928,0.000000,0,3P,0,0,0,0,0,1
4,600207481760,2025-07-11,"J & R SALES AND SERVICE, INC.",Line of Credit,SBLC LOAN OFFICER,2026-01-31,0.00,100000.00,0.0,0,...,0.234617,0.000000,0,3P,0,0,0,0,0,1
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
280,150928045,2025-07-11,"HASELTON PLUMBING & HEATING, INC.",Express Business LOC,EBL PROGRAM ADMIN,2026-07-21,10636.19,59363.81,0.0,0,...,-0.008942,0.161621,1,3E,0,0,0,0,0,0
281,151110005,2025-07-11,"OSAMEQUIN FARM, INC",Line of Credit,SBLC LOAN OFFICER,2025-10-18,0.00,15000.00,0.0,0,...,0.253614,0.265371,1,3L,0,0,0,0,0,0
282,150240960,2025-07-11,"PATEAKOS & POULIN , PC",Line of Credit,SBLC LOAN OFFICER,2025-11-29,0.00,50000.00,0.0,0,...,,0.000000,0,3P,0,0,0,0,0,1
283,150662932,2025-07-11,BRANDYWINE MATERIALS INC.,SBA Secured Line of Credit,MARK A. BORKMAN,2025-10-25,0.00,240000.00,0.0,0,...,0.390122,0.000000,0,3M,0,0,0,0,0,1


In [15]:
# Attach householdnbr to every row of df via a left join on acctnbr.
# `validate` makes pandas raise a MergeError if acctnbr is not unique in
# hh_cleaned, so the join can never silently duplicate rows of df even when
# the uniqueness assert cell was skipped or run out of order.
merged_df = pd.merge(
    df,
    hh_cleaned,
    how='left',
    on='acctnbr',
    validate='many_to_one',
)

In [16]:
# Display the merged frame; householdnbr is the column contributed by hh_cleaned.
merged_df

Unnamed: 0,acctnbr,effdate,ownername,product,loanofficer,inactivedate,Net Balance,Net Available,Net Collateral Reserve,cobal,...,ttm line utilization,cleanup_provision,riskratingcd,past_due_flag,ttm_overdrafts_flag,deposit_change_flag,ttm_utilization_flag,score_flag,passed_all_flag,householdnbr
0,102199,2025-06-20,NORTHERN RHODE ISLAND CHAMBER OF COMMERCE,FNB - CML Line of Credit,SBLC LOAN OFFICER,2026-02-09,0.00,50000.00,0.0,0,...,0.000000,0,3P,0,0,0,0,0,1,230957
1,100957,2025-06-20,GRAPHIC INNOVATIONS INC,FNB - CML Line of Credit,SBLC LOAN OFFICER,2025-08-31,24442.32,125557.68,0.0,0,...,0.165745,1,3P,0,0,0,0,0,0,230174
2,101895,2025-06-20,FORE COURT RACQUET & FITNESS CLUB INC,FNB - CML Line of Credit,SBLC LOAN OFFICER,2026-03-12,0.00,50000.00,0.0,0,...,0.000000,0,3P,0,0,0,0,0,1,230222
3,101199,2025-06-20,ANDERSON-WINFIELD FUNERAL HOME INC,FNB - CML Line of Credit,SBLC LOAN OFFICER,2025-07-31,34169.09,65830.91,0.0,0,...,0.453117,1,3P,0,0,0,0,0,0,182482
4,100135,2025-06-20,"H.B. PRECISION PRODUCTS, INC.",FNB - CML Line of Credit,SBLC LOAN OFFICER,2075-01-01,0.00,0.00,0.0,0,...,0.000000,0,3P,0,0,0,0,0,1,230237
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
276,151158229,2025-06-20,"THERMAL SOLUTION RESOURCES, LLC",Express Business LOC,EBL PROGRAM ADMIN,2026-03-14,90000.00,60000.00,0.0,0,...,0.408955,1,3E,0,0,0,0,0,0,311218
277,151129577,2025-06-20,"HIGHWAY INTER STATE TRANSPORTATION COMPANY, INC.",SBA Secured Line of Credit,SBLC LOAN OFFICER,2025-12-23,45000.00,5000.00,0.0,0,...,0.551220,1,3L,0,0,0,0,0,0,185712
278,151150449,2025-06-20,"AMERICA'S BEST DEFENSE, INC.",Express Business LOC,EBL PROGRAM ADMIN,2026-02-12,24200.00,75800.00,0.0,0,...,0.158452,1,3E,0,0,1,0,0,0,182429
279,151125301,2025-06-20,BEAUPRE ELECTRIC INC,Line of Credit,WILLITTS S. MENDONCA,2025-12-09,0.00,350000.00,0.0,0,...,0.000000,0,3C,0,0,0,0,0,1,100756
