# Unified Banking Transactions Dataset

This section loads, cleans, and merges the Customer, Checking, and Credit Card datasets to create a unified banking transactions dataset for analysis and visualization in Power BI.

In [None]:
pip install pandas numpy



In [None]:
import pandas as pd

# Load the three raw CSV exports into DataFrames.
# DATA_DIR is the one place to edit when the files live somewhere other than
# /content (presumably the Colab upload directory — adjust for local runs).
DATA_DIR = "/content"

customer_df = pd.read_csv(f"{DATA_DIR}/Customer_Info.csv")
checking_df = pd.read_csv(f"{DATA_DIR}/Checking_Account.csv")
credit_df = pd.read_csv(f"{DATA_DIR}/Credit_Card.csv")

In [None]:
# Convert each table's date column to pandas datetime values, replacing the
# column in place on its DataFrame.
for frame, date_column in (
    (checking_df, 'Transaction_Date'),
    (credit_df, 'Transaction_Date'),
    (customer_df, 'Join_Date'),
):
    frame[date_column] = pd.to_datetime(frame[date_column])

# De-duplicate each table on its key column, keeping the first row seen for
# every key value and modifying the DataFrame in place.
# NOTE(review): this treats Card_Id as a per-row key of credit_df. If a single
# card can appear on several transactions, every transaction after the first
# is discarded here — confirm against the data.
for frame, key_column in (
    (customer_df, 'Customer_ID'),
    (checking_df, 'Transaction_ID'),
    (credit_df, 'Card_Id'),
):
    frame.drop_duplicates(subset=key_column, keep='first', inplace=True)

In [None]:
# Label every row with the kind of account it came from, so the origin stays
# identifiable after the two tables are combined.
checking_df = checking_df.assign(Source='Checking')
credit_df = credit_df.assign(Source='Credit Card')

In [None]:
# Column mapping from the checking-account names to the common names shared
# with the credit-card table. Entries that map a name to itself rename
# nothing; they only spell out which columns the common layout expects.
checking_column_map = {
    'Transaction_ID': 'Transaction_ID',
    'Transaction_Date': 'Date',
    'Amount': 'Amount',
    'Transaction_Type': 'Category',
    'Branch_City': 'City',
}
checking_df = checking_df.rename(columns=checking_column_map)

# Rename the credit-card columns to the common names used by checking_df so
# the two tables line up column-for-column when they are concatenated.
# rename() silently skips labels that are not present, so the key must match
# the column's exact spelling: the ID column is 'Card_Id' (the same spelling
# the de-duplication step uses), not 'Card_ID'.
# Entries that map a name to itself rename nothing; they only document the
# columns the common layout expects.
credit_df.rename(columns={
    'Card_Id': 'Transaction_ID',
    'Transaction_Date': 'Date',
    'Amount': 'Amount',
    'Category': 'Category',
    'City': 'City'
}, inplace=True)


In [None]:
# Stack the checking rows and the credit-card rows into a single table.
# ignore_index=True discards the per-table row labels and numbers the
# combined rows from 0.
account_frames = [checking_df, credit_df]
transactions_df = pd.concat(account_frames, axis=0, ignore_index=True)

In [None]:
# Attach the customer attributes to every transaction. The left join keeps
# each transaction row even when its Customer_ID has no match in customer_df.
# - suffixes: both tables carry a City column; explicit suffixes give the two
#   resulting columns readable names instead of the default City_x / City_y.
# - validate: raises MergeError if Customer_ID is not unique in customer_df,
#   which would otherwise silently duplicate transaction rows.
unified_df = transactions_df.merge(
    customer_df,
    on='Customer_ID',
    how='left',
    suffixes=('_Transaction', '_Customer'),
    validate='many_to_one',
)

In [None]:
# Write the merged table to a CSV file in the working directory, leaving out
# the row index, then print a confirmation message.
output_path = "Unified_Transactions.csv"
unified_df.to_csv(output_path, index=False)
print("✅ Unified dataset created successfully!")

✅ Unified dataset created successfully!


In [None]:
# Sanity-check the merged table: show the first rows, then the column
# summary (names, non-null counts, dtypes).
print(unified_df.head())
# DataFrame.info() writes its report to stdout itself and returns None, so it
# is called bare; wrapping it in print() would emit an extra "None" line.
unified_df.info()

   Transaction_ID  Customer_ID       Date    Category  Amount  \
0             1.0            1 2022-03-15  Withdrawal    4057   
1             2.0            2 2024-09-06    Transfer    3145   
2             3.0            3 2023-02-08    Transfer    3823   
3             4.0            4 2023-04-23    Transfer    1912   
4             5.0            5 2023-02-04     Deposit     633   

   Account_Balance      City_x Channel    Source  Card_Id Merchant First_Name  \
0              NaN      Berovo  Online  Checking      NaN      NaN   Phyllida   
1              NaN  Södertälje  Branch  Checking      NaN      NaN     Chrisy   
2              NaN     Shilibu     ATM  Checking      NaN      NaN     Elvera   
3              NaN     Xiadong  Branch  Checking      NaN      NaN     Layton   
4              NaN  Bayan Hure  Branch  Checking      NaN      NaN    Filippa   

  Last_Name                         Email  Gender        City_y  Join_Date  \
0    Gowing  pgowing0@theglobeandmail.com  F