# 🧠 Credit Card Fraud Detection EDA

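This notebook performs exploratory data analysis (EDA) on the credit card transactions dataset: its basic structure, the balance between fraud and non-fraud classes, the distributions of transaction amount and time, and how each feature correlates with the `Class` label.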

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# Apply seaborn's white-grid theme to every figure drawn in this notebook.
# set_theme() is the documented interface; sns.set() is only a legacy alias
# for it that the seaborn docs mark as a candidate for removal.
sns.set_theme(style='whitegrid')

# Location of the transactions CSV, relative to the notebook's working
# directory. Kept in one named constant so it is easy to find and change.
DATA_PATH = '../data/creditcard.csv'

# Load the dataset
df = pd.read_csv(DATA_PATH)

# Preview the first rows to confirm the file parsed as expected
df.head()

## 📊 Basic Info

In [None]:
# Dimensions of the frame as a (rows, columns) tuple
print("Shape:", df.shape)

# Column-by-column overview (dtype and non-null count), printed by pandas
df.info()

# Count of missing entries per column; as the last expression it becomes
# the cell's displayed output. isna() is the same check as isnull().
df.isna().sum()

## 📉 Class Distribution

In [None]:
# Tabulate how many rows carry each class label
class_counts = df['Class'].value_counts()
print(class_counts)

# Draw the same counts as a bar chart on an explicitly created Axes
fig, ax = plt.subplots()
sns.countplot(data=df, x='Class', ax=ax)
ax.set_title('Class Distribution (0 = Non-Fraud, 1 = Fraud)')
plt.show()

## 💸 Amount Analysis

In [None]:
# Histogram (50 bins) of the 'Amount' column with a KDE curve overlaid
amounts = df['Amount']

fig, ax = plt.subplots()
sns.histplot(amounts, bins=50, kde=True, ax=ax)
ax.set_title('Transaction Amount Distribution')
ax.set_xlabel('Amount')
ax.set_ylabel('Frequency')
plt.show()

## ⏱️ Time of Transaction

In [None]:
# Histogram (50 bins) of the 'Time' column, drawn on an explicit Axes
times = df['Time']

fig, ax = plt.subplots()
sns.histplot(times, bins=50, ax=ax)
ax.set_title('Transaction Time Distribution (in seconds)')
ax.set_xlabel('Time')
ax.set_ylabel('Frequency')
plt.show()

## 🔍 Correlation with Class

In [None]:
# Correlation with target
# Pearson correlation of each numeric column with 'Class'. Selecting numeric
# columns first keeps corr() from raising on non-numeric data in pandas >= 2.0.
correlations = df.select_dtypes(include='number').corr()['Class']

# Order by strength rather than by sign, so strongly negative relationships
# are not pushed to the bottom of the ranking. The values keep their sign;
# 'Class' itself (correlation 1.0) normally remains the first entry.
correlations = correlations.reindex(
    correlations.abs().sort_values(ascending=False).index
)
print(correlations.head(10))

# Optional: plot top 5 correlated features
# Drop the target by name instead of assuming it occupies position 0.
top_features = correlations.drop('Class').index[:5]

# A pair plot draws every row in every panel, so its cost grows with the size
# of the frame. Cap the rows taken from each class (seeded for reproducibility);
# classes smaller than the cap are kept whole. This changes the relative class
# proportions in the figure only -- the correlations above use all rows.
PAIRPLOT_MAX_ROWS_PER_CLASS = 2000
pairplot_df = pd.concat([
    group.sample(n=min(len(group), PAIRPLOT_MAX_ROWS_PER_CLASS), random_state=42)
    for _, group in df.groupby('Class')
])
sns.pairplot(pairplot_df[top_features.to_list() + ['Class']], hue='Class')
plt.show()

## 🧼 Summary Statistics

In [None]:
# Descriptive statistics for the frame's columns, as computed by
# DataFrame.describe(); the trailing expression renders the table.
summary_stats = df.describe()
summary_stats