In [None]:
# Step 1: Import Libraries
import pandas as pd
import matplotlib.pyplot as plt
from sklearn.ensemble import IsolationForest
import numpy as np

# Step 2: Build Dataset
# Nothing is read from disk here: the transaction amounts are synthetic.
# 200 draws centred on 1000 make up the bulk of the data, and 10 draws
# centred on 1500 stand in for unusually large transactions.
np.random.seed(42)  # fixed seed so every run draws the same values
normal_data = np.random.normal(1000, 100, size=200)
anomalies = np.random.normal(1500, 50, size=10)
# The injected values are appended last, so they occupy row indices 200-209.
data = np.hstack((normal_data, anomalies))
df = pd.Series(data, name='TransactionAmount').to_frame()

# Step 3: Apply Isolation Forest
# contamination=0.05 sets the expected share of outliers used to place the
# decision threshold; random_state pins the forest's randomness so repeated
# runs produce the same labels.
iso_forest = IsolationForest(random_state=42, contamination=0.05)
# Double brackets select a one-column DataFrame (2-D input) rather than a Series.
features = df[['TransactionAmount']]
# Fit on the amounts, then label the same rows: 1 = inlier, -1 = outlier.
df['Anomaly'] = iso_forest.fit(features).predict(features)

# Step 4: Visualize Anomalies
# Each class is drawn with its own scatter call so it gets a legend entry;
# without a legend the reader has to guess what green and red stand for.
# The 'Anomaly' column holds 1 for inliers and -1 for outliers.
fig, ax = plt.subplots(figsize=(10, 5))
for label, color, legend_name in ((1, 'green', 'Normal'), (-1, 'red', 'Anomaly')):
    # Keep the original row index on the x-axis so points stay in transaction order.
    amounts = df.loc[df['Anomaly'] == label, 'TransactionAmount']
    ax.scatter(amounts.index, amounts, color=color, label=legend_name)
ax.set_title("Anomaly Detection in Financial Transactions (Isolation Forest)")
ax.set_xlabel("Transaction Index")
ax.set_ylabel("Transaction Amount")
ax.legend()
plt.show()

# Count of anomalies
# value_counts() tallies how many rows carry each label in the 'Anomaly' column.
label_counts = df['Anomaly'].value_counts()
# One print call; sep="\n" puts the heading and the tally on separate lines.
print("\nAnomalies Detected:", label_counts, sep="\n")

In [None]:
# Mount Google Drive at /content/drive.
# The google.colab package is only importable on Colab kernels, so the import
# is guarded: on any other kernel the mount is skipped with a message instead
# of aborting "Run All" with ModuleNotFoundError. On Colab the behaviour is
# unchanged.
try:
    from google.colab import drive
except ImportError:
    drive = None  # sentinel so later code can check whether Drive is available
    print("google.colab is not available; skipping Google Drive mount.")
else:
    drive.mount('/content/drive')