# 📊 Transaction Intelligence Pipeline Demo

In [None]:
# Load a sample document (receipt) into `text` and echo it for inspection.
# The path is relative, so it is resolved against the current working
# directory of the running kernel.
# Decode explicitly as UTF-8 so the result does not depend on the platform's
# default locale encoding.
# NOTE(review): assumes the sample file is stored as UTF-8 — confirm.
with open("../data/raw_documents/receipt.txt", encoding="utf-8") as f:
    text = f.read()

print("📄 Sample Receipt Document:")
print("=" * 50)  # 50-character rule separating the heading from the body
print(text)


In [None]:
from etl_pipeline.parse_fields import extract_fields

# Run the field extractor over the raw receipt text read in the first cell.
fields = extract_fields(text)

# Report every extracted entry as "name: value", one per line.
print("🧾 Extracted Fields:")
for field_name, field_value in fields.items():
    print(f"{field_name}: {field_value}")


In [None]:
# Stand-in for the trained classifier: the label is hard-coded here and is
# not computed from `sample_text`, which only illustrates a typical input.
predicted_label = "Receipt"
sample_text = "Uber receipt from March 2024 total $35.70"
print("📂 Document classified as:", predicted_label)


In [None]:
import pandas as pd
import matplotlib.pyplot as plt

# Simulated daily transaction counts: 14 consecutive days from 2024-03-01.
dates = pd.date_range("2024-03-01", periods=14)
counts = [200, 190, 210, 220, 180, 250, 230, 210, 205, 215, 220, 230, 240, 235]

# Build the frame from both columns, then promote "date" to the index so the
# plot uses it as the x-axis.
df = pd.DataFrame({"date": dates, "count": counts})
df = df.set_index("date")

# Draw the line chart and style it through the Axes object returned by plot().
ax = df.plot(title="📈 Daily Transactions (Simulated)")
ax.set_ylabel("Transaction Count")
ax.grid(True)
ax.figure.tight_layout()
plt.show()



---

## ✅ Summary

- Parsed a raw receipt for vendor, date, and total
- Simulated document classification with a mocked (hard-coded) prediction standing in for the trained ML classifier
- Visualized simulated daily transaction volume
- Ready for further analytics like fraud risk scoring, time series modeling, and dashboarding!
