# Chapter 3: Analysis of Accounting Transactions

Accounting transactions are the 'raw data' of accounting systems. This chapter demonstrates tools for preparing and analyzing accounting transaction data cost-effectively.

## Setup

In [None]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from scipy import stats
import auditanalytics as aa

# Notebook-wide plotting defaults: seaborn's 'whitegrid' style and a
# 12x6 default size for matplotlib figures that do not set their own.
sns.set_style('whitegrid')
plt.rcParams.update({'figure.figsize': (12, 6)})

## Loading Transaction Data

In [None]:
# Load the sales, purchase, and disbursement journals through
# aa.load_dataset, keyed by dataset name.
sales_journal = aa.load_dataset('sales_journal')
purchase_journal = aa.load_dataset('purchase_journal')
disbursement_journal = aa.load_dataset('disbursement_journal')

# Preview the sales journal: a heading, its first rows, then the row count.
print("Sales Journal:", sales_journal.head(), sep="\n")
sales_record_count = len(sales_journal)
print(f"\nTotal records: {sales_record_count}")

## Transaction Analysis

In [None]:
# Describe and plot the first numeric column of the sales journal.
# NOTE(review): the first numeric column is treated as the transaction
# amount -- confirm it is not an identifier such as an invoice number.
numeric_cols = sales_journal.select_dtypes(include=[np.number]).columns
if len(numeric_cols) > 0:
    amount_col = numeric_cols[0]
    amounts = sales_journal[amount_col]

    print(f"\nStatistics for {amount_col}:")
    print(amounts.describe())

    # Two side-by-side panels on one figure: histogram with a KDE overlay
    # on the left, box plot on the right.
    fig, (hist_ax, box_ax) = plt.subplots(1, 2, figsize=(12, 5))

    sns.histplot(amounts, kde=True, ax=hist_ax)
    hist_ax.set_title(f'Distribution of {amount_col}')

    sns.boxplot(y=amounts, ax=box_ax)
    box_ax.set_title(f'Box Plot of {amount_col}')

    fig.tight_layout()
    plt.show()

## Ledger Analysis

In [None]:
# Load the accounts payable ledger, then print a preview of its first rows
# followed by the output of describe().
ap_ledger = aa.load_dataset('ap_ledger')
print("\nAccounts Payable Ledger:")
print(ap_ledger.head())
# Plain string literal: there is nothing to interpolate, so no f-prefix.
print("\nSummary:")
print(ap_ledger.describe())

## Data Quality Checks

In [None]:
# Data-quality profile of the sales journal: missing values per column,
# number of fully duplicated rows, and the dtype of each column.

# Missing values, counted column by column
print("Missing values in sales journal:")
missing_per_column = sales_journal.isnull().sum()
print(missing_per_column)

# Rows that repeat an earlier row exactly
duplicate_mask = sales_journal.duplicated()
print(f"\nDuplicate records: {duplicate_mask.sum()}")

# Column dtypes, printed under their heading
print("\nData types:", sales_journal.dtypes, sep="\n")

## Conclusion

This notebook demonstrates fundamental techniques for analyzing accounting transactions, including data quality checks, statistical analysis, and visualization.