# Exported from a Jupyter notebook cell.
"""
exploratory_analysis.py

This script performs a minimal data exploration on a CSV file. It:
1. Loads the data from a specified path.
2. Prints a preview of the DataFrame (head).
3. Shows info about data types, memory usage, etc.
4. Checks for missing values and duplicates.
5. Generates basic statistical summaries for numerical columns.

Usage:
------
1. Adjust the CSV path in config.py if needed (default is '../data/network_data.csv').
2. Run:
   python exploratory_analysis.py
3. Ensure you have pandas installed:
   pip install pandas
"""

import pandas as pd

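# DATA_PATH (the CSV location) is defined in config.py.
# If this file lives in a package (an __init__.py sits in the same folder) and you run it
# with `python -m`, use the relative import instead:
# from .config import DATA_PATH
# If you run the script directly, use the absolute import below: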
from config import DATA_PATH

def main(data_path=None) -> None:
    """Print a minimal exploratory summary of a CSV dataset.

    Loads the CSV into a DataFrame and writes to stdout, in order: the first
    five rows, the ``DataFrame.info()`` report, the per-column missing-value
    counts, the number of duplicate rows, and ``DataFrame.describe()``.

    Args:
        data_path: Path of the CSV to explore, or any other source accepted
            by ``pandas.read_csv``. Defaults to ``DATA_PATH`` from ``config``.

    Returns:
        None. All results are printed.
    """
    # Resolve the default lazily so callers can explore another file without
    # touching config.py.
    if data_path is None:
        data_path = DATA_PATH

    # 1. Load the data
    df = pd.read_csv(data_path)

    # 2. Display the first few rows to understand the structure
    print("=== First 5 Rows of the Data ===")
    print(df.head())

    # 3. Get basic information about the dataset.
    # info() writes its report to stdout itself and returns None, so it must
    # not be wrapped in print() (that would emit a stray "None" line).
    print("\n=== DataFrame Info ===")
    df.info()

    # 4. Check for missing values in each column
    print("\n=== Missing Values in Each Column ===")
    print(df.isnull().sum())

    # 5. Check for duplicate rows
    duplicates = df.duplicated().sum()
    print(f"\n=== Number of Duplicate Rows: {duplicates} ===")

    # 6. Generate the basic statistical summary
    print("\n=== Basic Statistical Summary ===")
    print(df.describe())

# Run the exploration only when this file is executed as a script, so that
# importing the module does not trigger any loading or printing.
if __name__ == "__main__":
    main()
