# 🔍 Data Exploration - Cybersecurity Threats Analysis

This notebook provides a comprehensive exploration of the Global Cybersecurity Threats Dataset (2015-2024).

## 📋 Contents
1. Data Loading and Basic Information
2. Dataset Structure Analysis
3. Missing Values Assessment
4. Statistical Summary
5. Initial Visualizations

In [None]:
# Import required libraries
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
import sqlite3
from pathlib import Path
import sys

# Add src to path for imports
sys.path.append('../src')

from utils.data_loader import DataLoader
from analysis.threat_analyzer import ThreatAnalyzer

import warnings

# Plot appearance: apply the matplotlib style sheet first, then the seaborn
# palette, and finally override the default figure size so that it is set
# after the style sheet has been applied.
plt.style.use('seaborn-v0_8')
sns.set_palette('viridis')
plt.rcParams.update({'figure.figsize': (12, 8)})

# Silence all warnings for the rest of the session to keep cell output clean.
warnings.filterwarnings('ignore')

In [None]:
# Load the dataset into `df` and print a short summary of it.
# NOTE: `df` is only assigned when loading succeeds; on FileNotFoundError this
# cell prints guidance and leaves `df` untouched.
data_loader = DataLoader()

# Update this path to your actual dataset location
data_path = '../data/raw/cybersecurity_threats.csv'

# Keep the try body down to the single call whose FileNotFoundError is being
# handled; the success-path summary lives in the else clause.
try:
    df = data_loader.load_csv(data_path)
except FileNotFoundError:
    print("❌ Dataset file not found. Please check the file path.")
    print("💡 Make sure to place your dataset in the '../data/raw/' directory")
else:
    print("✅ Dataset loaded successfully!")
    print(f"📊 Shape: {df.shape}")
    print(f"📅 Columns: {list(df.columns)}")