In [None]:
import pandas as pd
import os

folder = '../output_data/clean'

# A reading whose |z-score| exceeds this value is reported as an anomaly.
Z_THRESHOLD = 2.5


def compute_z_scores(values):
    """Return the z-score of every entry in *values* as a float Series.

    Entries that cannot be parsed as numbers are coerced to NaN, so one bad
    cell does not make the whole column unusable; NaN never compares greater
    than the threshold, so such entries are never counted as anomalies.

    When the standard deviation is zero or undefined (constant data, or
    fewer than two numeric values) no value can deviate from the mean, so
    every numeric entry gets a z-score of 0.0 instead of the NaN/inf that a
    division by that deviation would produce.

    Args:
        values: A pandas Series or any sequence of readings.

    Returns:
        A Series aligned with the index of ``pd.Series(values)``.
    """
    numeric = pd.to_numeric(pd.Series(values), errors='coerce')
    spread = numeric.std()
    if pd.isna(spread) or spread == 0:
        # Keep NaN where the input was missing/unparseable, 0.0 elsewhere.
        return pd.Series(0.0, index=numeric.index).where(numeric.notna())
    return (numeric - numeric.mean()) / spread


# A missing folder is reported instead of crashing; sorting the listing makes
# the report order deterministic (os.listdir order is arbitrary).
if os.path.isdir(folder):
    file_names = sorted(os.listdir(folder))
else:
    print(f"⚠️ Folder not found: {folder}")
    file_names = []

for file in file_names:
    file_path = os.path.join(folder, file)

    # Sub-directories (e.g. notebook checkpoint folders) are not data files.
    if not os.path.isfile(file_path):
        continue

    # Per-file boundary: any failure is reported and the scan moves on to the
    # next file. The size check lives inside the try so that an unreadable
    # entry cannot abort the whole loop.
    try:
        # Skip if the file is empty
        if os.path.getsize(file_path) == 0:
            print(f"⚠️ Skipped empty file: {file}")
            continue

        df = pd.read_csv(file_path)

        # Check if required column exists
        if 'temperature' not in df.columns:
            print(f"⚠️ Skipped {file}: 'temperature' column missing.")
            continue

        # Basic anomaly detection using Z-score
        z_scores = compute_z_scores(df['temperature'])
        anomalies = df[z_scores.abs() > Z_THRESHOLD]
        print(f"{file}: 🚨 {len(anomalies)} anomalies detected")

    except Exception as e:
        print(f"❌ Failed to process {file}: {e}")
