# Engine Emissions & Health Analysis
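This notebook generates a synthetic dataset of engine emissions (CO2, NOx, SO2) and operating hours, derives a maintenance score from them as a proxy for engine health, and explores how the variables relate using a correlation heatmap and a scatter plot.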

In [1]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
import numpy as np

# Build a reproducible synthetic engine dataset.
# The legacy global RNG is seeded once; the order of the draws below must not
# change, because every call consumes from the same random stream.
np.random.seed(42)
n = 200

# Emission readings: normally distributed (mean, standard deviation).
co2 = np.random.normal(loc=200, scale=40, size=n)
nox = np.random.normal(loc=50, scale=15, size=n)
so2 = np.random.normal(loc=30, scale=10, size=n)

# Integer operating hours drawn uniformly from [500, 5000).
engine_hours = np.random.randint(low=500, high=5000, size=n)

# Maintenance score: start from 100, subtract an operating-hours term and a
# weighted emissions term, then bound the result to the range [0, 100].
emission_penalty = co2/10 + nox/5 + so2/3
total_penalty = engine_hours/100 + emission_penalty
maintenance_score = (100 - total_penalty).clip(0, 100)

# Assemble one row per simulated observation.
df = pd.DataFrame(
    {
        'CO2_emission_ppm': co2,
        'NOx_emission_ppm': nox,
        'SO2_emission_ppm': so2,
        'Operating_Hours': engine_hours,
        'Maintenance_Score': maintenance_score,
    }
)

# Preview the first rows as the cell output.
df.head()

In [2]:
# Correlation heatmap
# Pairwise correlations between all columns of df, shown as an annotated grid.
fig, ax = plt.subplots(figsize=(6, 5))
sns.heatmap(
    df.corr(),
    annot=True,
    fmt='.2f',  # uniform two-decimal labels in every cell
    cmap='coolwarm',
    # Pin the colour scale to the full correlation range. Without this the
    # scale is fitted to the data's min/max, so the neutral midpoint of the
    # diverging palette does not land on r = 0 and colour no longer reliably
    # separates positive from negative correlations.
    vmin=-1,
    vmax=1,
    ax=ax,
)
ax.set_title('Correlation Between Emissions and Engine Health')
plt.show()

In [3]:
# Scatter plot
# CO2 emission against maintenance score, with each point coloured by its
# operating hours on the viridis scale.
ax = sns.scatterplot(
    data=df,
    x='CO2_emission_ppm',
    y='Maintenance_Score',
    hue='Operating_Hours',
    palette='viridis',
)
# Title the Axes seaborn drew on rather than going through pyplot's "current axes".
ax.set_title('CO2 Emissions vs Maintenance Score')
plt.show()