# Exploratory Data Analysis
## Objectives
* Visualize correlations between car attributes and selling price.
* Validate hypotheses about price correlations.

## Outputs
* Correlation heatmap, scatter plot, and box plots saved as PNG images in the `outputs` directory.

## Additional Comments
* Use seaborn for visualizations.

In [None]:
import os

import matplotlib.pyplot as plt
import pandas as pd
import seaborn as sns

# Load cleaned dataset
df = pd.read_csv('../../datasets/cleaned_car_data.csv')

# plt.savefig does not create missing directories, so make sure the output
# directory exists before the first figure is written.
os.makedirs('../../outputs', exist_ok=True)

# Correlation heatmap
# Restrict to numeric columns: the frame also carries columns used as
# categories below (Fuel_Type, Transmission; presumably string-valued), and
# pandas >= 2.0 raises on non-numeric columns in DataFrame.corr() instead of
# silently dropping them.
numeric_df = df.select_dtypes(include='number')
plt.figure(figsize=(10, 8))
sns.heatmap(numeric_df.corr(), annot=True, cmap='coolwarm')
plt.title('Correlation Heatmap')
plt.savefig('../../outputs/correlation_heatmap.png')

# Scatter plot: Present_Price vs Selling_Price
plt.figure(figsize=(8, 6))
sns.scatterplot(x='Present_Price(lacs)', y='Selling_Price(lacs)', data=df)
plt.title('Present Price vs Selling Price')
plt.savefig('../../outputs/present_vs_selling_price.png')

# Box plot: Fuel_Type vs Selling_Price
plt.figure(figsize=(8, 6))
sns.boxplot(x='Fuel_Type', y='Selling_Price(lacs)', data=df)
plt.title('Fuel Type vs Selling Price')
plt.savefig('../../outputs/fuel_type_vs_selling_price.png')

# Box plot: Transmission vs Selling_Price
plt.figure(figsize=(8, 6))
sns.boxplot(x='Transmission', y='Selling_Price(lacs)', data=df)
plt.title('Transmission vs Selling Price')
plt.savefig('../../outputs/transmission_vs_selling_price.png')

# Release all figures once every image has been written to disk.
plt.close('all')