# 💎 Diamond Price Analysis

This notebook explores how diamond attributes (such as carat, cut, and physical dimensions) relate to price, using the `diamonds.csv` dataset.

In [None]:
import pandas as pd
import seaborn as sns
import matplotlib.pyplot as plt
import numpy as np

# Enable inline plotting
%matplotlib inline

In [None]:
# Read the diamonds data from a CSV in the current working directory,
# then preview the first five rows as the cell output.
df = pd.read_csv(filepath_or_buffer='diamonds.csv')
df.head(n=5)

In [None]:
# Print a concise structural summary of the frame: column names,
# non-null counts, dtypes and memory usage.
df.info()

In [None]:
# Derive a 'size' feature as the product of the three dimension columns x, y and z.
# Note: read it back with df['size'] -- attribute access (df.size) resolves to the
# built-in DataFrame.size property (total element count), not this column.
df['size'] = df['x'].mul(df['y']).mul(df['z'])

# Preview the inputs next to the derived column.
df.loc[:, ['x', 'y', 'z', 'size']].head()

In [None]:
# Summary statistics for every column. include='all' reports non-numeric columns
# (count / unique / top / freq) alongside numeric ones (mean / std / quartiles);
# statistics that do not apply to a column's dtype appear as NaN.
df.describe(include='all')

In [None]:
# Number of missing values in each column.
df.isna().sum()

In [None]:
# Distribution of diamond prices: 50-bin histogram with a KDE overlay.
# Uses an explicit Figure/Axes pair so the plot does not depend on pyplot's
# implicit "current figure" state.
fig, ax = plt.subplots(figsize=(10, 5))
sns.histplot(df['price'], kde=True, bins=50, ax=ax)
ax.set_title('Price Distribution')
ax.set_xlabel('Price')
# End with plt.show() so the cell renders only the figure, rather than also
# echoing the Text(...) repr returned by the last labelling call.
plt.show()

In [None]:
# Price against carat weight. alpha=0.5 makes the markers semi-transparent so
# overlapping points remain distinguishable.
fig, ax = plt.subplots(figsize=(10, 5))
sns.scatterplot(data=df, x='carat', y='price', alpha=0.5, ax=ax)
ax.set_title('Price vs Carat')
# End with plt.show() so the cell renders only the figure, rather than also
# echoing the Text(...) repr returned by the title call.
plt.show()

In [None]:
# Price distribution per cut category, one box per distinct value of 'cut'.
fig, ax = plt.subplots(figsize=(10, 5))
sns.boxplot(data=df, x='cut', y='price', ax=ax)
ax.set_title('Price vs Cut')
# End with plt.show() so the cell renders only the figure, rather than also
# echoing the Text(...) repr returned by the title call.
plt.show()

In [None]:
# Pairwise correlation between the numeric columns (non-numeric columns are
# excluded via numeric_only=True).
corr_matrix = df.corr(numeric_only=True)

fig, ax = plt.subplots(figsize=(10, 8))
sns.heatmap(
    corr_matrix,
    annot=True,
    fmt='.2f',        # uniform two-decimal annotations
    cmap='coolwarm',
    vmin=-1,          # pin the colour scale to the full correlation range so the
    vmax=1,           # neutral midpoint of the diverging colormap sits at r = 0
    ax=ax,
)
ax.set_title('Correlation Heatmap')
# End with plt.show() so the cell renders only the figure, rather than also
# echoing the Text(...) repr returned by the title call.
plt.show()