# Iris Dataset Analysis
This project involves loading, exploring, analyzing, and visualizing the Iris dataset using Python. The goal is to understand patterns in the flower measurements and species classification.

In [None]:
import pandas as pd
from sklearn.datasets import load_iris

# Load the Iris dataset shipped with scikit-learn
iris = load_iris()

# Convert to a DataFrame: one column per feature, named after iris.feature_names
df = pd.DataFrame(data=iris.data, columns=iris.feature_names)

# Translate the integer class codes in iris.target into species names.
# The lookup table is derived from iris.target_names itself, so the number of
# classes is not hard-coded and the column is written exactly once.
species_by_code = dict(enumerate(iris.target_names))
df['species'] = pd.Series(iris.target, index=df.index).map(species_by_code)

# Show first 5 rows
df.head()

In [None]:
# Dataset info: print a concise summary of `df` (column names, non-null
# counts, dtypes and memory usage) to sanity-check the loaded structure.
df.info()

In [None]:
# Count the missing entries in each column; a non-zero count flags a column
# that needs cleaning before analysis.
df.isna().sum()

In [None]:
# Basic statistics: count, mean, std, min, quartiles and max per column.
# NOTE: with default arguments pandas' describe() summarizes only the numeric
# columns of a mixed-type frame, so the string `species` column is left out.
df.describe()

In [None]:
# Average of every measurement column, computed separately for each species
df.groupby('species').agg('mean')

In [None]:
import matplotlib.pyplot as plt
import seaborn as sns
# Apply seaborn's default theme with the "whitegrid" axes style. This changes
# global matplotlib settings, so it affects every figure drawn afterwards.
# NOTE(review): the seaborn docs describe `set` as an alias of `set_theme`
# that may be removed in a future release — consider switching once the
# minimum supported seaborn version is confirmed.
sns.set(style="whitegrid")

In [None]:
# Line chart: both sepal measurements plotted against the row position
fig, ax = plt.subplots(figsize=(10, 5))
for column, label in (
    ('sepal length (cm)', 'Sepal Length'),
    ('sepal width (cm)', 'Sepal Width'),
):
    ax.plot(df.index, df[column], label=label)
ax.set_title('Sepal Dimensions Over Samples')
ax.set_xlabel('Sample Index')
ax.set_ylabel('cm')
ax.legend()
plt.show()

In [None]:
# Bar chart: mean petal length for each species
mean_petal_length = df.groupby('species')['petal length (cm)'].mean()
fig, ax = plt.subplots(figsize=(7, 5))
mean_petal_length.plot(kind='bar', color='skyblue', ax=ax)
ax.set_title('Average Petal Length by Species')
ax.set_xlabel('Species')
ax.set_ylabel('Petal Length (cm)')
# Keep the species names horizontal instead of the rotated bar-plot default
plt.xticks(rotation=0)
plt.show()

In [None]:
# Histogram: distribution of sepal length over all samples, split into 20 bins
fig, ax = plt.subplots(figsize=(7, 5))
ax.hist(df['sepal length (cm)'], bins=20, color='salmon', edgecolor='black')
ax.set(
    title='Sepal Length Distribution',
    xlabel='Sepal Length (cm)',
    ylabel='Frequency',
)
plt.show()

In [None]:
# Scatter plot: sepal length against petal length, one color per species
plt.figure(figsize=(8, 6))
ax = sns.scatterplot(
    data=df,
    x='sepal length (cm)',
    y='petal length (cm)',
    hue='species',
    palette='deep',
)
plt.title('Sepal Length vs Petal Length')
plt.xlabel('Sepal Length (cm)')
plt.ylabel('Petal Length (cm)')
# seaborn already draws a legend for `hue`; a bare plt.legend() here would
# replace it and drop its title, so only retitle the existing legend.
ax.get_legend().set_title('Species')
plt.show()

## 📌 Observations
1. 'Setosa' has the smallest sepal and petal lengths on average.
2. 'Virginica' has the highest values in petal length.
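3. Sepal length is not uniformly distributed: values span 4.3–7.9 cm and concentrate around the mean of about 5.8 cm, thinning out toward both extremes.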
4. There is a strong positive correlation between sepal length and petal length.