# 🌸 Iris Flower Classification – Machine Learning Project


This notebook is part of my **AI & ML Internship (Week 1)**.  
The goal is to classify **Iris flowers** into three species based on their **sepal and petal measurements**.

Species in the dataset:  
- 🌱 Setosa  
- 🌿 Versicolor  
- 🌸 Virginica  


## 📌 Step 0: Import Libraries

In [None]:

import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns

from sklearn.datasets import load_iris
from sklearn.model_selection import train_test_split
from sklearn.neighbors import KNeighborsClassifier
from sklearn.tree import DecisionTreeClassifier
from sklearn.metrics import accuracy_score, confusion_matrix, classification_report


## 📌 Step 1: Load Dataset

In [None]:

# Load the bundled Iris dataset and wrap its feature matrix in a DataFrame,
# using the dataset's own feature names as column headers.
iris = load_iris()
df = pd.DataFrame(data=iris.data, columns=iris.feature_names)

# Translate each numeric target code into its species name by indexing the
# dataset's own target_names array. This keeps the labels in lockstep with
# the names used elsewhere (e.g. plot tick labels) instead of repeating them
# in a hand-written dict.
df['species'] = iris.target_names[iris.target]

print("First 5 rows of dataset:")
# Kept as the final expression so the notebook cell renders the preview.
df.head()


## 📌 Step 2: Explore Dataset

In [None]:

print("Dataset Info:")
# DataFrame.info() writes its report straight to stdout and returns None,
# so it must not be wrapped in print() (that would emit a stray "None").
df.info()

print("\nStatistical Summary:")
print(df.describe())

# Pairplot visualization: pairwise scatter plots of the columns, coloured by species
sns.pairplot(df, hue="species")
plt.show()

# Correlation heatmap over the feature columns only. The label column is
# dropped by name so the result does not depend on its position in the frame.
plt.figure(figsize=(6,4))
sns.heatmap(df.drop(columns="species").corr(), annot=True, cmap="coolwarm")
plt.title("Feature Correlation")
plt.show()


## 📌 Step 3: Preprocess Data

In [None]:

# Separate the measurement columns (features) from the species label (target).
X = df.drop(columns="species")
y = df["species"]

# Hold out 20% of the rows for testing. stratify=y preserves the class
# proportions of the full dataset in both splits, so per-class metrics on
# the small test set are not skewed by an unlucky shuffle; random_state
# pins the shuffle for reproducibility.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=42, stratify=y
)

print("Training set size:", X_train.shape)
print("Testing set size:", X_test.shape)


## 📌 Step 4: Train Models

In [None]:

# Model 1: K-Nearest Neighbors
knn = KNeighborsClassifier()
knn.fit(X_train, y_train)

# Model 2: Decision Tree
dt = DecisionTreeClassifier(random_state=42)
dt.fit(X_train, y_train)


## 📌 Step 5: Evaluate Models

In [None]:

def evaluate_model(model, model_name, X_eval=None, y_eval=None):
    """Print accuracy and a classification report, then plot a confusion matrix.

    Parameters
    ----------
    model
        A fitted estimator exposing ``predict``.
    model_name : str
        Label used in the printed header and the plot title.
    X_eval, y_eval : optional
        Features and true labels to score against. When omitted, the
        notebook-level ``X_test`` / ``y_test`` are used, which matches the
        original two-argument call style.

    Returns
    -------
    None
        Results are printed and the figure is shown as side effects.
    """
    if X_eval is None:
        X_eval = X_test
    if y_eval is None:
        y_eval = y_test

    y_pred = model.predict(X_eval)
    print(f"\n🔹 {model_name} Results 🔹")
    print("Accuracy:", accuracy_score(y_eval, y_pred))
    print("\nClassification Report:\n", classification_report(y_eval, y_pred))

    # Confusion Matrix
    # Pass the class order explicitly: the matrix then always has one
    # row/column per species in the same order as the tick labels, even if
    # a species is absent from the evaluated rows, rather than relying on
    # the sorted order of whatever labels happen to occur.
    class_names = iris.target_names.tolist()
    cm = confusion_matrix(y_eval, y_pred, labels=class_names)
    plt.figure(figsize=(5,4))
    sns.heatmap(cm, annot=True, fmt="d", cmap="Blues",
                xticklabels=class_names,
                yticklabels=class_names)
    plt.xlabel("Predicted")
    plt.ylabel("Actual")
    plt.title(f"{model_name} - Confusion Matrix")
    plt.show()

# Run the shared evaluation routine over each trained classifier:
# KNN first, then the decision tree.
for fitted_model, display_name in (
    (knn, "K-Nearest Neighbors"),
    (dt, "Decision Tree"),
):
    evaluate_model(fitted_model, display_name)


## 📌 Step 6: Save & Wrap Up

In [None]:

# Save dataset (optional)
df.to_csv("iris_dataset.csv", index=False)
print("Project Completed ✅ - Upload your notebook & README.md to GitHub")
