# Task 2: Predictive Analysis using Machine Learning
**Internship:** CODTECH

**Dataset Used:** Iris Flower Dataset (from sklearn)

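This notebook builds a classification model that predicts the species of an iris flower from its four measurements (sepal length, sepal width, petal length, and petal width). It covers loading and visualizing the data, separating features from labels, training the model, and evaluating it on a held-out test set.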

In [None]:
import pandas as pd
import seaborn as sns
import matplotlib.pyplot as plt
from sklearn.datasets import load_iris
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import accuracy_score, classification_report, confusion_matrix


In [None]:
# Fetch the iris data bundled with scikit-learn
iris = load_iris()

# Lookup table: integer class code -> species name
species_by_code = dict(enumerate(iris.target_names))

# Build the feature table, then attach the label column already translated
# from class codes to species names
df = pd.DataFrame(iris.data, columns=iris.feature_names)
df['species'] = pd.Series(iris.target, index=df.index).map(species_by_code)

# Preview the first few rows
df.head()


In [None]:
# Pairwise scatter plots of every column pair, with points colored by species
pair_grid = sns.pairplot(data=df, hue="species")
plt.show()


In [None]:
# Features and labels: every column except "species" is a feature,
# and "species" is the prediction target.
X = df.drop("species", axis=1)
y = df["species"]

# Train-test split (80% train / 20% test, fixed seed for reproducibility).
# Stratify on the label so the hold-out set keeps the same species proportions
# as the full dataset; with a test set this small, an unstratified split leaves
# the per-class counts to chance and skews the per-class metrics.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=42, stratify=y
)


In [None]:
# Random Forest hyper-parameters: 100 trees, fixed seed so the fit is repeatable
forest_params = {"n_estimators": 100, "random_state": 42}

# Build the classifier and fit it on the training split
model = RandomForestClassifier(**forest_params)
model.fit(X_train, y_train)


In [None]:
# Make predictions for the held-out test rows
y_pred = model.predict(X_test)

# Evaluate the model.
# Headers and payloads are printed with separate print() calls: passing both to
# a single print() inserts a separator space after the "\n", which shifts the
# first line of the report / matrix out of alignment with the lines below it.
print("Accuracy Score:", accuracy_score(y_test, y_pred))

print("\nClassification Report:")
print(classification_report(y_test, y_pred))

# Pin the label order explicitly and attach it to both axes, so each row
# (actual species) and column (predicted species) is identified in the output
# instead of relying on the implicit ordering of a bare array.
class_labels = list(model.classes_)
confusion_table = pd.DataFrame(
    confusion_matrix(y_test, y_pred, labels=class_labels),
    index=pd.Index(class_labels, name="actual"),
    columns=pd.Index(class_labels, name="predicted"),
)
print("\nConfusion Matrix:")
print(confusion_table)
