In [None]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns

from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.linear_model import LogisticRegression
from sklearn.tree import DecisionTreeClassifier
from sklearn.metrics import accuracy_score, confusion_matrix, classification_report

In [None]:
# Read the Iris CSV (path is relative to the notebook's working directory)
# into the DataFrame used by every later cell.
df = pd.read_csv(filepath_or_buffer="Iris.csv")

In [None]:
# Preview the first five rows (the default row count, spelled out).
df.head(n=5)

In [None]:
# Print pandas' concise summary of the loaded frame (DataFrame.info).
df.info()

In [None]:
# Dimensions of the loaded frame as a (rows, columns) tuple.
df.shape

In [None]:
# Column labels of the loaded frame; "Species" and "Id" are referenced by later cells.
df.columns

In [None]:
# Descriptive statistics for the frame as produced by DataFrame.describe.
df.describe()

In [None]:
# Count missing values per column (isna is the canonical name; isnull is its alias).
df.isna().sum()

In [None]:
# Number of rows per class label in the target column.
species_column = "Species"
df[species_column].value_counts()

In [None]:
# Pairwise scatter/density grid of the numeric columns, coloured by class label.
sns.pairplot(
    data=df,
    hue="Species",
)
plt.show()

In [None]:
# Separate the feature matrix from the target column.
# "Species" is the label and must be present, so it is dropped strictly.
# "Id" is only a row identifier and is removed *if it exists*: errors="ignore"
# keeps this cell working for CSV variants that ship without an Id column
# (the original unconditional drop raised KeyError in that case).
X = df.drop(columns="Species").drop(columns="Id", errors="ignore")
y = df["Species"]

In [None]:
# Train-test split: hold out 20% of the rows for evaluation.
# stratify=y keeps the class proportions of y in both partitions, so the small
# test set cannot end up missing or under-representing a species.
# random_state fixes the shuffle so the split is reproducible across runs.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=42,
    stratify=y,
)

In [None]:
# Standardize features.
# The scaler is fitted on the training partition only and then applied to both
# partitions, so no statistics from the test rows leak into the fit.
scaler = StandardScaler()
scaler.fit(X_train)
X_train_scaled = scaler.transform(X_train)
X_test_scaled = scaler.transform(X_test)

In [None]:
# Logistic Regression: fit on the scaled training features, score on the scaled test set.
log_reg = LogisticRegression(max_iter=200).fit(X_train_scaled, y_train)
y_pred_log = log_reg.predict(X_test_scaled)

# Fraction of test rows whose predicted label matches the true label.
acc_log = accuracy_score(y_true=y_test, y_pred=y_pred_log)
print("Logistic Regression Accuracy:", acc_log)



In [None]:
# Decision Tree: trained on the unscaled features (the scaled copies are only
# used by the logistic-regression cell).
# random_state pins the estimator's internal randomness so that the fitted tree
# -- and therefore the reported accuracy -- is the same on every
# Restart & Run All. 42 matches the seed used for the train/test split.
dt_clf = DecisionTreeClassifier(random_state=42)
dt_clf.fit(X_train, y_train)
y_pred_dt = dt_clf.predict(X_test)

# Fraction of test rows whose predicted label matches the true label.
acc_dt = accuracy_score(y_test, y_pred_dt)
print("Decision Tree Accuracy:", acc_dt)



In [None]:
# Confusion matrices (rows = actual class, columns = predicted class).
# labels= pins the row/column order to each estimator's classes_, which is what
# the plotting cells use for their tick labels. Without it, confusion_matrix
# infers the label set from y_test/y_pred, so a class missing from the test
# split would give a smaller matrix whose axes no longer match the tick labels.
cm_log = confusion_matrix(y_test, y_pred_log, labels=log_reg.classes_)
cm_dt = confusion_matrix(y_test, y_pred_dt, labels=dt_clf.classes_)

In [None]:
# Heatmap of the logistic-regression confusion matrix, with integer cell
# annotations and both axes labelled by the classes the model was fitted on.
plt.figure(figsize=(6, 5))
sns.heatmap(
    cm_log,
    annot=True,
    fmt="d",
    cmap="Blues",
    xticklabels=log_reg.classes_,
    yticklabels=log_reg.classes_,
)
plt.xlabel("Predicted")
plt.ylabel("Actual")
plt.title("Logistic Regression Confusion Matrix")
plt.show()

In [None]:
# Heatmap of the decision-tree confusion matrix, with integer cell
# annotations and both axes labelled by the classes the tree was fitted on.
plt.figure(figsize=(6, 5))
sns.heatmap(
    cm_dt,
    annot=True,
    fmt="d",
    cmap="Greens",
    xticklabels=dt_clf.classes_,
    yticklabels=dt_clf.classes_,
)
plt.xlabel("Predicted")
plt.ylabel("Actual")
plt.title("Decision Tree Confusion Matrix")
plt.show()

In [None]:
# Per-class precision / recall / F1 for the logistic-regression predictions,
# printed under a heading line.
print(
    "Logistic Regression Report:",
    classification_report(y_test, y_pred_log),
    sep="\n",
)

In [None]:
# Per-class precision / recall / F1 for the decision-tree predictions,
# printed under a heading line.
print(
    "Decision Tree Report:",
    classification_report(y_test, y_pred_dt),
    sep="\n",
)

In [None]:
import pickle

# Persist the fitted logistic-regression model together with the scaler that
# was fitted on the training features; both are needed to score new rows the
# same way this notebook does.
# The context managers guarantee each file is flushed and closed even if
# pickling raises; the original bare open(...) calls leaked the handles.
with open("model.pkl", "wb") as model_file:
    pickle.dump(log_reg, model_file)

with open("scaler.pkl", "wb") as scaler_file:
    pickle.dump(scaler, scaler_file)