In [8]:
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestClassifier
from sklearn.preprocessing import StandardScaler
from sklearn.metrics import accuracy_score, classification_report, confusion_matrix

# Load dataset
df = pd.read_csv("iris_flower.csv")

# Select features and target variable
feature_columns = ['sepal_length', 'sepal_width', 'petal_length', 'petal_width']
X = df[feature_columns]
y = df['species']

# Split into training and testing sets BEFORE fitting any preprocessing, so the
# held-out rows cannot influence the statistics the scaler learns.
# 30% of the rows are held out; random_state pins the shuffle for reproducibility.
X_train_raw, X_test_raw, y_train, y_test = train_test_split(
    X, y, test_size=0.3, random_state=42
)

# Standardize the data: learn mean/variance from the training rows only, then
# apply that same transformation to the test rows.
scaler = StandardScaler()
X_train = scaler.fit_transform(X_train_raw)
X_test = scaler.transform(X_test_raw)

# Scaled copy of the full feature table, kept under this name in case later
# cells rely on it. It is produced with the training-set statistics above.
X_scaled = scaler.transform(X)

# Train Random Forest model (100 trees, fixed seed so reruns give the same forest)
model = RandomForestClassifier(n_estimators=100, random_state=42)
model.fit(X_train, y_train)

# Make predictions on the held-out rows
y_pred = model.predict(X_test)

# Evaluate model performance.
# No explicit `labels` are passed to confusion_matrix, so its row/column order
# is scikit-learn's default ordering of the labels seen in y_test / y_pred.
print(f"Accuracy: {accuracy_score(y_test, y_pred)}")
print("Confusion Matrix:\n", confusion_matrix(y_test, y_pred))
print("Classification Report:\n", classification_report(y_test, y_pred))

# Display predictions with actual labels.
# y_pred is positional (one entry per row of X_test), so it lines up with
# y_test row-for-row; the index is dropped when printing.
predictions_df = pd.DataFrame({"Actual": y_test, "Predicted": y_pred})
print("\nPredicted Species for Test Data:\n")
print(predictions_df.to_string(index=False))


Accuracy: 1.0
Confusion Matrix:
 [[2 0 0]
 [0 3 0]
 [0 0 4]]
Classification Report:
               precision    recall  f1-score   support

      setosa       1.00      1.00      1.00         2
  versicolor       1.00      1.00      1.00         3
   virginica       1.00      1.00      1.00         4

    accuracy                           1.00         9
   macro avg       1.00      1.00      1.00         9
weighted avg       1.00      1.00      1.00         9


Predicted Species for Test Data:

    Actual  Predicted
 virginica  virginica
versicolor versicolor
 virginica  virginica
versicolor versicolor
    setosa     setosa
    setosa     setosa
 virginica  virginica
 virginica  virginica
versicolor versicolor
