# Classification Workflow with edaflow
This notebook demonstrates a typical classification workflow using edaflow.

In [None]:
# Import required libraries
import pandas as pd
import edaflow as eda
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestClassifier

## 1. Load Sample Data
Synthetic classification dataset.

In [None]:
# Column-oriented toy data: two integer feature columns plus a binary
# (0/1) label column, ten rows each.
sample_columns = {
    'feature1': [2, 3, 1, 5, 4, 2, 3, 4, 5, 1],
    'feature2': [7, 8, 6, 5, 7, 8, 6, 5, 7, 8],
    'target': [0, 1, 0, 1, 1, 0, 1, 0, 1, 0],
}
df = pd.DataFrame(data=sample_columns)
# Trailing expression so the notebook renders the first rows of the frame.
df.head()

## 2. Preprocess Data
Split into train and test sets.

In [None]:
# Separate the two feature columns from the label column.
X = df[['feature1', 'feature2']]
y = df['target']
# Hold out 30% of the rows for evaluation. Stratifying on y keeps the class
# proportions similar in the train and test parts, so a small test set cannot
# end up containing a single class only; the fixed seed makes the split
# reproducible.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.3, random_state=42, stratify=y
)

## 3. Train Classifier
Fit a RandomForestClassifier.

In [None]:
# Seed the forest so repeated runs of the notebook train the same model,
# consistent with the fixed seed used for the train/test split.
clf = RandomForestClassifier(random_state=42)
# Fit on the training portion only; the test rows stay unseen for evaluation.
clf.fit(X_train, y_train)

## 4. Evaluate Metrics
Use edaflow to visualize and evaluate classification metrics.

In [None]:
# Predict labels for the held-out test rows with the fitted classifier.
y_pred = clf.predict(X_test)
# Compare true vs. predicted labels via edaflow's ML helpers.
# NOTE(review): assumes the installed edaflow exposes
# `ml.plot_confusion_matrix` accepting (y_true, y_pred) positionally and that
# `edaflow.ml` is reachable from the top-level import — confirm against the
# installed version.
eda.ml.plot_confusion_matrix(y_test, y_pred)

## 5. Visualize Results
Show feature importance.

In [None]:
# Pass the fitted classifier together with the feature column labels to
# edaflow's feature-importance plot.
# NOTE(review): assumes `ml.plot_feature_importance(model, feature_names)`
# is the signature in the installed edaflow version — confirm.
eda.ml.plot_feature_importance(clf, X.columns)