# eCommerce ML Use Case – Conversion Prediction

Eine Conversion liegt vor, wenn mindestens eine Bestellung getätigt wurde (`NumOrders > 0`).

## 1. Daten laden

In [None]:

import pandas as pd

# Read the eCommerce data set; the relative path is resolved against the
# current working directory of the notebook kernel.
df = pd.read_csv(filepath_or_buffer="Data_eCommerce.csv")

# Preview the first five rows (five is the default of DataFrame.head).
df.head(n=5)


## 2. Datenüberblick

In [None]:

# Print column names, non-null counts, dtypes and memory usage to stdout.
df.info()
# Summary statistics; as the last expression of the cell the resulting table is
# what the notebook renders. By default only numeric columns are summarised.
df.describe()


## 3. Zielvariable definieren
Conversion = 1, wenn `NumOrders > 0`, sonst 0. Als Merkmale dienen alle übrigen numerischen Spalten.

In [None]:

# Column from which the binary conversion label is derived.
target = "NumOrders"

# Only numeric columns are considered as candidate features.
numeric_df = df.select_dtypes(include=["number"])

# Features: every numeric column except the raw order count itself.
# NOTE(review): any remaining column that is derived from orders (e.g. an
# order value) would leak the label - confirm against the data set's schema.
X = numeric_df.drop(columns=target)

# Label: 1 where NumOrders is greater than zero, otherwise 0.
# NOTE(review): a missing NumOrders (NaN) compares as False and therefore ends
# up as 0 - confirm that this is the intended treatment.
y = df[target].gt(0).astype(int)

# Class balance of the label.
y.value_counts()


## 4. Modell: Random Forest

In [None]:

from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import classification_report, roc_auc_score

# Hold out 20 % of the rows for evaluation. Stratifying on y keeps the class
# ratio the same in both partitions; the fixed seed makes the split repeatable.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    stratify=y,
    random_state=42,
)

# 200 trees, fixed seed, n_jobs=-1 to use all available CPU cores.
# fit() returns the estimator itself, so `model` is the fitted forest.
model = RandomForestClassifier(
    n_jobs=-1,
    random_state=42,
    n_estimators=200,
).fit(X_train, y_train)

# predict_proba orders its columns like model.classes_ (sorted labels), so with
# labels 0/1 column 1 holds the predicted probability of a conversion.
y_proba = model.predict_proba(X_test)[:, 1]
y_pred = model.predict(X_test)

# Per-class precision / recall / F1 on the hold-out set, followed by the
# threshold-independent ROC-AUC computed from the predicted probabilities.
print(classification_report(y_test, y_pred))
print("ROC-AUC:", roc_auc_score(y_test, y_proba))


## 5. Fazit
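Random Forest ist robust (z. B. gegenüber Ausreißern und unskalierten Merkmalen), über Feature Importances in Grenzen erklärbar und gut geeignet für strukturierte, tabellarische eCommerce-Daten.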