# 1. Get the dataset

In [1]:
import pandas as pd
from sklearn.datasets import load_iris

# Load the iris bunch and assemble features plus label into a single frame.
data = load_iris()
df = pd.DataFrame(data.data, columns=data.feature_names).assign(target=data.target)

# Feature matrix (every column except the label) and the label series.
x = df.drop(columns="target")
y = df["target"]

# 2. Run auto transformations

In [None]:
from cross import CrossTransformer

problem_type = "classification"

# Ask a default-constructed CrossTransformer to propose transformations for x / y.
# NOTE(review): presumably the return value is the set of transformations chosen
# for this data -- confirm against the `cross` documentation.
transformations = CrossTransformer().auto_transform(x, y, problem_type)

# Build the transformer that is actually used downstream from that proposal.
transformer = CrossTransformer(transformations)

# 3. Define the pipeline

In [3]:
from sklearn.ensemble import RandomForestClassifier
from sklearn.neighbors import KNeighborsClassifier
from sklearn.pipeline import Pipeline

# Classifier created with its default constructor arguments.
model = KNeighborsClassifier()

# Two-step pipeline: step 't' is the transformer, step 'm' is the classifier.
pipe = Pipeline(
    steps=[
        ("t", transformer),
        ("m", model),
    ]
)

# 4. Evaluate

In [None]:
from numpy import mean, std
from sklearn.model_selection import cross_val_score
from sklearn.model_selection import RepeatedStratifiedKFold

# 10 stratified folds repeated 3 times; the fixed seed keeps the splits reproducible.
cv = RepeatedStratifiedKFold(
    n_splits=10,
    n_repeats=3,
    random_state=1,
)

# Accuracy of the whole pipeline on each split.
# NOTE(review): `transformer` was configured from transformations chosen on the
# full x / y in an earlier cell, so these scores may be optimistic -- confirm
# whether that selection should happen inside each CV fold instead.
scores = cross_val_score(
    pipe,
    x,
    y,
    scoring="accuracy",
    cv=cv,
    n_jobs=-1,
)

# Mean accuracy, with the standard deviation across splits in parentheses.
print(f"{mean(scores):.3f} ({std(scores):.3f})")