In [1]:
import mlflow
import mlflow.sklearn
from sklearn.datasets import load_iris
from sklearn.model_selection import train_test_split
from sklearn.tree import DecisionTreeClassifier
from sklearn.metrics import accuracy_score

In [2]:
# Load the Iris dataset and pull out the feature matrix and target labels.
data = load_iris()
X, y = data.data, data.target

In [3]:
# Hold out a test set; the fixed seed makes the split reproducible.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.25,  # scikit-learn's default when neither size is given
    random_state=42,
)

In [4]:
# Point MLflow at the tracking server and select the experiment
# (set_experiment creates it if it does not exist yet).
mlflow.set_tracking_uri("http://mlflow:5000")
mlflow.set_experiment("Iris_Classifier")

with mlflow.start_run():
    # Train the model
    clf = DecisionTreeClassifier(max_depth=3, random_state=42)
    clf.fit(X_train, y_train)

    # Evaluate on the held-out test split
    y_pred = clf.predict(X_test)
    acc = accuracy_score(y_test, y_pred)

    # Log the parameter, the metric and the fitted model.
    # max_depth is read back from the estimator rather than repeated as a
    # literal, so the logged value cannot drift from what was actually trained.
    mlflow.log_param("max_depth", clf.max_depth)
    mlflow.log_metric("accuracy", acc)
    mlflow.sklearn.log_model(clf, "model")

    print(f"Accuracy: {acc}")
    print("Modelo guardado en MLflow.")



Accuracy: 1.0
Modelo guardado en MLflow.
🏃 View run tasteful-steed-542 at: http://mlflow:5000/#/experiments/1/runs/0f3efbdb4573489bb4d5191312307fd4
🧪 View experiment at: http://mlflow:5000/#/experiments/1


In [5]:
import pyspark