# 1. 데이터셋 로드

In [2]:
import mlflow
import mlflow.sklearn
from sklearn.datasets import fetch_california_housing
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression
from sklearn.metrics import mean_squared_error

# Load the California housing dataset and pull out the feature matrix
# and the regression target.
california = fetch_california_housing()
X = california.data
y = california.target

# Hold out 20% of the rows as a test set; the fixed seed keeps the split
# reproducible across runs.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=42,
)

# 2. 실험

In [3]:
# Train a linear-regression baseline and record it as one MLflow run.
#
# The run is opened with a context manager rather than a manual
# start_run()/end_run() pair: if fitting, prediction, or logging raises,
# the run is still closed on exit from the `with` block instead of being
# left active (which would make re-running this cell fail because a run
# is already in progress).
with mlflow.start_run():
    # Fit the model on the training split.
    model = LinearRegression()
    model.fit(X_train, y_train)

    # Predict on the held-out split and compute the mean squared error.
    predictions = model.predict(X_test)
    mse = mean_squared_error(y_test, predictions)

    # Record the model type as a parameter and the MSE as a metric.
    mlflow.log_param("model_type", "linear_regression")
    mlflow.log_metric("mse", mse)

    # Store the fitted estimator as a run artifact under "model".
    mlflow.sklearn.log_model(model, "model")