## Scenario 1: A single data scientist participating in an ML competition

MLflow setup:
* Tracking server: no
* Backend store: local filesystem
* Artifacts store: local filesystem

The experiments can be explored locally by launching the MLflow UI.

In [1]:
import mlflow

In [2]:
print(f"tracking URI: '{mlflow.get_tracking_uri()}'")

tracking URI: 'file:///D:/Learning/09.%20mlops/00.%20Zoomcamp/mlops-zoomcamp/02_Week_2/running-mlflow-examples/mlruns'


In [4]:
mlflow.list_experiments()

AttributeError: module 'mlflow' has no attribute 'list_experiments'

In [5]:
# Fetch the list of experiments
experiments = mlflow.search_experiments()

# Print out the experiment details
for exp in experiments:
    print(f"Experiment Name: {exp.name}")
    print(f"Experiment ID: {exp.experiment_id}")
    print(f"Lifecycle Stage: {exp.lifecycle_stage}")
    print("-" * 20)

Experiment Name: Default
Experiment ID: 0
Lifecycle Stage: active
--------------------


### Creating an experiment and logging a new run

In [6]:
from sklearn.linear_model import LogisticRegression
from sklearn.datasets import load_iris
from sklearn.metrics import accuracy_score

mlflow.set_experiment("my-experiment-1")

with mlflow.start_run():

    X, y = load_iris(return_X_y=True)

    params = {"C": 0.1, "random_state": 42}
    mlflow.log_params(params)

    lr = LogisticRegression(**params).fit(X, y)
    y_pred = lr.predict(X)
    mlflow.log_metric("accuracy", accuracy_score(y, y_pred))

    mlflow.sklearn.log_model(lr, artifact_path="models")
    print(f"default artifacts URI: '{mlflow.get_artifact_uri()}'")

2024/05/24 16:12:00 INFO mlflow.tracking.fluent: Experiment with name 'my-experiment-1' does not exist. Creating a new experiment.


default artifacts URI: 'file:///D:/Learning/09.%20mlops/00.%20Zoomcamp/mlops-zoomcamp/02_Week_2/running-mlflow-examples/mlruns/889484265817659470/50c304af5c5e4a6fa51e91cd81ee2457/artifacts'


In [8]:
# Fetch the list of experiments
experiments = mlflow.search_experiments()

# Print out the experiment details
for exp in experiments:
    print(f"Experiment Name: {exp.name}")
    print(f"Experiment ID: {exp.experiment_id}")
    print(f"Lifecycle Stage: {exp.lifecycle_stage}")
    print("-" * 20)

Experiment Name: my-experiment-1
Experiment ID: 889484265817659470
Lifecycle Stage: active
--------------------
Experiment Name: Default
Experiment ID: 0
Lifecycle Stage: active
--------------------


In [9]:
experiments

[<Experiment: artifact_location='file:///D:/Learning/09.%20mlops/00.%20Zoomcamp/mlops-zoomcamp/02_Week_2/running-mlflow-examples/mlruns/889484265817659470', creation_time=1716559920929, experiment_id='889484265817659470', last_update_time=1716559920929, lifecycle_stage='active', name='my-experiment-1', tags={}>,
 <Experiment: artifact_location='file:///D:/Learning/09.%20mlops/00.%20Zoomcamp/mlops-zoomcamp/02_Week_2/running-mlflow-examples/mlruns/0', creation_time=1716559828472, experiment_id='0', last_update_time=1716559828472, lifecycle_stage='active', name='Default', tags={}>]

### Interacting with the model registry

In [10]:
from mlflow.tracking import MlflowClient

client = MlflowClient()

In [12]:
from mlflow.exceptions import MlflowException

try:
    client.search_registered_models()
except MlflowException:
    print("It's not possible to access the model registry :(")

In [13]:
client.search_registered_models()

[]