# Register Best Model in MLFlow Model Registry

In [1]:
# Enable IPython's autoreload extension so that edits to imported modules are
# picked up without restarting the kernel.
%load_ext autoreload
%autoreload 2

::: {.content-hidden}
Import necessary Python modules
:::

In [2]:
import json
import os
import sys
from glob import glob

import mlflow.sklearn
import pandas as pd
from mlflow import MlflowClient

::: {.content-hidden}
Get relative path to project root directory
:::

In [3]:
# The project root is taken to be the parent of the current working directory
# (a relative path, so it resolves against wherever the notebook is run from).
PROJ_ROOT_DIR = os.pardir
src_dir = os.path.join(PROJ_ROOT_DIR, "src")
# Make the custom modules under src/ importable. The membership check keeps
# sys.path free of duplicate entries when this cell is re-run.
if src_dir not in sys.path:
    sys.path.append(src_dir)

::: {.content-hidden}
Import custom Python modules
:::

In [4]:
# Register the custom helper module with autoreload, then import it under a
# short alias used throughout the notebook.
%aimport model_helpers
import model_helpers as modh

## About

This step retrieves the best ML model across all the MLFlow experiment runs that were tracked during ML development. This best model is then registered in the MLFlow Model Registry.

## User Inputs

Define the primary ML scoring metric

In [5]:
#| echo: true
# Name of the scoring metric; the column named "test_<metric>" is what gets
# passed to the best-run lookup and reported as the evaluation score below.
primary_metric = "fbeta2"

::: {.content-hidden}
Get path to data sub-folders
:::

In [6]:
# Data folders are located relative to the project root: <root>/data and
# <root>/data/raw.
data_dir = os.path.join(PROJ_ROOT_DIR, "data")
raw_data_dir = os.path.join(data_dir, "raw")

::: {.content-hidden}
Define MLFlow storage paths
:::

In [7]:
# Use a SQLite database file in the raw data folder as the MLFlow tracking store.
# NOTE(review): the file path is relative, so the resulting URI resolves
# against the current working directory.
mlruns_db_fpath = f"{raw_data_dir}/mlruns.db"
mlflow.set_tracking_uri(f"sqlite:///{mlruns_db_fpath}")

::: {.content-hidden}
Set environment variable to silence MLFlow `git` warning message
:::

In [8]:
# "quiet" suppresses the warning about the git executable; presumably this is
# read by GitPython, which MLFlow uses under the hood (TODO confirm).
os.environ["GIT_PYTHON_REFRESH"] = "quiet"

## Manage ML Experiments

### Inspect Experiment Run Outputs

Get all runs of all experiments

In [9]:
#| echo: true
# Collect the tracked experiment runs into a single DataFrame via the project
# helper (the retrieval logic itself lives in model_helpers).
df_expt_runs = modh.get_all_experiment_runs()

2023/07/10 18:58:19 INFO mlflow.store.db.utils: Creating initial MLflow database tables...
2023/07/10 18:58:19 INFO mlflow.store.db.utils: Updating database tables
INFO  [alembic.runtime.migration] Context impl SQLiteImpl.
INFO  [alembic.runtime.migration] Will assume non-transactional DDL.
INFO  [alembic.runtime.migration] Context impl SQLiteImpl.
INFO  [alembic.runtime.migration] Will assume non-transactional DDL.


In [10]:
#| output: false
# Temporarily lift the column-display limit so no column is elided, and leave
# out the "params" and "column_names" columns from the displayed table.
with pd.option_context("display.max_columns", None):
    display(df_expt_runs.drop(columns=["params", "column_names"]))

Unnamed: 0,resampling_approach,clf,param_clf__a,param_clf__b,param_preprocessor__cat__rarecats__fe__ignore_format,param_preprocessor__cat__rarecats__fe__n_categories,param_preprocessor__cat__rarecats__fe__replace_with,param_preprocessor__cat__rarecats__fe__tol,param_resampler__sampling_strategy,param_select__threshold,test_accuracy,test_balanced_accuracy,test_precision,test_recall,test_roc_auc,test_f1,test_fbeta05,test_fbeta2,test_pr_auc,test_avg_precision,fit_time,score_time,experiment_run_type,train_val_accuracy,train_val_balanced_accuracy,train_val_precision,train_val_recall,train_val_roc_auc,train_val_f1,train_val_fbeta05,train_val_fbeta2,train_val_pr_auc,train_val_avg_precision,train_start_date,test_end_date,num_observations,num_columns,experiment_id,run_id
0,os,BetaDistClassifier,0.2,2.31,True,1,other,0.1,0.1,0.7,0.937904,0.501539,0.501726,0.501539,0.501539,0.501568,0.501646,0.501536,0.035103,0.034205,0.809488,0.123062,nested,,,,,,,,,,,20160901,20170228,113728,29,1,f805253a6ba64ee6a41bf14310ef16a4
1,os,BetaDistClassifier,0.2,2.25,True,1,other,0.1,0.1,0.7,0.935732,0.497742,0.497604,0.497742,0.497742,0.497659,0.497622,0.497705,0.034681,0.033965,0.805559,0.12235,nested,,,,,,,,,,,20160901,20170228,113728,29,1,f805253a6ba64ee6a41bf14310ef16a4
2,os,BetaDistClassifier,0.2,2.35,True,1,other,0.1,0.1,0.7,0.938707,0.499282,0.499163,0.499282,0.499282,0.499125,0.499121,0.499198,0.032796,0.034049,0.805286,0.121149,nested,,,,,,,,,,,20160901,20170228,113728,29,1,f805253a6ba64ee6a41bf14310ef16a4
3,os,BetaDistClassifier,0.2,2.4,True,1,other,0.1,0.1,0.7,0.940549,0.504244,0.505168,0.504244,0.504244,0.504495,0.50484,0.504301,0.035744,0.034455,0.803107,0.122443,nested,,,,,,,,,,,20160901,20170228,113728,29,1,f805253a6ba64ee6a41bf14310ef16a4
4,os,BetaDistClassifier,0.2,2.5,True,1,other,0.1,0.1,0.7,0.942532,0.499926,0.4999,0.499926,0.499926,0.499561,0.499658,0.499713,0.032515,0.034089,0.801959,0.121958,nested,,,,,,,,,,,20160901,20170228,113728,29,1,f805253a6ba64ee6a41bf14310ef16a4
5,os,BetaDistClassifier,0.3,2.31,True,1,other,0.1,0.1,0.7,0.919866,0.498214,0.498741,0.498214,0.498214,0.497814,0.498251,0.497846,0.034976,0.033984,0.803779,0.122666,nested,,,,,,,,,,,20160901,20170228,113728,29,1,f805253a6ba64ee6a41bf14310ef16a4
6,os,BetaDistClassifier,0.3,2.25,True,1,other,0.1,0.1,0.7,0.91741,0.498947,0.499295,0.498947,0.498947,0.498194,0.498695,0.498343,0.033065,0.034027,0.81925,0.122459,nested,,,,,,,,,,,20160901,20170228,113728,29,1,f805253a6ba64ee6a41bf14310ef16a4
7,os,BetaDistClassifier,0.3,2.35,True,1,other,0.1,0.1,0.7,0.921471,0.499713,0.499792,0.499713,0.499713,0.499173,0.499437,0.499319,0.035574,0.034075,0.802816,0.122655,nested,,,,,,,,,,,20160901,20170228,113728,29,1,f805253a6ba64ee6a41bf14310ef16a4
8,os,BetaDistClassifier,0.3,2.4,True,1,other,0.1,0.1,0.7,0.925296,0.509042,0.506949,0.509042,0.509042,0.50747,0.507056,0.508258,0.034781,0.034921,0.802461,0.12219,nested,,,,,,,,,,,20160901,20170228,113728,29,1,f805253a6ba64ee6a41bf14310ef16a4
9,os,BetaDistClassifier,0.3,2.5,True,1,other,0.1,0.1,0.7,0.92728,0.497375,0.497806,0.497375,0.497375,0.497442,0.497629,0.49736,0.034528,0.033942,0.802324,0.122535,nested,,,,,,,,,,,20160901,20170228,113728,29,1,f805253a6ba64ee6a41bf14310ef16a4


### Get Outputs of Best Experiment Run

In [11]:
#| echo: true
# Restrict the candidates to runs of type 'parent' and select the best one
# using the test-split column of the primary metric.
# NOTE(review): how "best" is decided (presumably the highest score) is
# implemented in model_helpers — confirm there.
df_best_expt_run = modh.get_best_experiment_run(
    df_expt_runs, "experiment_run_type == 'parent'", f"test_{primary_metric}"
)

In [12]:
#| output: false
# The best run is held as a Series; convert it to a single-row frame so it is
# rendered as a wide table with every column visible.
with pd.option_context("display.max_columns", None):
    display(df_best_expt_run.to_frame().T)

Unnamed: 0,resampling_approach,clf,param_clf__a,param_clf__b,param_preprocessor__cat__rarecats__fe__ignore_format,param_preprocessor__cat__rarecats__fe__n_categories,param_preprocessor__cat__rarecats__fe__replace_with,param_preprocessor__cat__rarecats__fe__tol,param_resampler__sampling_strategy,param_select__threshold,params,test_accuracy,test_balanced_accuracy,test_precision,test_recall,test_roc_auc,test_f1,test_fbeta05,test_fbeta2,test_pr_auc,test_avg_precision,fit_time,score_time,experiment_run_type,train_val_accuracy,train_val_balanced_accuracy,train_val_precision,train_val_recall,train_val_roc_auc,train_val_f1,train_val_fbeta05,train_val_fbeta2,train_val_pr_auc,train_val_avg_precision,train_start_date,test_end_date,num_observations,num_columns,column_names,experiment_id,run_id
30,os,BetaDistClassifier,0.3,2.4,True,1,other,0.1,0.1,0.7,"{""clf__a"": 0.3, ""clf__b"": 2.4, ""preprocessor__...",0.936669,0.499338,0.022353,0.499338,0.499338,0.498082,0.498804,0.498315,0.023243,0.023032,,,parent,0.915096,0.49881,0.041504,0.49881,0.49881,0.498821,0.498832,0.498814,0.043402,0.043624,20160901,20170228,113728,29,"[""fullvisitorid"", ""visitId"", ""visitNumber"", ""v...",1,f805253a6ba64ee6a41bf14310ef16a4


### Get Parameters Associated With Best Experiment Run

For the best-performing run, get the metadata and metrics (covering all available data) and the experiment run ID

1. features
   - list of column names
2. metrics
   - primary metric score on the test split, during ML evaluation
3. run ID
   - MLFlow experiment run ID

In [13]:
#| echo: true
# MLFlow run ID of the best experiment run
best_run_id = df_best_expt_run["run_id"]
# Primary metric score on the test split
best_model_eval_score = df_best_expt_run[f"test_{primary_metric}"]
# Column names are stored as a JSON-encoded string; decode them into a list
cols_best_expt_run = json.loads(df_best_expt_run["column_names"])

In [14]:
#| output: false
# Print the evaluation score, then show the decoded column names as the
# cell's output value.
print(best_model_eval_score)
cols_best_expt_run

0.49831454715525647


['fullvisitorid',
 'visitId',
 'visitNumber',
 'visitStartTime',
 'quarter',
 'month',
 'day_of_month',
 'day_of_week',
 'hour',
 'minute',
 'second',
 'source',
 'medium',
 'channelGrouping',
 'hits',
 'bounces',
 'last_action',
 'promos_displayed',
 'promos_clicked',
 'product_views',
 'product_clicks',
 'pageviews',
 'time_on_site',
 'browser',
 'os',
 'deviceCategory',
 'added_to_cart',
 'revenue',
 'made_purchase_on_future_visit']

### Get Name of Logged Model Associated with Best Experiment Run

Get name of model associated with best run

In [15]:
#| echo: true
# Look up the registered model whose run ID matches the best experiment run.
df_best_run_model = modh.get_single_registered_model(f"run_id == '{best_run_id}'")
# squeeze() collapses the result so the name can be read by label; this assumes
# the lookup returned exactly one row (TODO confirm in model_helpers).
best_run_model_name = df_best_run_model.squeeze()["name"]

2023/07/10 18:58:20 INFO mlflow.store.db.utils: Creating initial MLflow database tables...
2023/07/10 18:58:20 INFO mlflow.store.db.utils: Updating database tables
INFO  [alembic.runtime.migration] Context impl SQLiteImpl.
INFO  [alembic.runtime.migration] Will assume non-transactional DDL.


In [16]:
#| output: false
# Show the registered-model record without truncating long cell values (the
# model name and artifact source are long strings), then print the model name.
with pd.option_context("display.max_colwidth", None):
    display(df_best_run_model)
print(best_run_model_name)

Unnamed: 0,name,run_id,description,source,version,status
0,BetaDistClassifier_20160901_20170228_133892_feats__20230710_184102,f805253a6ba64ee6a41bf14310ef16a4,Best BetaDistClassifier model with fbeta2 score of 0.4983145472,/home/jovyan/notebooks/mlruns/f805253a6ba64ee6a41bf14310ef16a4/artifacts/model,1,READY


BetaDistClassifier_20160901_20170228_133892_feats__20230710_184102


### Load Best Deployment Candidate Model from Model Registry

In [17]:
# Build a Model Registry URI that points at the latest version registered
# under the best run's model name, and load it as a scikit-learn model.
best_model_uri = f"models:/{best_run_model_name}/latest"
model = mlflow.sklearn.load_model(model_uri=best_model_uri)

In [18]:
# Display the loaded model object as the cell output for a visual check.
model

### Add MLFlow Model Associated with Best Experiment Run to Model Registry

Create a new version of the registered model, tagged as a deployment candidate

In [19]:
#| echo: true
# Use a client bound to the tracking store that is currently configured.
client = MlflowClient(tracking_uri=mlflow.get_tracking_uri())
# Register a new version under the best run's model name and tag it as a
# deployment candidate.
# NOTE(review): `source` is a relative path, so it depends on the working
# directory the notebook is run from — confirm this is intended.
result = client.create_model_version(
    name=best_run_model_name,
    source=f"mlruns/{best_run_id}/artifacts/model",
    run_id=best_run_id,
    tags={"deployment-candidate": "yes"},
    description=(
        f"Best Model based on {primary_metric} "
        f"score of {best_model_eval_score:.10f}"
    ),
    # None: return without waiting for the version to finish being created
    await_creation_for=None,
)

## Next Step

The registered model will be used during downstream steps such as inference to make predictions for first-time visitors to the store during the production period (following the end of the test data split).