In [3]:
import logging
import pandas as pd
from IPython.display import display, Image

# Notebook-wide settings: root logger at INFO, no truncation of column text,
# and up to 4000 rows rendered when a dataframe is displayed.
logging.getLogger().setLevel(logging.INFO)
pd.options.display.max_colwidth = None
pd.set_option("display.max_rows", 4000)


In [7]:
import os
from pathlib import Path
# Project root = parent of the directory the kernel is currently running in.
PROJECT_ROOT_DIR = Path.cwd().parent

In [2]:
import os
import sys
import mlflow

# Name of the MLflow experiment that mlflow_connect() selects via mlflow.set_experiment().
MLFLOW_EXPERIMENT_NAME = "Spam Detection"

def mlflow_connect(
    tracking_uri: str = "http://localhost:5000",
) -> mlflow.entities.experiment.Experiment:
    """Point MLflow at the tracking server and select the notebook's experiment.

    The server is probed over HTTP first so that a missing or unhealthy server
    produces a readable hint instead of a failure inside the MLflow client.

    Relies on ``MLFLOW_EXPERIMENT_NAME``, ``PROJECT_ROOT_DIR``, ``display`` and
    ``Image`` being defined by other cells of this notebook.

    Args:
        tracking_uri: Base URL of the MLflow tracking server. Defaults to the
            local address this notebook has always used.

    Returns:
        The experiment returned by ``mlflow.set_experiment(MLFLOW_EXPERIMENT_NAME)``.

    Raises:
        SystemExit: With exit code 1 when the server cannot be reached within
            one second or answers with an HTTP error status.
    """
    # Kept as a function-local import, as in the original cell.
    import requests

    # Normalise so the messages below never show a doubled slash.
    tracking_uri = tracking_uri.rstrip("/")

    try:
        probe = requests.get(tracking_uri, timeout=1)
        # Something other than MLflow may be listening on the port; a 4xx/5xx
        # answer must not be reported as a healthy server. HTTPError is a
        # RequestException, so it is handled by the branch below.
        probe.raise_for_status()
    except requests.exceptions.RequestException:
        print(f"MLflow server is not running. Please run '{PROJECT_ROOT_DIR}/start_mlflow_native.sh' in a terminal.", file=sys.stderr)
        print(f"Once MLflow is running, make sure you open {tracking_uri}/ in a browser.", file=sys.stderr)
        help_image = f"{PROJECT_ROOT_DIR}/course_helpers/images/mlflow_open_port.png"
        # The screenshot is only a nicety: if it is missing, still exit cleanly
        # rather than surfacing an unrelated FileNotFoundError.
        if os.path.isfile(help_image):
            display(Image(filename=help_image, width=300))
        sys.exit(1)

    # Only the reachability probe is guarded above; MLflow calls run outside the
    # try block so their own errors are not misreported as "server not running".
    print(f"OK - mlflow server is up and running. Setting Tracking URI to {tracking_uri}. Setting Experiment to '{MLFLOW_EXPERIMENT_NAME}'")
    mlflow.set_tracking_uri(tracking_uri)
    return mlflow.set_experiment(MLFLOW_EXPERIMENT_NAME)


In [6]:
"""
Dataset: http://archive.ics.uci.edu/dataset/380/youtube+spam+collection
"""

from pathlib import Path

import pandas as pd

# The CSV is looked up one level above the current working directory, in data/.
spam_data_file = Path.cwd().parent.joinpath("data", "comments.csv")

if spam_data_file.exists():
    # NOTE(review): the recorded output shows an "Unnamed: 0" column, which
    # suggests the CSV carries a saved index. Consider index_col=0 once it is
    # confirmed that no later cell relies on that column.
    df = pd.read_csv(spam_data_file)
else:
    # Without the dataset nothing below can run, so log and stop the cell.
    logging.error(f"Can't find {spam_data_file}")
    raise SystemExit(1)

print(f"Loaded {len(df)} rows from {spam_data_file}")
print("First ten rows of the dataframe `df`:")
display(df.head(n=10))


Loaded 1565 rows from /workspaces/mlops-course/data/comments.csv
First ten rows of the dataframe `df`:


Unnamed: 0,content,is_spam
0,Best Music Ever!!!﻿,0
1,please look up DHG SONGS this is my playlist with a bunch of amazing songs ﻿,1
2,just :( superr!!!﻿,0
3,Check out this playlist on YouTube:﻿,1
4,subscribed :) btw you have a good style keep it up brother :)),1
5,she is horrible at acting. cringe-worhty.﻿,0
6,https://m.facebook.com/story.php?story_fbid=764484966942313&amp;id=754989901225153&amp;ref=stream gf﻿,1
7,WOw,0
8,I loved this song when I was in my teenage years!﻿,0
9,Where did she find all that make up in a freakin jungle?!﻿,0
