In [2]:
import pandas as pd
import os.path
import logging

# read the Kaggle CSV (path is relative to the notebook's working directory) into a DataFrame
df = pd.read_csv(filepath_or_buffer='data/KaggleV2-May-2016.csv')

In [10]:
# function for creating a log-file which we'll write into
def get_logger(path, file):
    '''
    [Returns the root logger configured to also write into a log file]

    The directory of the log file is created when it is missing, and the
    file handler is attached only once per log file, so calling this
    function repeatedly (e.g. re-running a notebook cell) does not
    duplicate every record in the file.

    Args:
        path {string} -- dir path
        file {string} -- file name
    Returns:
        [obj] -- [logger]
    '''
    log_file = os.path.join(path, file)

    # make sure the target directory exists; FileHandler creates the file
    # itself but fails when the directory is missing
    log_dir = os.path.dirname(log_file)
    if log_dir:
        os.makedirs(log_dir, exist_ok=True)

    # changing the logging format
    file_logging_format = "%(levelname)s: %(asctime)s: %(message)s"

    # config the root logger (no-op when the root logger already has handlers)
    logging.basicConfig(
        level=logging.INFO,
        format=file_logging_format)
    logger = logging.getLogger()

    # FileHandler stores the absolute path in baseFilename, so compare against
    # the absolute form to detect a handler left over from a previous call
    target = os.path.abspath(log_file)
    for existing in logger.handlers:
        if isinstance(existing, logging.FileHandler) and existing.baseFilename == target:
            return logger

    # creating handler for recording logs into the file
    handler = logging.FileHandler(log_file)

    # setting the logging level
    handler.setLevel(logging.INFO)

    # creating the logging format
    handler.setFormatter(logging.Formatter(file_logging_format))

    # add handler to the logger
    logger.addHandler(handler)

    return logger

In [11]:
# create log file
logger = get_logger(path="logs/", file="data.logs")
logger.info("Data")
logger.info("Data shape {}".format(df.shape))

# Gender distribution among rows where 'No-show' == 'Yes', computed once.
# Values are looked up by label instead of by position: integer keys on a
# label-indexed Series are deprecated in pandas 2.x, and positional access
# silently depends on which gender happens to be more frequent.
# NOTE(review): assumes Gender is coded 'F'/'M' — confirm against the CSV.
# The values are fractions in [0, 1]; the message text is kept as-is.
no_show_gender_share = df.loc[df['No-show'] == 'Yes', 'Gender'].value_counts(normalize=True)
logger.info("Percentage of women: {}".format(no_show_gender_share['F']))
logger.info("Percentage of men: {}".format(no_show_gender_share['M']))

INFO: 2024-06-14 12:44:45,303: Data
INFO: 2024-06-14 12:44:45,304: Data shape (110527, 14)
INFO: 2024-06-14 12:44:45,321: Percentage of women: 0.653882342398853
INFO: 2024-06-14 12:44:45,336: Percentage of men: 0.346117657601147


In [12]:
# sanity-check the dataset dimensions and log an error on mismatch
# NOTE(review): the shape logged above is (110527, 14), so this check fires —
# confirm whether the expected row count here is intentional
if not (df.shape == (110526, 14)):
    logger.error('Data shape is incorrect!')

ERROR: 2024-06-14 12:45:34,584: Data shape is incorrect!


## Creating an experiment with Comet.ml

In [13]:
from comet_ml import Experiment
from dotenv import load_dotenv
from os import getenv
# load variables from a local .env file (if present) into the process
# environment, so the credentials never appear in the notebook itself
load_dotenv()

# start a Comet experiment; the API key and workspace come from the environment
experiment = Experiment(
    workspace=getenv('WORKSPACE_NAME'),
    project_name='medical-appointment',
    api_key=getenv('COMET_API_KEY'),
)

# nothing is tracked in this cell, so close the experiment right away
experiment.end()

COMET INFO: Experiment is live on comet.com https://www.comet.com/gettergit/medical-appointment/0a0e753193c04fcda1bdd591a035f04b



![comet_methods](images/comet_methods.png)