# PyCaret 2 Anomaly Example
This notebook is created using PyCaret 2.0. Last updated : 28-07-2020

In [1]:
# check version
from pycaret.utils import version
version()

pycaret-nightly-0.39


# 1. Loading Dataset

In [2]:
from pycaret.datasets import get_data
data = get_data('anomaly')

Unnamed: 0,Col1,Col2,Col3,Col4,Col5,Col6,Col7,Col8,Col9,Col10
0,0.263995,0.764929,0.138424,0.935242,0.605867,0.51879,0.912225,0.608234,0.723782,0.733591
1,0.546092,0.653975,0.065575,0.227772,0.845269,0.837066,0.272379,0.331679,0.429297,0.367422
2,0.336714,0.538842,0.192801,0.553563,0.074515,0.332993,0.365792,0.861309,0.899017,0.0886
3,0.092108,0.995017,0.014465,0.176371,0.24153,0.514724,0.562208,0.158963,0.073715,0.208463
4,0.325261,0.805968,0.957033,0.331665,0.307923,0.355315,0.501899,0.558449,0.885169,0.182754


# 2. Initialize Setup

In [3]:
from pycaret.anomaly import *
ano1 = setup(data, session_id=123, log_experiment=True, experiment_name='anomaly1')

Setup Succesfully Completed!


Unnamed: 0,Description,Value
0,session_id,123
1,Original Data,"(1000, 10)"
2,Missing Values,False
3,Numeric Features,10
4,Categorical Features,0
5,Ordinal Features,False
6,High Cardinality Features,False
7,Transformed Data,"(1000, 10)"
8,Numeric Imputer,mean
9,Categorical Imputer,constant


# 3. Create Model

In [4]:
models()

Unnamed: 0_level_0,Name,Reference
ID,Unnamed: 1_level_1,Unnamed: 2_level_1
abod,Angle-base Outlier Detection,pyod.models.abod.ABOD
iforest,Isolation Forest,pyod.models.iforest
cluster,Clustering-Based Local Outlier,pyod.models.cblof
cof,Connectivity-Based Outlier Factor,pyod.models.cof
histogram,Histogram-based Outlier Detection,pyod.models.hbos
knn,k-Nearest Neighbors Detector,pyod.models.knn
lof,Local Outlier Factor,pyod.models.lof
svm,One-class SVM detector,pyod.models.ocsvm
pca,Principal Component Analysis,pyod.models.pca
mcd,Minimum Covariance Determinant,pyod.models.mcd


In [5]:
iforest = create_model('iforest')

In [6]:
knn = create_model('knn', fraction = 0.1)

# 4. Assign Labels

In [7]:
iforest_results = assign_model(iforest)
iforest_results.head()

Unnamed: 0,Col1,Col2,Col3,Col4,Col5,Col6,Col7,Col8,Col9,Col10,Label,Score
0,0.263995,0.764929,0.138424,0.935242,0.605867,0.51879,0.912225,0.608234,0.723782,0.733591,0,-0.035865
1,0.546092,0.653975,0.065575,0.227772,0.845269,0.837066,0.272379,0.331679,0.429297,0.367422,0,-0.084927
2,0.336714,0.538842,0.192801,0.553563,0.074515,0.332993,0.365792,0.861309,0.899017,0.0886,1,0.025356
3,0.092108,0.995017,0.014465,0.176371,0.24153,0.514724,0.562208,0.158963,0.073715,0.208463,1,0.042415
4,0.325261,0.805968,0.957033,0.331665,0.307923,0.355315,0.501899,0.558449,0.885169,0.182754,0,-0.023408


# 5. Analyze Model

In [8]:
plot_model(iforest)

In [9]:
plot_model(iforest, plot = 'umap')

# 6. Predict Model

In [10]:
pred_new = predict_model(iforest, data=data)
pred_new.head()

Unnamed: 0,Col1,Col2,Col3,Col4,Col5,Col6,Col7,Col8,Col9,Col10,Label,Score
0,0.263995,0.764929,0.138424,0.935242,0.605867,0.51879,0.912225,0.608234,0.723782,0.733591,0,-0.035865
1,0.546092,0.653975,0.065575,0.227772,0.845269,0.837066,0.272379,0.331679,0.429297,0.367422,0,-0.084927
2,0.336714,0.538842,0.192801,0.553563,0.074515,0.332993,0.365792,0.861309,0.899017,0.0886,1,0.025356
3,0.092108,0.995017,0.014465,0.176371,0.24153,0.514724,0.562208,0.158963,0.073715,0.208463,1,0.042415
4,0.325261,0.805968,0.957033,0.331665,0.307923,0.355315,0.501899,0.558449,0.885169,0.182754,0,-0.023408


# 7. Save / Load Model

In [11]:
save_model(iforest, model_name='iforest')

Transformation Pipeline and Model Succesfully Saved


In [12]:
loaded_iforest = load_model('iforest')
print(loaded_iforest)

Transformation Pipeline and Model Sucessfully Loaded
[Pipeline(memory=None,
         steps=[('dtypes',
                 DataTypes_Auto_infer(categorical_features=[],
                                      display_types=True, features_todrop=[],
                                      ml_usecase='regression',
                                      numerical_features=[],
                                      target='dummy_target',
                                      time_features=[])),
                ('imputer',
                 Simple_Imputer(categorical_strategy='not_available',
                                numeric_strategy='mean',
                                target_variable=None)),
                ('new_levels1',
                 New_Catagorical_L...
                                                    target='dummy_target')),
                ('feature_time',
                 Make_Time_Features(list_of_features=None, time_feature=[])),
                ('group', Empty()), ('scalin

In [13]:
from sklearn import set_config
set_config(display='diagram')
loaded_iforest[0]

In [14]:
from sklearn import set_config
set_config(display='text')

# 8. Deploy Model

In [15]:
deploy_model(iforest, model_name = 'iforest-aws', authentication = {'bucket' : 'pycaret-test'})

Model Succesfully Deployed on AWS S3


# 9. Get Config / Set Config

In [16]:
X = get_config('X')
X.head()

Unnamed: 0,Col1,Col2,Col3,Col4,Col5,Col6,Col7,Col8,Col9,Col10
0,0.263995,0.764929,0.138424,0.935242,0.605867,0.51879,0.912225,0.608234,0.723782,0.733591
1,0.546092,0.653975,0.065575,0.227772,0.845269,0.837066,0.272379,0.331679,0.429297,0.367422
2,0.336714,0.538842,0.192801,0.553563,0.074515,0.332993,0.365792,0.861309,0.899017,0.0886
3,0.092108,0.995017,0.014465,0.176371,0.24153,0.514724,0.562208,0.158963,0.073715,0.208463
4,0.325261,0.805968,0.957033,0.331665,0.307923,0.355315,0.501899,0.558449,0.885169,0.182754


In [17]:
get_config('seed')

123

In [18]:
from pycaret.anomaly import set_config
set_config('seed', 999)

In [19]:
get_config('seed')

999

# 10. Get System Logs

In [20]:
get_system_logs()

['2020-07-28 21', '03', '39,795', 'INFO', 'PyCaret Classification Module']
['2020-07-28 21', '03', '39,795', 'INFO', 'version pycaret-nightly-0.39']
['2020-07-28 21', '03', '39,796', 'INFO', 'Initializing setup()']
['2020-07-28 21', '03', '39,796', 'INFO', 'USI', '86aa']
['2020-07-28 21', '03', '39,796', 'INFO', 'setup(data=(1070, 19), target=Purchase, train_size=0.7, sampling=True, sample_estimator=None, categorical_features=None, categorical_imputation=constant, ordinal_features=None,']
['high_cardinality_features=None, high_cardinality_method=frequency, numeric_features=None, numeric_imputation=mean, date_features=None, ignore_features=None, normalize=False,']
['normalize_method=zscore, transformation=False, transformation_method=yeo-johnson, handle_unknown_categorical=True, unknown_categorical_method=least_frequent, pca=False, pca_method=linear,']
['pca_components=None, ignore_low_variance=False, combine_rare_levels=False, rare_level_threshold=0.1, bin_numeric_features=None, remove

["('new_levels1',"]
['New_Catagorical_...']
["('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),"]
["('P_transform', Empty()), ('pt_target', Empty()),"]
["('binn', Empty()), ('rem_outliers', Empty()),"]
["('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),"]
["('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),"]
["('feature_select', Empty()), ('fix_multi', Empty()),"]
["('dfs', Empty()), ('pca', Empty())],"]
['verbose=False), RidgeClassifier(alpha=1.0, class_weight=None, copy_X=True, fit_intercept=True,']
['max_iter=None, normalize=False, random_state=3844,']
["solver='auto', tol=0.001)]"]
['2020-07-28 21', '05', '55,432', 'INFO', 'save_model() succesfully completed......................................']
['2020-07-28 21', '05', '55,483', 'INFO', 'Initializing Random Forest Classifier']
['2020-07-28 21', '05', '55,485', 'INFO', 'Initializing Fold 1']
['2020-07-28 21', '05', '55,486', 'INFO', 'Fitting Model']
['2020-07-28 21', '05', '55,595', 'INF

['2020-07-28 21', '06', '35,624', 'INFO', 'Checking exceptions']
['2020-07-28 21', '06', '35,625', 'INFO', 'Preloading libraries']
['2020-07-28 21', '06', '35,625', 'INFO', 'Preparing display monitor']
['2020-07-28 21', '06', '35,632', 'INFO', 'Copying training dataset']
['2020-07-28 21', '06', '35,633', 'INFO', 'Importing libraries']
['2020-07-28 21', '06', '35,633', 'INFO', 'Defining folds']
['2020-07-28 21', '06', '35,633', 'INFO', 'Declaring metric variables']
['2020-07-28 21', '06', '35,633', 'INFO', 'Importing untrained model']
['2020-07-28 21', '06', '35,633', 'INFO', 'CatBoost Classifier Imported succesfully']
['2020-07-28 21', '06', '35,633', 'INFO', 'Checking ensemble method']
['2020-07-28 21', '06', '35,635', 'INFO', 'Initializing Fold 1']
['2020-07-28 21', '06', '35,636', 'INFO', 'Fitting Model']
['2020-07-28 21', '06', '37,886', 'INFO', 'Evaluating Metrics']
['2020-07-28 21', '06', '37,895', 'INFO', 'Compiling Metrics']
['2020-07-28 21', '06', '37,901', 'INFO', 'Initializi

['2020-07-28 21', '10', '32,616', 'INFO', 'Compiling Metrics']
['2020-07-28 21', '10', '32,626', 'INFO', 'Initializing Fold 5']
['2020-07-28 21', '10', '32,636', 'INFO', 'Fitting Model']
['2020-07-28 21', '10', '32,755', 'INFO', 'Evaluating Metrics']
['2020-07-28 21', '10', '33,005', 'INFO', 'Compiling Metrics']
['2020-07-28 21', '10', '33,015', 'INFO', 'Initializing Fold 6']
['2020-07-28 21', '10', '33,026', 'INFO', 'Fitting Model']
['2020-07-28 21', '10', '33,143', 'INFO', 'Evaluating Metrics']
['2020-07-28 21', '10', '33,382', 'INFO', 'Compiling Metrics']
['2020-07-28 21', '10', '33,386', 'INFO', 'Initializing Fold 7']
['2020-07-28 21', '10', '33,394', 'INFO', 'Fitting Model']
['2020-07-28 21', '10', '33,510', 'INFO', 'Evaluating Metrics']
['2020-07-28 21', '10', '33,762', 'INFO', 'Compiling Metrics']
['2020-07-28 21', '10', '33,771', 'INFO', 'Initializing Fold 8']
['2020-07-28 21', '10', '33,782', 'INFO', 'Fitting Model']
['2020-07-28 21', '10', '33,899', 'INFO', 'Evaluating Metric

['2020-07-28 21', '15', '14,260', 'INFO', 'Appending prep pipeline']
['2020-07-28 21', '15', '14,270', 'INFO', 'pycaret-clf-best.pkl saved in current working directory']
['2020-07-28 21', '15', '14,278', 'INFO', '[Pipeline(memory=None,']
["steps=[('dtypes',"]
['DataTypes_Auto_infer(categorical_features=[],']
['display_types=False, features_todrop=[],']
["ml_usecase='classification',"]
["numerical_features=[], target='default',"]
['time_features=[])),']
["('imputer',"]
["Simple_Imputer(categorical_strategy='not_available',"]
["numeric_strategy='mean',"]
['target_variable=None)),']
["('new_levels1',"]
['New_Catagorical_L...']
["('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),"]
["('P_transform', Empty()), ('pt_target', Empty()),"]
["('binn', Empty()), ('rem_outliers', Empty()),"]
["('cluster_all', Empty()), ('dummy', Dummify(target='default')),"]
["('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),"]
["('feature_select', Empty()), ('fix_multi', Empty()),"]
["

['2020-07-28 23', '36', '49,919', 'INFO', 'Checking libraries']
['2020-07-28 23', '36', '49,919', 'INFO', 'pd==1.0.4']
['2020-07-28 23', '36', '49,919', 'INFO', 'numpy==1.18.5']
['2020-07-28 23', '36', '50,108', 'INFO', 'nltk==3.5']
['2020-07-28 23', '36', '50,165', 'INFO', 'textblob==0.15.3']
['2020-07-28 23', '36', '50,337', 'INFO', 'pyLDAvis==2.1.2']
['2020-07-28 23', '36', '50,359', 'INFO', 'gensim==3.8.3']
['2020-07-28 23', '36', '50,451', 'INFO', 'wordcloud==1.7.0']
['2020-07-28 23', '36', '50,774', 'INFO', 'pyLDAvis==2.1.2']
['2020-07-28 23', '36', '50,881', 'INFO', 'wordcloud==1.7.0']
['2020-07-28 23', '36', '50,938', 'INFO', 'spacy==2.2.4']
['2020-07-28 23', '36', '51,111', 'INFO', 'mlflow==1.8.0']
['2020-07-28 23', '36', '51,112', 'INFO', 'Checking Exceptions']
['2020-07-28 23', '36', '51,114', 'INFO', 'gensim==3.8.3']
['2020-07-28 23', '36', '51,521', 'INFO', 'mlflow==1.8.0']
['2020-07-28 23', '36', '51,521', 'INFO', 'Checking Exceptions']
['2020-07-28 23', '36', '51,638', '

['2020-07-28 23', '45', '35,540', 'INFO', 'Copying training dataset']
['2020-07-28 23', '45', '35,541', 'INFO', 'Importing stopwords from nltk']
['2020-07-28 23', '45', '35,880', 'INFO', 'No custom stopwords defined']
['2020-07-28 23', '45', '35,880', 'INFO', 'Removing numeric characters from the text']
['2020-07-28 23', '45', '36,041', 'INFO', 'nltk==3.5']
['2020-07-28 23', '45', '36,097', 'INFO', 'textblob==0.15.3']
['2020-07-28 23', '45', '36,214', 'INFO', 'gensim==3.8.3']
['2020-07-28 23', '45', '36,230', 'INFO', 'Removing special characters from the text']
['2020-07-28 23', '45', '36,705', 'INFO', 'Tokenizing Words']
['2020-07-28 23', '45', '36,728', 'INFO', 'pyLDAvis==2.1.2']
['2020-07-28 23', '45', '36,793', 'INFO', 'spacy==2.2.4']
['2020-07-28 23', '45', '36,842', 'INFO', 'wordcloud==1.7.0']
['2020-07-28 23', '45', '37,510', 'INFO', 'mlflow==1.8.0']
['2020-07-28 23', '45', '37,510', 'INFO', 'Checking Exceptions']
['2020-07-28 23', '45', '37,524', 'INFO', 'nltk==3.5']
['2020-07-

['2020-07-28 23', '56', '47,476', 'INFO', 'Extracting Trigrams']
['2020-07-28 23', '56', '52,540', 'INFO', 'Extracting Trigrams']
['2020-07-28 23', '56', '53,866', 'INFO', 'Extracting Trigrams']
['2020-07-28 23', '57', '05,923', 'INFO', 'Lemmatizing tokens']
['2020-07-28 23', '57', '06,816', 'INFO', 'Lemmatizing tokens']
['2020-07-28 23', '57', '13,409', 'INFO', 'Lemmatizing tokens']
['2020-07-28 23', '57', '14,441', 'INFO', 'Lemmatizing tokens']
['2020-07-28 23', '58', '17,679', 'INFO', 'Removing stopwords after lemmatizing']
['2020-07-28 23', '58', '18,474', 'INFO', 'Removing stopwords after lemmatizing']
['2020-07-28 23', '58', '19,477', 'INFO', 'Creating corpus and dictionary']
['2020-07-28 23', '58', '20,319', 'INFO', 'Creating corpus and dictionary']
['2020-07-28 23', '58', '21,379', 'INFO', 'Compiling processed text']
['2020-07-28 23', '58', '21,402', 'INFO', 'Compiling information grid']
['2020-07-28 23', '58', '21,884', 'INFO', 'Creating MLFlow logs']
['2020-07-28 23', '58', '

['2020-07-29 00', '05', '04,695', 'INFO', 'Checking Exceptions']
['2020-07-29 00', '05', '05,175', 'INFO', 'Preloading libraries']
['2020-07-29 00', '05', '05,413', 'INFO', 'Preparing display monitor']
['2020-07-29 00', '05', '05,426', 'INFO', 'Importing libraries']
['2020-07-29 00', '05', '05,426', 'INFO', 'Declaring global variables']
['2020-07-29 00', '05', '05,426', 'INFO', 'Input provided', 'dataframe']
['2020-07-29 00', '05', '05,427', 'INFO', 'session_id set to', '1527']
['2020-07-29 00', '05', '05,427', 'INFO', 'Copying training dataset']
['2020-07-29 00', '05', '05,428', 'INFO', 'Importing stopwords from nltk']
['2020-07-29 00', '05', '05,688', 'INFO', 'Creating corpus and dictionary']
['2020-07-29 00', '05', '05,741', 'INFO', 'No custom stopwords defined']
['2020-07-29 00', '05', '05,742', 'INFO', 'Removing numeric characters from the text']
['2020-07-29 00', '05', '05,799', 'INFO', 'PyCaret NLP Module']
['2020-07-29 00', '05', '05,800', 'INFO', 'version pycaret-nightly-0.39'

['2020-07-29 00', '11', '31,814', 'INFO', 'spacy==2.2.4']
['2020-07-29 00', '11', '32,220', 'INFO', 'gensim==3.8.3']
['2020-07-29 00', '11', '32,611', 'INFO', 'nltk==3.5']
['2020-07-29 00', '11', '32,671', 'INFO', 'textblob==0.15.3']
['2020-07-29 00', '11', '32,821', 'INFO', 'spacy==2.2.4']
['2020-07-29 00', '11', '33,335', 'INFO', 'pyLDAvis==2.1.2']
['2020-07-29 00', '11', '33,458', 'INFO', 'wordcloud==1.7.0']
['2020-07-29 00', '11', '33,600', 'INFO', 'nltk==3.5']
['2020-07-29 00', '11', '33,668', 'INFO', 'textblob==0.15.3']
['2020-07-29 00', '11', '34,128', 'INFO', 'mlflow==1.8.0']
['2020-07-29 00', '11', '34,128', 'INFO', 'Checking Exceptions']
['2020-07-29 00', '11', '34,302', 'INFO', 'pyLDAvis==2.1.2']
['2020-07-29 00', '11', '34,419', 'INFO', 'wordcloud==1.7.0']
['2020-07-29 00', '11', '34,737', 'INFO', 'PyCaret NLP Module']
['2020-07-29 00', '11', '34,737', 'INFO', 'version pycaret-nightly-0.39']
['2020-07-29 00', '11', '34,737', 'INFO', 'Initializing setup()']
['2020-07-29 00',

['2020-07-29 00', '20', '30,524', 'INFO', 'Input provided', 'dataframe']
['2020-07-29 00', '20', '30,524', 'INFO', 'session_id set to', '414']
['2020-07-29 00', '20', '30,524', 'INFO', 'Copying training dataset']
['2020-07-29 00', '20', '30,525', 'INFO', 'Importing stopwords from nltk']
['2020-07-29 00', '20', '30,874', 'INFO', 'No custom stopwords defined']
['2020-07-29 00', '20', '30,875', 'INFO', 'Removing numeric characters from the text']
['2020-07-29 00', '20', '31,227', 'INFO', 'Removing special characters from the text']
['2020-07-29 00', '20', '32,058', 'INFO', 'Extracting Bigrams']
['2020-07-29 00', '20', '32,933', 'INFO', 'Extracting Bigrams']
['2020-07-29 00', '20', '34,051', 'INFO', 'Tokenizing Words']
['2020-07-29 00', '20', '41,157', 'INFO', 'Extracting Trigrams']
['2020-07-29 00', '20', '41,901', 'INFO', 'Removing stopwords']
['2020-07-29 00', '20', '43,866', 'INFO', 'Extracting Trigrams']
['2020-07-29 00', '20', '44,623', 'INFO', 'Extracting Trigrams']
['2020-07-29 00'

['2020-07-29 00', '27', '01,808', 'INFO', 'Removing stopwords']
['2020-07-29 00', '27', '02,011', 'INFO', 'gensim==3.8.3']
['2020-07-29 00', '27', '02,567', 'INFO', 'spacy==2.2.4']
['2020-07-29 00', '27', '03,279', 'INFO', 'nltk==3.5']
['2020-07-29 00', '27', '03,334', 'INFO', 'textblob==0.15.3']
['2020-07-29 00', '27', '03,940', 'INFO', 'pyLDAvis==2.1.2']
['2020-07-29 00', '27', '04,038', 'INFO', 'wordcloud==1.7.0']
['2020-07-29 00', '27', '04,310', 'INFO', 'Extracting Bigrams']
['2020-07-29 00', '27', '04,687', 'INFO', 'mlflow==1.8.0']
['2020-07-29 00', '27', '04,687', 'INFO', 'Checking Exceptions']
['2020-07-29 00', '27', '05,783', 'INFO', 'Extracting Bigrams']
['2020-07-29 00', '27', '06,062', 'INFO', 'Preloading libraries']
['2020-07-29 00', '27', '06,259', 'INFO', 'Preparing display monitor']
['2020-07-29 00', '27', '06,272', 'INFO', 'Importing libraries']
['2020-07-29 00', '27', '06,272', 'INFO', 'Declaring global variables']
['2020-07-29 00', '27', '06,273', 'INFO', 'Input prov

['2020-07-29 00', '41', '56,677', 'INFO', 'Checking libraries']
['2020-07-29 00', '41', '56,677', 'INFO', 'pd==1.0.4']
['2020-07-29 00', '41', '56,677', 'INFO', 'numpy==1.18.5']
['2020-07-29 00', '41', '58,100', 'INFO', 'gensim==3.8.3']
['2020-07-29 00', '41', '58,300', 'INFO', 'Compiling processed text']
['2020-07-29 00', '41', '58,330', 'INFO', 'Compiling information grid']
['2020-07-29 00', '41', '58,748', 'INFO', 'spacy==2.2.4']
['2020-07-29 00', '41', '58,839', 'INFO', 'Creating MLFlow logs']
['2020-07-29 00', '41', '59,363', 'INFO', 'setup() succesfully completed......................................']
['2020-07-29 00', '41', '59,363', 'INFO', 'Initializing create_model()']
['2020-07-29 00', '41', '59,363', 'INFO', 'create_model(model=lda, multi_core=True, num_topics=None, verbose=True, system=True)']
['2020-07-29 00', '41', '59,363', 'INFO', 'Checking exceptions']
['2020-07-29 00', '41', '59,363', 'INFO', 'Preloading libraries']
['2020-07-29 00', '41', '59,363', 'INFO', 'Prepari

['2020-07-29 00', '46', '21,713', 'INFO', 'python_build', "('default', 'May  7 2020 19", '46', "08')"]
['2020-07-29 00', '46', '21,713', 'INFO', 'machine', 'AMD64']
['2020-07-29 00', '46', '21,713', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']
['2020-07-29 00', '46', '21,747', 'INFO', 'Memory', 'svmem(total=17032478720, available=9211715584, percent=45.9, used=7820763136, free=9211715584)']
['2020-07-29 00', '46', '21,748', 'INFO', 'Physical Core', '4']
['2020-07-29 00', '46', '21,748', 'INFO', 'Logical Core', '8']
['2020-07-29 00', '46', '21,748', 'INFO', 'Checking libraries']
['2020-07-29 00', '46', '21,748', 'INFO', 'pd==1.0.4']
['2020-07-29 00', '46', '21,748', 'INFO', 'numpy==1.18.5']
['2020-07-29 00', '46', '23,111', 'INFO', 'gensim==3.8.3']
['2020-07-29 00', '46', '23,764', 'INFO', 'spacy==2.2.4']
['2020-07-29 00', '46', '23,911', 'INFO', 'Compiling processed text']
['2020-07-29 00', '46', '23,935', 'INFO', 'Compiling information grid']
['2020-07-29 00', '46', '24,475', 'INF

['2020-07-29 00', '55', '22,045', 'INFO', 'Removing special characters from the text']
['2020-07-29 00', '55', '22,093', 'INFO', 'Removing special characters from the text']
['2020-07-29 00', '55', '22,583', 'INFO', 'nltk==3.5']
['2020-07-29 00', '55', '22,628', 'INFO', 'textblob==0.15.3']
['2020-07-29 00', '55', '23,207', 'INFO', 'pyLDAvis==2.1.2']
['2020-07-29 00', '55', '23,301', 'INFO', 'wordcloud==1.7.0']
['2020-07-29 00', '55', '23,901', 'INFO', 'mlflow==1.8.0']
['2020-07-29 00', '55', '23,902', 'INFO', 'Checking Exceptions']
['2020-07-29 00', '55', '24,819', 'INFO', 'Tokenizing Words']
['2020-07-29 00', '55', '24,922', 'INFO', 'Tokenizing Words']
['2020-07-29 00', '55', '25,147', 'INFO', 'Extracting Bigrams']
['2020-07-29 00', '55', '25,334', 'INFO', 'Preloading libraries']
['2020-07-29 00', '55', '25,518', 'INFO', 'Preparing display monitor']
['2020-07-29 00', '55', '25,529', 'INFO', 'Importing libraries']
['2020-07-29 00', '55', '25,529', 'INFO', 'Declaring global variables']


['2020-07-29 00', '59', '54,133', 'INFO', 'Tokenizing Words']
['2020-07-29 00', '59', '56,042', 'INFO', 'Removing stopwords']
['2020-07-29 00', '59', '56,320', 'INFO', 'Removing stopwords']
['2020-07-29 00', '59', '59,722', 'INFO', 'Extracting Bigrams']
['2020-07-29 01', '00', '00,251', 'INFO', 'Removing stopwords']
['2020-07-29 01', '00', '00,272', 'INFO', 'Extracting Bigrams']
['2020-07-29 01', '00', '00,636', 'INFO', 'Extracting Trigrams']
['2020-07-29 01', '00', '03,900', 'INFO', 'Extracting Bigrams']
['2020-07-29 01', '00', '10,237', 'INFO', 'Extracting Trigrams']
['2020-07-29 01', '00', '11,038', 'INFO', 'Extracting Trigrams']
['2020-07-29 01', '00', '14,863', 'INFO', 'Extracting Trigrams']
['2020-07-29 01', '00', '20,229', 'INFO', 'Lemmatizing tokens']
['2020-07-29 01', '00', '29,671', 'INFO', 'Lemmatizing tokens']
['2020-07-29 01', '00', '31,270', 'INFO', 'Lemmatizing tokens']
['2020-07-29 01', '00', '34,754', 'INFO', 'Lemmatizing tokens']
['2020-07-29 01', '01', '32,463', 'INF

['2020-07-29 01', '12', '35,880', 'INFO', 'LdaMulticore imported successfully']
['2020-07-29 01', '12', '36,282', 'INFO', 'Removing stopwords after lemmatizing']
['2020-07-29 01', '12', '36,352', 'INFO', 'gensim==3.8.3']
['2020-07-29 01', '12', '36,900', 'INFO', 'Compiling processed text']
['2020-07-29 01', '12', '36,930', 'INFO', 'Compiling information grid']
['2020-07-29 01', '12', '36,986', 'INFO', 'spacy==2.2.4']
['2020-07-29 01', '12', '37,454', 'INFO', 'Creating MLFlow logs']
['2020-07-29 01', '12', '37,750', 'INFO', 'nltk==3.5']
['2020-07-29 01', '12', '37,807', 'INFO', 'textblob==0.15.3']
['2020-07-29 01', '12', '37,946', 'INFO', 'setup() succesfully completed......................................']
['2020-07-29 01', '12', '37,946', 'INFO', 'Initializing create_model()']
['2020-07-29 01', '12', '37,946', 'INFO', 'create_model(model=lda, multi_core=True, num_topics=None, verbose=True, system=True)']
['2020-07-29 01', '12', '37,946', 'INFO', 'Checking exceptions']
['2020-07-29 01

['2020-07-29 01', '17', '05,806', 'INFO', 'PyCaret NLP Module']
['2020-07-29 01', '17', '05,806', 'INFO', 'version pycaret-nightly-0.39']
['2020-07-29 01', '17', '05,806', 'INFO', 'Initializing setup()']
['2020-07-29 01', '17', '05,806', 'INFO', 'USI', 'ac23']
['2020-07-29 01', '17', '05,806', 'INFO', 'setup(data=(6818, 7), target=en, custom_stopwords=None, html=False, session_id=None, log_experiment=True,']
['experiment_name=kiva_exp, log_plots=False, log_data=False, verbose=True)']
['2020-07-29 01', '17', '05,806', 'INFO', 'Checking environment']
['2020-07-29 01', '17', '05,807', 'INFO', 'python_version', '3.6.10']
['2020-07-29 01', '17', '05,807', 'INFO', 'python_build', "('default', 'May  7 2020 19", '46', "08')"]
['2020-07-29 01', '17', '05,807', 'INFO', 'machine', 'AMD64']
['2020-07-29 01', '17', '05,807', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']
['2020-07-29 01', '17', '05,840', 'INFO', 'Memory', 'svmem(total=17032478720, available=9974321152, percent=41.4, used=70581575

['2020-07-29 01', '23', '47,168', 'INFO', 'Declaring global variables']
['2020-07-29 01', '23', '47,169', 'INFO', 'Input provided', 'dataframe']
['2020-07-29 01', '23', '47,169', 'INFO', 'session_id set to', '6666']
['2020-07-29 01', '23', '47,169', 'INFO', 'Copying training dataset']
['2020-07-29 01', '23', '47,170', 'INFO', 'Importing stopwords from nltk']
['2020-07-29 01', '23', '47,500', 'INFO', 'No custom stopwords defined']
['2020-07-29 01', '23', '47,505', 'INFO', 'Removing numeric characters from the text']
['2020-07-29 01', '23', '47,852', 'INFO', 'Removing special characters from the text']
['2020-07-29 01', '23', '48,258', 'INFO', 'Preloading libraries']
['2020-07-29 01', '23', '48,455', 'INFO', 'Preparing display monitor']
['2020-07-29 01', '23', '48,465', 'INFO', 'Importing libraries']
['2020-07-29 01', '23', '48,465', 'INFO', 'Declaring global variables']
['2020-07-29 01', '23', '48,465', 'INFO', 'Input provided', 'dataframe']
['2020-07-29 01', '23', '48,465', 'INFO', 'se

['2020-07-29 01', '32', '23,239', 'INFO', 'Initializing setup()']
['2020-07-29 01', '32', '23,239', 'INFO', 'USI', '205d']
['2020-07-29 01', '32', '23,239', 'INFO', 'setup(data=(6818, 7), target=en, custom_stopwords=None, html=False, session_id=None, log_experiment=True,']
['experiment_name=kiva_exp, log_plots=False, log_data=False, verbose=True)']
['2020-07-29 01', '32', '23,240', 'INFO', 'Checking environment']
['2020-07-29 01', '32', '23,240', 'INFO', 'python_version', '3.6.10']
['2020-07-29 01', '32', '23,240', 'INFO', 'python_build', "('default', 'May  7 2020 19", '46', "08')"]
['2020-07-29 01', '32', '23,240', 'INFO', 'machine', 'AMD64']
['2020-07-29 01', '32', '23,241', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']
['2020-07-29 01', '32', '23,283', 'INFO', 'Memory', 'svmem(total=17032478720, available=9052913664, percent=46.8, used=7979565056, free=9052913664)']
['2020-07-29 01', '32', '23,283', 'INFO', 'Physical Core', '4']
['2020-07-29 01', '32', '23,284', 'INFO', 'Logical 

['2020-07-29 01', '39', '04,797', 'INFO', 'num_topics set to', '4']
['2020-07-29 01', '39', '04,797', 'INFO', 'LDA multi_core enabled']
['2020-07-29 01', '39', '04,797', 'INFO', 'LdaMulticore imported successfully']
['2020-07-29 01', '39', '04,824', 'INFO', 'Creating MLFlow logs']
['2020-07-29 01', '39', '05,324', 'INFO', 'setup() succesfully completed......................................']
['2020-07-29 01', '39', '05,324', 'INFO', 'Initializing create_model()']
['2020-07-29 01', '39', '05,325', 'INFO', 'create_model(model=lda, multi_core=True, num_topics=None, verbose=True, system=True)']
['2020-07-29 01', '39', '05,325', 'INFO', 'Checking exceptions']
['2020-07-29 01', '39', '05,325', 'INFO', 'Preloading libraries']
['2020-07-29 01', '39', '05,325', 'INFO', 'Preparing display monitor']
['2020-07-29 01', '39', '05,334', 'INFO', 'Defining topic model']
['2020-07-29 01', '39', '05,335', 'INFO', 'Model', 'Latent Dirichlet Allocation']
['2020-07-29 01', '39', '05,335', 'INFO', 'Defining 

['2020-07-29 01', '50', '03,870', 'INFO', 'num_topics set to', '4']
['2020-07-29 01', '50', '03,871', 'INFO', 'LDA multi_core enabled']
['2020-07-29 01', '50', '03,871', 'INFO', 'LdaMulticore imported successfully']
['2020-07-29 01', '50', '04,377', 'INFO', 'pyLDAvis==2.1.2']
['2020-07-29 01', '50', '04,515', 'INFO', 'wordcloud==1.7.0']
['2020-07-29 01', '50', '04,586', 'INFO', 'Removing stopwords']
['2020-07-29 01', '50', '05,187', 'INFO', 'mlflow==1.8.0']
['2020-07-29 01', '50', '05,188', 'INFO', 'Checking Exceptions']
['2020-07-29 01', '50', '06,660', 'INFO', 'Preloading libraries']
['2020-07-29 01', '50', '06,879', 'INFO', 'Preparing display monitor']
['2020-07-29 01', '50', '06,895', 'INFO', 'Importing libraries']
['2020-07-29 01', '50', '06,895', 'INFO', 'Declaring global variables']
['2020-07-29 01', '50', '06,896', 'INFO', 'Input provided', 'dataframe']
['2020-07-29 01', '50', '06,896', 'INFO', 'session_id set to', '3576']
['2020-07-29 01', '50', '06,896', 'INFO', 'Copying trai

['2020-07-29 01', '54', '26,257', 'INFO', 'No custom stopwords defined']
['2020-07-29 01', '54', '26,257', 'INFO', 'Removing numeric characters from the text']
['2020-07-29 01', '54', '26,302', 'INFO', 'Creating corpus and dictionary']
['2020-07-29 01', '54', '26,674', 'INFO', 'Removing special characters from the text']
['2020-07-29 01', '54', '27,127', 'INFO', 'Compiling processed text']
['2020-07-29 01', '54', '27,151', 'INFO', 'Compiling information grid']
['2020-07-29 01', '54', '27,620', 'INFO', 'Creating MLFlow logs']
['2020-07-29 01', '54', '28,066', 'INFO', 'setup() succesfully completed......................................']
['2020-07-29 01', '54', '28,067', 'INFO', 'Initializing create_model()']
['2020-07-29 01', '54', '28,067', 'INFO', 'create_model(model=lda, multi_core=True, num_topics=None, verbose=True, system=True)']
['2020-07-29 01', '54', '28,067', 'INFO', 'Checking exceptions']
['2020-07-29 01', '54', '28,067', 'INFO', 'Preloading libraries']
['2020-07-29 01', '54'

['2020-07-29 02', '00', '58,066', 'INFO', 'Importing stopwords from nltk']
['2020-07-29 02', '00', '58,347', 'INFO', 'No custom stopwords defined']
['2020-07-29 02', '00', '58,348', 'INFO', 'Removing numeric characters from the text']
['2020-07-29 02', '00', '58,447', 'INFO', 'Creating MLFlow logs']
['2020-07-29 02', '00', '58,697', 'INFO', 'Removing special characters from the text']
['2020-07-29 02', '00', '58,833', 'INFO', 'Removing stopwords']
['2020-07-29 02', '00', '58,914', 'INFO', 'setup() succesfully completed......................................']
['2020-07-29 02', '00', '58,914', 'INFO', 'Initializing create_model()']
['2020-07-29 02', '00', '58,914', 'INFO', 'create_model(model=lda, multi_core=True, num_topics=None, verbose=True, system=True)']
['2020-07-29 02', '00', '58,915', 'INFO', 'Checking exceptions']
['2020-07-29 02', '00', '58,915', 'INFO', 'Preloading libraries']
['2020-07-29 02', '00', '58,915', 'INFO', 'Preparing display monitor']
['2020-07-29 02', '00', '58,92

['2020-07-29 02', '09', '31,823', 'INFO', 'pyLDAvis==2.1.2']
['2020-07-29 02', '09', '31,827', 'INFO', 'Removing stopwords after lemmatizing']
['2020-07-29 02', '09', '31,955', 'INFO', 'wordcloud==1.7.0']
['2020-07-29 02', '09', '32,634', 'INFO', 'mlflow==1.8.0']
['2020-07-29 02', '09', '32,634', 'INFO', 'Checking Exceptions']
['2020-07-29 02', '09', '33,920', 'INFO', 'Preloading libraries']
['2020-07-29 02', '09', '34,066', 'INFO', 'Creating corpus and dictionary']
['2020-07-29 02', '09', '34,129', 'INFO', 'Preparing display monitor']
['2020-07-29 02', '09', '34,138', 'INFO', 'Importing libraries']
['2020-07-29 02', '09', '34,138', 'INFO', 'Declaring global variables']
['2020-07-29 02', '09', '34,139', 'INFO', 'Input provided', 'dataframe']
['2020-07-29 02', '09', '34,139', 'INFO', 'session_id set to', '4825']
['2020-07-29 02', '09', '34,139', 'INFO', 'Copying training dataset']
['2020-07-29 02', '09', '34,140', 'INFO', 'Importing stopwords from nltk']
['2020-07-29 02', '09', '34,464'

['2020-07-29 02', '16', '18,356', 'INFO', 'gensim==3.8.3']
['2020-07-29 02', '16', '18,913', 'INFO', 'PyCaret NLP Module']
['2020-07-29 02', '16', '18,914', 'INFO', 'version pycaret-nightly-0.39']
['2020-07-29 02', '16', '18,914', 'INFO', 'Initializing setup()']
['2020-07-29 02', '16', '18,914', 'INFO', 'USI', '38de']
['2020-07-29 02', '16', '18,914', 'INFO', 'setup(data=(6818, 7), target=en, custom_stopwords=None, html=False, session_id=None, log_experiment=True,']
['experiment_name=kiva_exp, log_plots=False, log_data=False, verbose=True)']
['2020-07-29 02', '16', '18,914', 'INFO', 'Checking environment']
['2020-07-29 02', '16', '18,914', 'INFO', 'python_version', '3.6.10']
['2020-07-29 02', '16', '18,914', 'INFO', 'python_build', "('default', 'May  7 2020 19", '46', "08')"]
['2020-07-29 02', '16', '18,914', 'INFO', 'machine', 'AMD64']
['2020-07-29 02', '16', '18,915', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']
['2020-07-29 02', '16', '18,954', 'INFO', 'Memory', 'svmem(total=170

['2020-07-29 02', '22', '19,762', 'INFO', 'Compiling processed text']
['2020-07-29 02', '22', '19,795', 'INFO', 'Compiling information grid']
['2020-07-29 02', '22', '20,270', 'INFO', 'Creating MLFlow logs']
['2020-07-29 02', '22', '21,106', 'INFO', 'setup() succesfully completed......................................']
['2020-07-29 02', '22', '21,106', 'INFO', 'Initializing create_model()']
['2020-07-29 02', '22', '21,106', 'INFO', 'create_model(model=lda, multi_core=True, num_topics=None, verbose=True, system=True)']
['2020-07-29 02', '22', '21,106', 'INFO', 'Checking exceptions']
['2020-07-29 02', '22', '21,107', 'INFO', 'Preloading libraries']
['2020-07-29 02', '22', '21,107', 'INFO', 'Preparing display monitor']
['2020-07-29 02', '22', '21,122', 'INFO', 'Defining topic model']
['2020-07-29 02', '22', '21,122', 'INFO', 'Model', 'Latent Dirichlet Allocation']
['2020-07-29 02', '22', '21,122', 'INFO', 'Defining num_topics parameter']
['2020-07-29 02', '22', '21,122', 'INFO', 'num_topi

['2020-07-29 02', '29', '30,340', 'INFO', 'Checking Exceptions']
['2020-07-29 02', '29', '31,631', 'INFO', 'Preloading libraries']
['2020-07-29 02', '29', '31,826', 'INFO', 'Preparing display monitor']
['2020-07-29 02', '29', '31,837', 'INFO', 'Importing libraries']
['2020-07-29 02', '29', '31,837', 'INFO', 'Declaring global variables']
['2020-07-29 02', '29', '31,838', 'INFO', 'Input provided', 'dataframe']
['2020-07-29 02', '29', '31,838', 'INFO', 'session_id set to', '2432']
['2020-07-29 02', '29', '31,838', 'INFO', 'Copying training dataset']
['2020-07-29 02', '29', '31,839', 'INFO', 'Importing stopwords from nltk']
['2020-07-29 02', '29', '31,951', 'INFO', 'Tokenizing Words']
['2020-07-29 02', '29', '32,135', 'INFO', 'No custom stopwords defined']
['2020-07-29 02', '29', '32,135', 'INFO', 'Removing numeric characters from the text']
['2020-07-29 02', '29', '32,354', 'INFO', 'Tokenizing Words']
['2020-07-29 02', '29', '32,452', 'INFO', 'Removing special characters from the text']
[

['2020-07-29 02', '35', '58,575', 'INFO', 'Checking libraries']
['2020-07-29 02', '35', '58,576', 'INFO', 'pd==1.0.4']
['2020-07-29 02', '35', '58,576', 'INFO', 'numpy==1.18.5']
['2020-07-29 02', '35', '58,928', 'INFO', 'pyLDAvis==2.1.2']
['2020-07-29 02', '35', '59,035', 'INFO', 'wordcloud==1.7.0']
['2020-07-29 02', '35', '59,712', 'INFO', 'mlflow==1.8.0']
['2020-07-29 02', '35', '59,712', 'INFO', 'Checking Exceptions']
['2020-07-29 02', '35', '59,859', 'INFO', 'Preloading libraries']
['2020-07-29 02', '35', '59,886', 'INFO', 'gensim==3.8.3']
['2020-07-29 02', '36', '00,087', 'INFO', 'Preparing display monitor']
['2020-07-29 02', '36', '00,100', 'INFO', 'Importing libraries']
['2020-07-29 02', '36', '00,100', 'INFO', 'Declaring global variables']
['2020-07-29 02', '36', '00,100', 'INFO', 'Input provided', 'dataframe']
['2020-07-29 02', '36', '00,101', 'INFO', 'session_id set to', '5642']
['2020-07-29 02', '36', '00,101', 'INFO', 'Copying training dataset']
['2020-07-29 02', '36', '00,

['2020-07-29 02', '42', '30,675', 'INFO', 'num_topics set to', '4']
['2020-07-29 02', '42', '30,675', 'INFO', 'LDA multi_core enabled']
['2020-07-29 02', '42', '30,676', 'INFO', 'LdaMulticore imported successfully']
['2020-07-29 02', '42', '30,823', 'INFO', 'spacy==2.2.4']
['2020-07-29 02', '42', '31,279', 'INFO', 'mlflow==1.8.0']
['2020-07-29 02', '42', '31,279', 'INFO', 'Checking Exceptions']
['2020-07-29 02', '42', '31,604', 'INFO', 'nltk==3.5']
['2020-07-29 02', '42', '31,658', 'INFO', 'textblob==0.15.3']
['2020-07-29 02', '42', '32,277', 'INFO', 'pyLDAvis==2.1.2']
['2020-07-29 02', '42', '32,393', 'INFO', 'wordcloud==1.7.0']
['2020-07-29 02', '42', '32,723', 'INFO', 'Preloading libraries']
['2020-07-29 02', '42', '32,930', 'INFO', 'Preparing display monitor']
['2020-07-29 02', '42', '32,944', 'INFO', 'Importing libraries']
['2020-07-29 02', '42', '32,944', 'INFO', 'Declaring global variables']
['2020-07-29 02', '42', '32,944', 'INFO', 'Input provided', 'dataframe']
['2020-07-29 02

['2020-07-29 02', '49', '14,249', 'INFO', 'version pycaret-nightly-0.39']
['2020-07-29 02', '49', '14,249', 'INFO', 'Initializing setup()']
['2020-07-29 02', '49', '14,249', 'INFO', 'USI', 'b4ce']
['2020-07-29 02', '49', '14,249', 'INFO', 'setup(data=(6818, 7), target=en, custom_stopwords=None, html=False, session_id=None, log_experiment=True,']
['experiment_name=kiva_exp, log_plots=False, log_data=False, verbose=True)']
['2020-07-29 02', '49', '14,250', 'INFO', 'Checking environment']
['2020-07-29 02', '49', '14,250', 'INFO', 'python_version', '3.6.10']
['2020-07-29 02', '49', '14,250', 'INFO', 'python_build', "('default', 'May  7 2020 19", '46', "08')"]
['2020-07-29 02', '49', '14,250', 'INFO', 'machine', 'AMD64']
['2020-07-29 02', '49', '14,250', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']
['2020-07-29 02', '49', '14,293', 'INFO', 'Memory', 'svmem(total=17032478720, available=9381060608, percent=44.9, used=7651418112, free=9381060608)']
['2020-07-29 02', '49', '14,293', 'INFO',

['2020-07-29 02', '57', '36,156', 'INFO', 'USI', '69b5']
['2020-07-29 02', '57', '36,156', 'INFO', 'setup(data=(6818, 7), target=en, custom_stopwords=None, html=False, session_id=None, log_experiment=True,']
['experiment_name=kiva_exp, log_plots=False, log_data=False, verbose=True)']
['2020-07-29 02', '57', '36,156', 'INFO', 'Checking environment']
['2020-07-29 02', '57', '36,156', 'INFO', 'python_version', '3.6.10']
['2020-07-29 02', '57', '36,156', 'INFO', 'python_build', "('default', 'May  7 2020 19", '46', "08')"]
['2020-07-29 02', '57', '36,157', 'INFO', 'machine', 'AMD64']
['2020-07-29 02', '57', '36,157', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']
['2020-07-29 02', '57', '36,200', 'INFO', 'Memory', 'svmem(total=17032478720, available=8849444864, percent=48.0, used=8183033856, free=8849444864)']
['2020-07-29 02', '57', '36,200', 'INFO', 'Physical Core', '4']
['2020-07-29 02', '57', '36,200', 'INFO', 'Logical Core', '8']
['2020-07-29 02', '57', '36,200', 'INFO', 'Checking li

['2020-07-29 03', '04', '21,956', 'INFO', 'Removing numeric characters from the text']
['2020-07-29 03', '04', '22,222', 'INFO', 'No custom stopwords defined']
['2020-07-29 03', '04', '22,222', 'INFO', 'Removing numeric characters from the text']
['2020-07-29 03', '04', '22,327', 'INFO', 'Removing special characters from the text']
['2020-07-29 03', '04', '22,389', 'INFO', 'setup() succesfully completed......................................']
['2020-07-29 03', '04', '22,389', 'INFO', 'Initializing create_model()']
['2020-07-29 03', '04', '22,389', 'INFO', 'create_model(model=lda, multi_core=True, num_topics=None, verbose=True, system=True)']
['2020-07-29 03', '04', '22,390', 'INFO', 'Checking exceptions']
['2020-07-29 03', '04', '22,390', 'INFO', 'Preloading libraries']
['2020-07-29 03', '04', '22,390', 'INFO', 'Preparing display monitor']
['2020-07-29 03', '04', '22,396', 'INFO', 'Defining topic model']
['2020-07-29 03', '04', '22,396', 'INFO', 'Model', 'Latent Dirichlet Allocation']


['2020-07-29 03', '12', '57,162', 'INFO', 'mlflow==1.8.0']
['2020-07-29 03', '12', '57,162', 'INFO', 'Checking Exceptions']
['2020-07-29 03', '12', '57,165', 'INFO', 'Removing special characters from the text']
['2020-07-29 03', '12', '58,499', 'INFO', 'Preloading libraries']
['2020-07-29 03', '12', '58,718', 'INFO', 'Preparing display monitor']
['2020-07-29 03', '12', '58,729', 'INFO', 'Importing libraries']
['2020-07-29 03', '12', '58,729', 'INFO', 'Declaring global variables']
['2020-07-29 03', '12', '58,729', 'INFO', 'Input provided', 'dataframe']
['2020-07-29 03', '12', '58,729', 'INFO', 'session_id set to', '3717']
['2020-07-29 03', '12', '58,729', 'INFO', 'Copying training dataset']
['2020-07-29 03', '12', '58,730', 'INFO', 'Importing stopwords from nltk']
['2020-07-29 03', '12', '59,032', 'INFO', 'No custom stopwords defined']
['2020-07-29 03', '12', '59,033', 'INFO', 'Removing numeric characters from the text']
['2020-07-29 03', '12', '59,368', 'INFO', 'Removing special charac

['2020-07-29 03', '23', '39,145', 'INFO', 'Removing stopwords after lemmatizing']
['2020-07-29 03', '23', '39,839', 'INFO', 'Creating corpus and dictionary']
['2020-07-29 03', '23', '41,210', 'INFO', 'Creating corpus and dictionary']
['2020-07-29 03', '23', '41,624', 'INFO', 'Compiling processed text']
['2020-07-29 03', '23', '41,644', 'INFO', 'Compiling information grid']
['2020-07-29 03', '23', '42,186', 'INFO', 'Creating MLFlow logs']
['2020-07-29 03', '23', '42,753', 'INFO', 'setup() succesfully completed......................................']
['2020-07-29 03', '23', '42,753', 'INFO', 'Initializing create_model()']
['2020-07-29 03', '23', '42,753', 'INFO', 'create_model(model=lda, multi_core=True, num_topics=None, verbose=True, system=True)']
['2020-07-29 03', '23', '42,753', 'INFO', 'Checking exceptions']
['2020-07-29 03', '23', '42,753', 'INFO', 'Preloading libraries']
['2020-07-29 03', '23', '42,753', 'INFO', 'Preparing display monitor']
['2020-07-29 03', '23', '42,761', 'INFO'

['2020-07-29 03', '28', '25,423', 'INFO', 'Preparing display monitor']
['2020-07-29 03', '28', '25,432', 'INFO', 'Defining topic model']
['2020-07-29 03', '28', '25,432', 'INFO', 'Model', 'Latent Dirichlet Allocation']
['2020-07-29 03', '28', '25,432', 'INFO', 'Defining num_topics parameter']
['2020-07-29 03', '28', '25,432', 'INFO', 'num_topics set to', '4']
['2020-07-29 03', '28', '25,432', 'INFO', 'LDA multi_core enabled']
['2020-07-29 03', '28', '25,433', 'INFO', 'LdaMulticore imported successfully']
['2020-07-29 03', '28', '25,958', 'INFO', 'Extracting Bigrams']
['2020-07-29 03', '28', '26,267', 'INFO', 'Removing stopwords']
['2020-07-29 03', '28', '30,063', 'INFO', 'PyCaret NLP Module']
['2020-07-29 03', '28', '30,063', 'INFO', 'version pycaret-nightly-0.39']
['2020-07-29 03', '28', '30,064', 'INFO', 'Initializing setup()']
['2020-07-29 03', '28', '30,064', 'INFO', 'USI', '704e']
['2020-07-29 03', '28', '30,064', 'INFO', 'setup(data=(6818, 7), target=en, custom_stopwords=None, ht

['2020-07-29 03', '36', '45,737', 'INFO', 'Compiling information grid']
['2020-07-29 03', '36', '46,270', 'INFO', 'Creating MLFlow logs']
['2020-07-29 03', '36', '46,481', 'INFO', 'Compiling processed text']
['2020-07-29 03', '36', '46,517', 'INFO', 'Compiling information grid']
['2020-07-29 03', '36', '46,848', 'INFO', 'setup() succesfully completed......................................']
['2020-07-29 03', '36', '46,848', 'INFO', 'Initializing create_model()']
['2020-07-29 03', '36', '46,848', 'INFO', 'create_model(model=lda, multi_core=True, num_topics=None, verbose=True, system=True)']
['2020-07-29 03', '36', '46,848', 'INFO', 'Checking exceptions']
['2020-07-29 03', '36', '46,849', 'INFO', 'Preloading libraries']
['2020-07-29 03', '36', '46,849', 'INFO', 'Preparing display monitor']
['2020-07-29 03', '36', '46,857', 'INFO', 'Defining topic model']
['2020-07-29 03', '36', '46,857', 'INFO', 'Model', 'Latent Dirichlet Allocation']
['2020-07-29 03', '36', '46,857', 'INFO', 'Defining nu

['2020-07-29 03', '43', '34,634', 'INFO', 'Removing stopwords after lemmatizing']
['2020-07-29 03', '43', '34,903', 'INFO', 'Tokenizing Words']
['2020-07-29 03', '43', '36,651', 'INFO', 'Creating corpus and dictionary']
['2020-07-29 03', '43', '37,300', 'INFO', 'Removing stopwords']
['2020-07-29 03', '43', '38,728', 'INFO', 'Compiling processed text']
['2020-07-29 03', '43', '38,747', 'INFO', 'Compiling information grid']
['2020-07-29 03', '43', '39,081', 'INFO', 'Removing stopwords']
['2020-07-29 03', '43', '39,201', 'INFO', 'Creating MLFlow logs']
['2020-07-29 03', '43', '39,702', 'INFO', 'setup() succesfully completed......................................']
['2020-07-29 03', '43', '39,703', 'INFO', 'Initializing create_model()']
['2020-07-29 03', '43', '39,703', 'INFO', 'create_model(model=lda, multi_core=True, num_topics=None, verbose=True, system=True)']
['2020-07-29 03', '43', '39,703', 'INFO', 'Checking exceptions']
['2020-07-29 03', '43', '39,703', 'INFO', 'Preloading libraries

['2020-07-29 03', '54', '24,257', 'INFO', 'LDA multi_core enabled']
['2020-07-29 03', '54', '24,257', 'INFO', 'LdaMulticore imported successfully']
['2020-07-29 03', '54', '24,399', 'INFO', 'Compiling processed text']
['2020-07-29 03', '54', '24,437', 'INFO', 'Compiling information grid']
['2020-07-29 03', '54', '25,018', 'INFO', 'Creating MLFlow logs']
['2020-07-29 03', '54', '25,589', 'INFO', 'setup() succesfully completed......................................']
['2020-07-29 03', '54', '25,589', 'INFO', 'Initializing create_model()']
['2020-07-29 03', '54', '25,590', 'INFO', 'create_model(model=lda, multi_core=True, num_topics=None, verbose=True, system=True)']
['2020-07-29 03', '54', '25,590', 'INFO', 'Checking exceptions']
['2020-07-29 03', '54', '25,590', 'INFO', 'Preloading libraries']
['2020-07-29 03', '54', '25,590', 'INFO', 'Preparing display monitor']
['2020-07-29 03', '54', '25,606', 'INFO', 'Defining topic model']
['2020-07-29 03', '54', '25,606', 'INFO', 'Model', 'Latent D

['2020-07-29 04', '01', '13,089', 'INFO', 'Creating MLFlow logs']
['2020-07-29 04', '01', '13,664', 'INFO', 'setup() succesfully completed......................................']
['2020-07-29 04', '01', '13,664', 'INFO', 'Initializing create_model()']
['2020-07-29 04', '01', '13,664', 'INFO', 'create_model(model=lda, multi_core=True, num_topics=None, verbose=True, system=True)']
['2020-07-29 04', '01', '13,665', 'INFO', 'Checking exceptions']
['2020-07-29 04', '01', '13,665', 'INFO', 'Preloading libraries']
['2020-07-29 04', '01', '13,665', 'INFO', 'Preparing display monitor']
['2020-07-29 04', '01', '13,675', 'INFO', 'Defining topic model']
['2020-07-29 04', '01', '13,675', 'INFO', 'Model', 'Latent Dirichlet Allocation']
['2020-07-29 04', '01', '13,676', 'INFO', 'Defining num_topics parameter']
['2020-07-29 04', '01', '13,676', 'INFO', 'num_topics set to', '4']
['2020-07-29 04', '01', '13,676', 'INFO', 'LDA multi_core enabled']
['2020-07-29 04', '01', '13,676', 'INFO', 'LdaMulticore i

['2020-07-29 04', '10', '04,383', 'INFO', 'Preloading libraries']
['2020-07-29 04', '10', '04,582', 'INFO', 'Preparing display monitor']
['2020-07-29 04', '10', '04,596', 'INFO', 'Importing libraries']
['2020-07-29 04', '10', '04,596', 'INFO', 'Declaring global variables']
['2020-07-29 04', '10', '04,596', 'INFO', 'Input provided', 'dataframe']
['2020-07-29 04', '10', '04,596', 'INFO', 'session_id set to', '1205']
['2020-07-29 04', '10', '04,597', 'INFO', 'Copying training dataset']
['2020-07-29 04', '10', '04,597', 'INFO', 'Importing stopwords from nltk']
['2020-07-29 04', '10', '04,967', 'INFO', 'No custom stopwords defined']
['2020-07-29 04', '10', '04,967', 'INFO', 'Removing numeric characters from the text']
['2020-07-29 04', '10', '05,290', 'INFO', 'Removing special characters from the text']
['2020-07-29 04', '10', '07,815', 'INFO', 'Tokenizing Words']
['2020-07-29 04', '10', '07,946', 'INFO', 'Extracting Bigrams']
['2020-07-29 04', '10', '12,855', 'INFO', 'Extracting Trigrams']

['2020-07-29 04', '18', '22,359', 'INFO', 'Preloading libraries']
['2020-07-29 04', '18', '22,359', 'INFO', 'Preparing display monitor']
['2020-07-29 04', '18', '22,367', 'INFO', 'Defining topic model']
['2020-07-29 04', '18', '22,368', 'INFO', 'Model', 'Latent Dirichlet Allocation']
['2020-07-29 04', '18', '22,368', 'INFO', 'Defining num_topics parameter']
['2020-07-29 04', '18', '22,368', 'INFO', 'num_topics set to', '4']
['2020-07-29 04', '18', '22,368', 'INFO', 'LDA multi_core enabled']
['2020-07-29 04', '18', '22,368', 'INFO', 'LdaMulticore imported successfully']
['2020-07-29 04', '18', '24,192', 'INFO', 'Compiling processed text']
['2020-07-29 04', '18', '24,216', 'INFO', 'Compiling information grid']
['2020-07-29 04', '18', '24,635', 'INFO', 'Creating MLFlow logs']
['2020-07-29 04', '18', '24,846', 'INFO', 'PyCaret NLP Module']
['2020-07-29 04', '18', '24,846', 'INFO', 'version pycaret-nightly-0.39']
['2020-07-29 04', '18', '24,846', 'INFO', 'Initializing setup()']
['2020-07-29

['2020-07-29 04', '25', '09,648', 'INFO', 'Initializing setup()']
['2020-07-29 04', '25', '09,648', 'INFO', 'USI', '9a98']
['2020-07-29 04', '25', '09,648', 'INFO', 'setup(data=(6818, 7), target=en, custom_stopwords=None, html=False, session_id=None, log_experiment=True,']
['experiment_name=kiva_exp, log_plots=False, log_data=False, verbose=True)']
['2020-07-29 04', '25', '09,648', 'INFO', 'Checking environment']
['2020-07-29 04', '25', '09,649', 'INFO', 'python_version', '3.6.10']
['2020-07-29 04', '25', '09,649', 'INFO', 'python_build', "('default', 'May  7 2020 19", '46', "08')"]
['2020-07-29 04', '25', '09,649', 'INFO', 'machine', 'AMD64']
['2020-07-29 04', '25', '09,649', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']
['2020-07-29 04', '25', '09,685', 'INFO', 'Memory', 'svmem(total=17032478720, available=9547177984, percent=43.9, used=7485300736, free=9547177984)']
['2020-07-29 04', '25', '09,685', 'INFO', 'Physical Core', '4']
['2020-07-29 04', '25', '09,686', 'INFO', 'Logical 

['2020-07-29 04', '31', '43,171', 'INFO', 'Importing stopwords from nltk']
['2020-07-29 04', '31', '43,459', 'INFO', 'Tokenizing Words']
['2020-07-29 04', '31', '43,504', 'INFO', 'mlflow==1.8.0']
['2020-07-29 04', '31', '43,505', 'INFO', 'Checking Exceptions']
['2020-07-29 04', '31', '43,530', 'INFO', 'No custom stopwords defined']
['2020-07-29 04', '31', '43,530', 'INFO', 'Removing numeric characters from the text']
['2020-07-29 04', '31', '43,818', 'INFO', 'Removing special characters from the text']
['2020-07-29 04', '31', '44,743', 'INFO', 'Preloading libraries']
['2020-07-29 04', '31', '44,924', 'INFO', 'Preparing display monitor']
['2020-07-29 04', '31', '44,938', 'INFO', 'Importing libraries']
['2020-07-29 04', '31', '44,939', 'INFO', 'Declaring global variables']
['2020-07-29 04', '31', '44,939', 'INFO', 'Input provided', 'dataframe']
['2020-07-29 04', '31', '44,939', 'INFO', 'session_id set to', '1418']
['2020-07-29 04', '31', '44,939', 'INFO', 'Copying training dataset']
['20

['2020-07-29 04', '40', '12,813', 'INFO', 'Memory', 'svmem(total=17032478720, available=8788828160, percent=48.4, used=8243650560, free=8788828160)']
['2020-07-29 04', '40', '12,813', 'INFO', 'Physical Core', '4']
['2020-07-29 04', '40', '12,813', 'INFO', 'Logical Core', '8']
['2020-07-29 04', '40', '12,813', 'INFO', 'Checking libraries']
['2020-07-29 04', '40', '12,813', 'INFO', 'pd==1.0.4']
['2020-07-29 04', '40', '12,813', 'INFO', 'numpy==1.18.5']
['2020-07-29 04', '40', '13,317', 'INFO', 'Compiling processed text']
['2020-07-29 04', '40', '13,339', 'INFO', 'Compiling information grid']
['2020-07-29 04', '40', '13,822', 'INFO', 'Creating MLFlow logs']
['2020-07-29 04', '40', '13,849', 'INFO', 'Creating corpus and dictionary']
['2020-07-29 04', '40', '14,039', 'INFO', 'Creating corpus and dictionary']
['2020-07-29 04', '40', '14,111', 'INFO', 'gensim==3.8.3']
['2020-07-29 04', '40', '14,356', 'INFO', 'setup() succesfully completed......................................']
['2020-07-29 

['2020-07-29 04', '48', '55,663', 'INFO', 'Checking exceptions']
['2020-07-29 04', '48', '55,663', 'INFO', 'Preloading libraries']
['2020-07-29 04', '48', '55,663', 'INFO', 'Preparing display monitor']
['2020-07-29 04', '48', '55,674', 'INFO', 'Defining topic model']
['2020-07-29 04', '48', '55,675', 'INFO', 'Model', 'Latent Dirichlet Allocation']
['2020-07-29 04', '48', '55,675', 'INFO', 'Defining num_topics parameter']
['2020-07-29 04', '48', '55,675', 'INFO', 'num_topics set to', '4']
['2020-07-29 04', '48', '55,675', 'INFO', 'LDA multi_core enabled']
['2020-07-29 04', '48', '55,676', 'INFO', 'LdaMulticore imported successfully']
['2020-07-29 04', '48', '56,328', 'INFO', 'Creating corpus and dictionary']
['2020-07-29 04', '48', '56,443', 'INFO', 'Creating corpus and dictionary']
['2020-07-29 04', '48', '56,620', 'INFO', 'Preloading libraries']
['2020-07-29 04', '48', '56,829', 'INFO', 'Preparing display monitor']
['2020-07-29 04', '48', '56,844', 'INFO', 'Importing libraries']
['202

['2020-07-29 04', '57', '42,413', 'INFO', 'spacy==2.2.4']
['2020-07-29 04', '57', '43,167', 'INFO', 'gensim==3.8.3']
['2020-07-29 04', '57', '43,209', 'INFO', 'nltk==3.5']
['2020-07-29 04', '57', '43,258', 'INFO', 'textblob==0.15.3']
['2020-07-29 04', '57', '43,764', 'INFO', 'spacy==2.2.4']
['2020-07-29 04', '57', '43,898', 'INFO', 'pyLDAvis==2.1.2']
['2020-07-29 04', '57', '44,008', 'INFO', 'wordcloud==1.7.0']
['2020-07-29 04', '57', '44,465', 'INFO', 'nltk==3.5']
['2020-07-29 04', '57', '44,510', 'INFO', 'textblob==0.15.3']
['2020-07-29 04', '57', '44,658', 'INFO', 'mlflow==1.8.0']
['2020-07-29 04', '57', '44,658', 'INFO', 'Checking Exceptions']
['2020-07-29 04', '57', '45,061', 'INFO', 'pyLDAvis==2.1.2']
['2020-07-29 04', '57', '45,077', 'INFO', 'PyCaret NLP Module']
['2020-07-29 04', '57', '45,077', 'INFO', 'version pycaret-nightly-0.39']
['2020-07-29 04', '57', '45,077', 'INFO', 'Initializing setup()']
['2020-07-29 04', '57', '45,078', 'INFO', 'USI', '01c2']
['2020-07-29 04', '57'

['2020-07-29 05', '02', '08,391', 'INFO', 'Input provided', 'dataframe']
['2020-07-29 05', '02', '08,391', 'INFO', 'session_id set to', '6510']
['2020-07-29 05', '02', '08,391', 'INFO', 'Copying training dataset']
['2020-07-29 05', '02', '08,392', 'INFO', 'Importing stopwords from nltk']
['2020-07-29 05', '02', '08,733', 'INFO', 'No custom stopwords defined']
['2020-07-29 05', '02', '08,733', 'INFO', 'Removing numeric characters from the text']
['2020-07-29 05', '02', '08,897', 'INFO', 'Removing stopwords']
['2020-07-29 05', '02', '08,975', 'INFO', 'mlflow==1.8.0']
['2020-07-29 05', '02', '08,975', 'INFO', 'Checking Exceptions']
['2020-07-29 05', '02', '09,128', 'INFO', 'Removing special characters from the text']
['2020-07-29 05', '02', '10,295', 'INFO', 'Preloading libraries']
['2020-07-29 05', '02', '10,481', 'INFO', 'Preparing display monitor']
['2020-07-29 05', '02', '10,490', 'INFO', 'Importing libraries']
['2020-07-29 05', '02', '10,490', 'INFO', 'Declaring global variables']
['

['2020-07-29 05', '08', '38,813', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']
['2020-07-29 05', '08', '38,844', 'INFO', 'Memory', 'svmem(total=17032478720, available=9211105280, percent=45.9, used=7821373440, free=9211105280)']
['2020-07-29 05', '08', '38,844', 'INFO', 'Physical Core', '4']
['2020-07-29 05', '08', '38,844', 'INFO', 'Logical Core', '8']
['2020-07-29 05', '08', '38,844', 'INFO', 'Checking libraries']
['2020-07-29 05', '08', '38,844', 'INFO', 'pd==1.0.4']
['2020-07-29 05', '08', '38,844', 'INFO', 'numpy==1.18.5']
['2020-07-29 05', '08', '39,695', 'INFO', 'Creating corpus and dictionary']
['2020-07-29 05', '08', '40,122', 'INFO', 'gensim==3.8.3']
['2020-07-29 05', '08', '40,150', 'INFO', 'Tokenizing Words']
['2020-07-29 05', '08', '40,738', 'INFO', 'spacy==2.2.4']
['2020-07-29 05', '08', '41,554', 'INFO', 'nltk==3.5']
['2020-07-29 05', '08', '41,613', 'INFO', 'textblob==0.15.3']
['2020-07-29 05', '08', '41,681', 'INFO', 'Compiling processed text']
['2020-07-29 05', '0

['2020-07-29 05', '17', '16,538', 'INFO', 'Checking Exceptions']
['2020-07-29 05', '17', '17,817', 'INFO', 'Preloading libraries']
['2020-07-29 05', '17', '18,039', 'INFO', 'Preparing display monitor']
['2020-07-29 05', '17', '18,052', 'INFO', 'Importing libraries']
['2020-07-29 05', '17', '18,052', 'INFO', 'Declaring global variables']
['2020-07-29 05', '17', '18,053', 'INFO', 'Input provided', 'dataframe']
['2020-07-29 05', '17', '18,053', 'INFO', 'session_id set to', '6259']
['2020-07-29 05', '17', '18,053', 'INFO', 'Copying training dataset']
['2020-07-29 05', '17', '18,053', 'INFO', 'Importing stopwords from nltk']
['2020-07-29 05', '17', '18,328', 'INFO', 'No custom stopwords defined']
['2020-07-29 05', '17', '18,328', 'INFO', 'Removing numeric characters from the text']
['2020-07-29 05', '17', '18,489', 'INFO', 'Tokenizing Words']
['2020-07-29 05', '17', '18,614', 'INFO', 'Removing special characters from the text']
['2020-07-29 05', '17', '20,904', 'INFO', 'PyCaret NLP Module']

['2020-07-29 05', '23', '52,919', 'INFO', 'Preparing display monitor']
['2020-07-29 05', '23', '52,931', 'INFO', 'Importing libraries']
['2020-07-29 05', '23', '52,931', 'INFO', 'Declaring global variables']
['2020-07-29 05', '23', '52,931', 'INFO', 'Input provided', 'dataframe']
['2020-07-29 05', '23', '52,932', 'INFO', 'session_id set to', '3790']
['2020-07-29 05', '23', '52,932', 'INFO', 'Copying training dataset']
['2020-07-29 05', '23', '52,933', 'INFO', 'Importing stopwords from nltk']
['2020-07-29 05', '23', '53,333', 'INFO', 'No custom stopwords defined']
['2020-07-29 05', '23', '53,333', 'INFO', 'Removing numeric characters from the text']
['2020-07-29 05', '23', '53,673', 'INFO', 'Removing special characters from the text']
['2020-07-29 05', '23', '54,556', 'INFO', 'Tokenizing Words']
['2020-07-29 05', '23', '54,689', 'INFO', 'Removing stopwords after lemmatizing']
['2020-07-29 05', '23', '56,402', 'INFO', 'Tokenizing Words']
['2020-07-29 05', '23', '56,691', 'INFO', 'Creatin

['2020-07-29 05', '30', '39,364', 'INFO', 'Importing stopwords from nltk']
['2020-07-29 05', '30', '39,472', 'INFO', 'Removing stopwords']
['2020-07-29 05', '30', '39,662', 'INFO', 'No custom stopwords defined']
['2020-07-29 05', '30', '39,662', 'INFO', 'Removing numeric characters from the text']
['2020-07-29 05', '30', '39,768', 'INFO', 'Removing stopwords']
['2020-07-29 05', '30', '39,992', 'INFO', 'Removing special characters from the text']
['2020-07-29 05', '30', '40,412', 'INFO', 'gensim==3.8.3']
['2020-07-29 05', '30', '40,968', 'INFO', 'spacy==2.2.4']
['2020-07-29 05', '30', '41,655', 'INFO', 'nltk==3.5']
['2020-07-29 05', '30', '41,707', 'INFO', 'textblob==0.15.3']
['2020-07-29 05', '30', '42,289', 'INFO', 'pyLDAvis==2.1.2']
['2020-07-29 05', '30', '42,388', 'INFO', 'wordcloud==1.7.0']
['2020-07-29 05', '30', '42,560', 'INFO', 'Tokenizing Words']
['2020-07-29 05', '30', '43,026', 'INFO', 'mlflow==1.8.0']
['2020-07-29 05', '30', '43,027', 'INFO', 'Checking Exceptions']
['2020-

['2020-07-29 05', '37', '09,792', 'INFO', 'Checking environment']
['2020-07-29 05', '37', '09,792', 'INFO', 'python_version', '3.6.10']
['2020-07-29 05', '37', '09,792', 'INFO', 'python_build', "('default', 'May  7 2020 19", '46', "08')"]
['2020-07-29 05', '37', '09,793', 'INFO', 'machine', 'AMD64']
['2020-07-29 05', '37', '09,793', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']
['2020-07-29 05', '37', '09,833', 'INFO', 'Memory', 'svmem(total=17032478720, available=9680732160, percent=43.2, used=7351746560, free=9680732160)']
['2020-07-29 05', '37', '09,833', 'INFO', 'Physical Core', '4']
['2020-07-29 05', '37', '09,834', 'INFO', 'Logical Core', '8']
['2020-07-29 05', '37', '09,834', 'INFO', 'Checking libraries']
['2020-07-29 05', '37', '09,834', 'INFO', 'pd==1.0.4']
['2020-07-29 05', '37', '09,834', 'INFO', 'numpy==1.18.5']
['2020-07-29 05', '37', '09,955', 'INFO', 'Preparing display monitor']
['2020-07-29 05', '37', '09,965', 'INFO', 'Importing libraries']
['2020-07-29 05', '37', '

['2020-07-29 05', '48', '04,735', 'INFO', 'Importing libraries']
['2020-07-29 05', '48', '04,736', 'INFO', 'Declaring global variables']
['2020-07-29 05', '48', '04,736', 'INFO', 'Input provided', 'dataframe']
['2020-07-29 05', '48', '04,736', 'INFO', 'session_id set to', '6487']
['2020-07-29 05', '48', '04,736', 'INFO', 'Copying training dataset']
['2020-07-29 05', '48', '04,737', 'INFO', 'Importing stopwords from nltk']
['2020-07-29 05', '48', '04,952', 'INFO', 'Removing special characters from the text']
['2020-07-29 05', '48', '05,102', 'INFO', 'No custom stopwords defined']
['2020-07-29 05', '48', '05,103', 'INFO', 'Removing numeric characters from the text']
['2020-07-29 05', '48', '05,168', 'INFO', 'Creating MLFlow logs']
['2020-07-29 05', '48', '05,444', 'INFO', 'Removing special characters from the text']
['2020-07-29 05', '48', '05,724', 'INFO', 'setup() succesfully completed......................................']
['2020-07-29 05', '48', '05,724', 'INFO', 'Initializing creat

['2020-07-29 05', '52', '33,944', 'INFO', 'Checking environment']
['2020-07-29 05', '52', '33,944', 'INFO', 'python_version', '3.6.10']
['2020-07-29 05', '52', '33,944', 'INFO', 'python_build', "('default', 'May  7 2020 19", '46', "08')"]
['2020-07-29 05', '52', '33,944', 'INFO', 'machine', 'AMD64']
['2020-07-29 05', '52', '33,945', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']
['2020-07-29 05', '52', '33,980', 'INFO', 'Memory', 'svmem(total=17032478720, available=9567371264, percent=43.8, used=7465107456, free=9567371264)']
['2020-07-29 05', '52', '33,980', 'INFO', 'Physical Core', '4']
['2020-07-29 05', '52', '33,980', 'INFO', 'Logical Core', '8']
['2020-07-29 05', '52', '33,980', 'INFO', 'Checking libraries']
['2020-07-29 05', '52', '33,980', 'INFO', 'pd==1.0.4']
['2020-07-29 05', '52', '33,980', 'INFO', 'numpy==1.18.5']
['2020-07-29 05', '52', '34,498', 'INFO', 'gensim==3.8.3']
['2020-07-29 05', '52', '35,117', 'INFO', 'spacy==2.2.4']
['2020-07-29 05', '52', '35,293', 'INFO', 'g

['2020-07-29 05', '59', '10,100', 'INFO', 'nltk==3.5']
['2020-07-29 05', '59', '10,156', 'INFO', 'textblob==0.15.3']
['2020-07-29 05', '59', '10,749', 'INFO', 'pyLDAvis==2.1.2']
['2020-07-29 05', '59', '10,856', 'INFO', 'wordcloud==1.7.0']
['2020-07-29 05', '59', '11,026', 'INFO', 'Preloading libraries']
['2020-07-29 05', '59', '11,227', 'INFO', 'Preparing display monitor']
['2020-07-29 05', '59', '11,242', 'INFO', 'Importing libraries']
['2020-07-29 05', '59', '11,242', 'INFO', 'Declaring global variables']
['2020-07-29 05', '59', '11,242', 'INFO', 'Input provided', 'dataframe']
['2020-07-29 05', '59', '11,243', 'INFO', 'session_id set to', '5002']
['2020-07-29 05', '59', '11,243', 'INFO', 'Copying training dataset']
['2020-07-29 05', '59', '11,244', 'INFO', 'Importing stopwords from nltk']
['2020-07-29 05', '59', '11,495', 'INFO', 'mlflow==1.8.0']
['2020-07-29 05', '59', '11,496', 'INFO', 'Checking Exceptions']
['2020-07-29 05', '59', '11,529', 'INFO', 'No custom stopwords defined']


['2020-07-29 06', '09', '51,508', 'INFO', 'Preloading libraries']
['2020-07-29 06', '09', '51,508', 'INFO', 'Preparing display monitor']
['2020-07-29 06', '09', '51,513', 'INFO', 'PyCaret NLP Module']
['2020-07-29 06', '09', '51,513', 'INFO', 'version pycaret-nightly-0.39']
['2020-07-29 06', '09', '51,513', 'INFO', 'Initializing setup()']
['2020-07-29 06', '09', '51,513', 'INFO', 'USI', '4cd4']
['2020-07-29 06', '09', '51,514', 'INFO', 'setup(data=(6818, 7), target=en, custom_stopwords=None, html=False, session_id=None, log_experiment=True,']
['experiment_name=kiva_exp, log_plots=False, log_data=False, verbose=True)']
['2020-07-29 06', '09', '51,514', 'INFO', 'Checking environment']
['2020-07-29 06', '09', '51,514', 'INFO', 'python_version', '3.6.10']
['2020-07-29 06', '09', '51,514', 'INFO', 'python_build', "('default', 'May  7 2020 19", '46', "08')"]
['2020-07-29 06', '09', '51,514', 'INFO', 'machine', 'AMD64']
['2020-07-29 06', '09', '51,515', 'INFO', 'platform', 'Windows-10-10.0.18

['2020-07-29 06', '14', '19,785', 'INFO', 'USI', 'dc55']
['2020-07-29 06', '14', '19,786', 'INFO', 'setup(data=(6818, 7), target=en, custom_stopwords=None, html=False, session_id=None, log_experiment=True,']
['experiment_name=kiva_exp, log_plots=False, log_data=False, verbose=True)']
['2020-07-29 06', '14', '19,786', 'INFO', 'Checking environment']
['2020-07-29 06', '14', '19,786', 'INFO', 'python_version', '3.6.10']
['2020-07-29 06', '14', '19,786', 'INFO', 'python_build', "('default', 'May  7 2020 19", '46', "08')"]
['2020-07-29 06', '14', '19,786', 'INFO', 'machine', 'AMD64']
['2020-07-29 06', '14', '19,786', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']
['2020-07-29 06', '14', '19,827', 'INFO', 'Memory', 'svmem(total=17032478720, available=9622466560, percent=43.5, used=7410012160, free=9622466560)']
['2020-07-29 06', '14', '19,828', 'INFO', 'Physical Core', '4']
['2020-07-29 06', '14', '19,828', 'INFO', 'Logical Core', '8']
['2020-07-29 06', '14', '19,828', 'INFO', 'Checking li

['2020-07-29 06', '20', '47,068', 'INFO', 'version pycaret-nightly-0.39']
['2020-07-29 06', '20', '47,068', 'INFO', 'Initializing setup()']
['2020-07-29 06', '20', '47,068', 'INFO', 'USI', 'a5bd']
['2020-07-29 06', '20', '47,068', 'INFO', 'setup(data=(6818, 7), target=en, custom_stopwords=None, html=False, session_id=None, log_experiment=True,']
['experiment_name=kiva_exp, log_plots=False, log_data=False, verbose=True)']
['2020-07-29 06', '20', '47,068', 'INFO', 'Checking environment']
['2020-07-29 06', '20', '47,068', 'INFO', 'python_version', '3.6.10']
['2020-07-29 06', '20', '47,068', 'INFO', 'python_build', "('default', 'May  7 2020 19", '46', "08')"]
['2020-07-29 06', '20', '47,068', 'INFO', 'machine', 'AMD64']
['2020-07-29 06', '20', '47,069', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']
['2020-07-29 06', '20', '47,109', 'INFO', 'Memory', 'svmem(total=17032478720, available=9716658176, percent=43.0, used=7315820544, free=9716658176)']
['2020-07-29 06', '20', '47,109', 'INFO',

['2020-07-29 06', '27', '30,490', 'INFO', 'Removing stopwords']
['2020-07-29 06', '27', '30,536', 'INFO', 'Extracting Bigrams']
['2020-07-29 06', '27', '30,575', 'INFO', 'No custom stopwords defined']
['2020-07-29 06', '27', '30,575', 'INFO', 'Removing numeric characters from the text']
['2020-07-29 06', '27', '30,898', 'INFO', 'Removing special characters from the text']
['2020-07-29 06', '27', '33,639', 'INFO', 'Tokenizing Words']
['2020-07-29 06', '27', '34,039', 'INFO', 'Extracting Bigrams']
['2020-07-29 06', '27', '34,341', 'INFO', 'Extracting Bigrams']
['2020-07-29 06', '27', '40,196', 'INFO', 'Removing stopwords']
['2020-07-29 06', '27', '40,768', 'INFO', 'Extracting Trigrams']
['2020-07-29 06', '27', '44,113', 'INFO', 'Extracting Bigrams']
['2020-07-29 06', '27', '44,628', 'INFO', 'Extracting Trigrams']
['2020-07-29 06', '27', '44,859', 'INFO', 'Extracting Trigrams']
['2020-07-29 06', '27', '54,499', 'INFO', 'Extracting Trigrams']
['2020-07-29 06', '28', '00,033', 'INFO', 'Lemm

['2020-07-29 06', '38', '03,218', 'INFO', 'Compiling information grid']
['2020-07-29 06', '38', '03,744', 'INFO', 'Creating MLFlow logs']
['2020-07-29 06', '38', '04,283', 'INFO', 'gensim==3.8.3']
['2020-07-29 06', '38', '04,332', 'INFO', 'setup() succesfully completed......................................']
['2020-07-29 06', '38', '04,332', 'INFO', 'Initializing create_model()']
['2020-07-29 06', '38', '04,332', 'INFO', 'create_model(model=lda, multi_core=True, num_topics=None, verbose=True, system=True)']
['2020-07-29 06', '38', '04,333', 'INFO', 'Checking exceptions']
['2020-07-29 06', '38', '04,333', 'INFO', 'Preloading libraries']
['2020-07-29 06', '38', '04,333', 'INFO', 'Preparing display monitor']
['2020-07-29 06', '38', '04,345', 'INFO', 'Defining topic model']
['2020-07-29 06', '38', '04,345', 'INFO', 'Model', 'Latent Dirichlet Allocation']
['2020-07-29 06', '38', '04,345', 'INFO', 'Defining num_topics parameter']
['2020-07-29 06', '38', '04,346', 'INFO', 'num_topics set to',

['2020-07-29 06', '40', '31,899', 'INFO', 'Preparing display monitor']
['2020-07-29 06', '40', '31,910', 'INFO', 'Importing libraries']
['2020-07-29 06', '40', '31,910', 'INFO', 'Declaring global variables']
['2020-07-29 06', '40', '31,910', 'INFO', 'Input provided', 'dataframe']
['2020-07-29 06', '40', '31,910', 'INFO', 'session_id set to', '7482']
['2020-07-29 06', '40', '31,910', 'INFO', 'Copying training dataset']
['2020-07-29 06', '40', '31,911', 'INFO', 'Importing stopwords from nltk']
['2020-07-29 06', '40', '32,246', 'INFO', 'No custom stopwords defined']
['2020-07-29 06', '40', '32,247', 'INFO', 'Removing numeric characters from the text']
['2020-07-29 06', '40', '32,660', 'INFO', 'Removing special characters from the text']
['2020-07-29 06', '40', '33,317', 'INFO', 'Removing stopwords']
['2020-07-29 06', '40', '34,174', 'INFO', 'Extracting Bigrams']
['2020-07-29 06', '40', '35,260', 'INFO', 'Tokenizing Words']
['2020-07-29 06', '40', '37,000', 'INFO', 'Extracting Bigrams']
['

['2020-07-29 06', '51', '17,789', 'INFO', 'nltk==3.5']
['2020-07-29 06', '51', '17,848', 'INFO', 'textblob==0.15.3']
['2020-07-29 06', '51', '18,049', 'INFO', 'PyCaret NLP Module']
['2020-07-29 06', '51', '18,049', 'INFO', 'version pycaret-nightly-0.39']
['2020-07-29 06', '51', '18,050', 'INFO', 'Initializing setup()']
['2020-07-29 06', '51', '18,050', 'INFO', 'USI', 'd54e']
['2020-07-29 06', '51', '18,050', 'INFO', 'setup(data=(6818, 7), target=en, custom_stopwords=None, html=False, session_id=None, log_experiment=True,']
['experiment_name=kiva_exp, log_plots=False, log_data=False, verbose=True)']
['2020-07-29 06', '51', '18,050', 'INFO', 'Checking environment']
['2020-07-29 06', '51', '18,050', 'INFO', 'python_version', '3.6.10']
['2020-07-29 06', '51', '18,050', 'INFO', 'python_build', "('default', 'May  7 2020 19", '46', "08')"]
['2020-07-29 06', '51', '18,051', 'INFO', 'machine', 'AMD64']
['2020-07-29 06', '51', '18,051', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']
['2020-07-

['2020-07-29 06', '55', '41,854', 'INFO', 'Removing special characters from the text']
['2020-07-29 06', '55', '41,892', 'INFO', 'nltk==3.5']
['2020-07-29 06', '55', '41,940', 'INFO', 'textblob==0.15.3']
['2020-07-29 06', '55', '42,561', 'INFO', 'pyLDAvis==2.1.2']
['2020-07-29 06', '55', '42,666', 'INFO', 'wordcloud==1.7.0']
['2020-07-29 06', '55', '43,018', 'INFO', 'Removing stopwords']
['2020-07-29 06', '55', '43,309', 'INFO', 'mlflow==1.8.0']
['2020-07-29 06', '55', '43,309', 'INFO', 'Checking Exceptions']
['2020-07-29 06', '55', '43,421', 'INFO', 'Removing stopwords']
['2020-07-29 06', '55', '44,499', 'INFO', 'Tokenizing Words']
['2020-07-29 06', '55', '44,729', 'INFO', 'Preloading libraries']
['2020-07-29 06', '55', '44,926', 'INFO', 'Preparing display monitor']
['2020-07-29 06', '55', '44,939', 'INFO', 'Importing libraries']
['2020-07-29 06', '55', '44,939', 'INFO', 'Declaring global variables']
['2020-07-29 06', '55', '44,939', 'INFO', 'Input provided', 'dataframe']
['2020-07-29

['2020-07-29 07', '02', '04,812', 'INFO', 'No custom stopwords defined']
['2020-07-29 07', '02', '04,812', 'INFO', 'Removing numeric characters from the text']
['2020-07-29 07', '02', '05,001', 'INFO', 'nltk==3.5']
['2020-07-29 07', '02', '05,052', 'INFO', 'textblob==0.15.3']
['2020-07-29 07', '02', '05,217', 'INFO', 'Removing special characters from the text']
['2020-07-29 07', '02', '05,295', 'INFO', 'setup() succesfully completed......................................']
['2020-07-29 07', '02', '05,296', 'INFO', 'Initializing create_model()']
['2020-07-29 07', '02', '05,296', 'INFO', 'create_model(model=lda, multi_core=True, num_topics=None, verbose=True, system=True)']
['2020-07-29 07', '02', '05,296', 'INFO', 'Checking exceptions']
['2020-07-29 07', '02', '05,296', 'INFO', 'Preloading libraries']
['2020-07-29 07', '02', '05,296', 'INFO', 'Preparing display monitor']
['2020-07-29 07', '02', '05,312', 'INFO', 'Defining topic model']
['2020-07-29 07', '02', '05,312', 'INFO', 'Model', '

['experiment_name=kiva_exp, log_plots=False, log_data=False, verbose=True)']
['2020-07-29 07', '10', '44,205', 'INFO', 'Checking environment']
['2020-07-29 07', '10', '44,205', 'INFO', 'python_version', '3.6.10']
['2020-07-29 07', '10', '44,205', 'INFO', 'python_build', "('default', 'May  7 2020 19", '46', "08')"]
['2020-07-29 07', '10', '44,205', 'INFO', 'machine', 'AMD64']
['2020-07-29 07', '10', '44,206', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']
['2020-07-29 07', '10', '44,242', 'INFO', 'Memory', 'svmem(total=17032478720, available=9112604672, percent=46.5, used=7919874048, free=9112604672)']
['2020-07-29 07', '10', '44,242', 'INFO', 'Physical Core', '4']
['2020-07-29 07', '10', '44,242', 'INFO', 'Logical Core', '8']
['2020-07-29 07', '10', '44,243', 'INFO', 'Checking libraries']
['2020-07-29 07', '10', '44,243', 'INFO', 'pd==1.0.4']
['2020-07-29 07', '10', '44,243', 'INFO', 'numpy==1.18.5']
['2020-07-29 07', '10', '44,449', 'INFO', 'mlflow==1.8.0']
['2020-07-29 07', '10', '

['2020-07-29 07', '17', '24,586', 'INFO', 'LdaMulticore imported successfully']
['2020-07-29 07', '17', '25,223', 'INFO', 'Compiling processed text']
['2020-07-29 07', '17', '25,240', 'INFO', 'Compiling information grid']
['2020-07-29 07', '17', '25,766', 'INFO', 'Creating MLFlow logs']
['2020-07-29 07', '17', '26,365', 'INFO', 'setup() succesfully completed......................................']
['2020-07-29 07', '17', '26,365', 'INFO', 'Initializing create_model()']
['2020-07-29 07', '17', '26,365', 'INFO', 'create_model(model=lda, multi_core=True, num_topics=None, verbose=True, system=True)']
['2020-07-29 07', '17', '26,365', 'INFO', 'Checking exceptions']
['2020-07-29 07', '17', '26,365', 'INFO', 'Preloading libraries']
['2020-07-29 07', '17', '26,365', 'INFO', 'Preparing display monitor']
['2020-07-29 07', '17', '26,373', 'INFO', 'Defining topic model']
['2020-07-29 07', '17', '26,373', 'INFO', 'Model', 'Latent Dirichlet Allocation']
['2020-07-29 07', '17', '26,373', 'INFO', 'Def

['2020-07-29 07', '21', '37,924', 'INFO', 'version pycaret-nightly-0.39']
['2020-07-29 07', '21', '37,924', 'INFO', 'Initializing setup()']
['2020-07-29 07', '21', '37,925', 'INFO', 'USI', '1526']
['2020-07-29 07', '21', '37,925', 'INFO', 'setup(data=(6818, 7), target=en, custom_stopwords=None, html=False, session_id=None, log_experiment=True,']
['experiment_name=kiva_exp, log_plots=False, log_data=False, verbose=True)']
['2020-07-29 07', '21', '37,925', 'INFO', 'Checking environment']
['2020-07-29 07', '21', '37,925', 'INFO', 'python_version', '3.6.10']
['2020-07-29 07', '21', '37,925', 'INFO', 'python_build', "('default', 'May  7 2020 19", '46', "08')"]
['2020-07-29 07', '21', '37,925', 'INFO', 'machine', 'AMD64']
['2020-07-29 07', '21', '37,926', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']
['2020-07-29 07', '21', '37,942', 'INFO', 'mlflow==1.8.0']
['2020-07-29 07', '21', '37,943', 'INFO', 'Checking Exceptions']
['2020-07-29 07', '21', '37,961', 'INFO', 'Memory', 'svmem(total=17

['2020-07-29 07', '30', '32,878', 'INFO', 'numpy==1.18.5']
['2020-07-29 07', '30', '32,951', 'INFO', 'Creating corpus and dictionary']
['2020-07-29 07', '30', '33,976', 'INFO', 'Removing stopwords']
['2020-07-29 07', '30', '34,184', 'INFO', 'gensim==3.8.3']
['2020-07-29 07', '30', '34,772', 'INFO', 'Compiling processed text']
['2020-07-29 07', '30', '34,801', 'INFO', 'Compiling information grid']
['2020-07-29 07', '30', '34,805', 'INFO', 'spacy==2.2.4']
['2020-07-29 07', '30', '35,283', 'INFO', 'Creating MLFlow logs']
['2020-07-29 07', '30', '35,566', 'INFO', 'nltk==3.5']
['2020-07-29 07', '30', '35,627', 'INFO', 'textblob==0.15.3']
['2020-07-29 07', '30', '35,846', 'INFO', 'setup() succesfully completed......................................']
['2020-07-29 07', '30', '35,847', 'INFO', 'Initializing create_model()']
['2020-07-29 07', '30', '35,847', 'INFO', 'create_model(model=lda, multi_core=True, num_topics=None, verbose=True, system=True)']
['2020-07-29 07', '30', '35,847', 'INFO', '

["('feature_select', Empty()), ('fix_multi', Empty()),"]
["('dfs', Empty()), ('pca', Empty())],"]
['verbose=False), model_name=Transformation Pipeline, verbose=False)']
['2020-07-29 08', '23', '14,234', 'INFO', 'Appending prep pipeline']
['2020-07-29 08', '23', '14,239', 'INFO', 'Transformation Pipeline.pkl saved in current working directory']
['2020-07-29 08', '23', '14,246', 'INFO', '[Pipeline(memory=None,']
["steps=[('dtypes',"]
['DataTypes_Auto_infer(categorical_features=[],']
['display_types=True, features_todrop=[],']
["ml_usecase='classification',"]
["numerical_features=[], target='deposit',"]
['time_features=[])),']
["('imputer',"]
["Simple_Imputer(categorical_strategy='not_available',"]
["numeric_strategy='mean',"]
['target_variable=None)),']
["('new_levels1',"]
['New_Catagorical_Le...']
["('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),"]
["('P_transform', Empty()), ('pt_target', Empty()),"]
["('binn', Empty()), ('rem_outliers', Empty()),"]
["('cluster_all', E

['DataTypes_Auto_infer(categorical_features=[],']
['display_types=True, features_todrop=[],']
["ml_usecase='classification',"]
["numerical_features=[], target='deposit',"]
['time_features=[])),']
["('imputer',"]
["Simple_Imputer(categorical_strategy='not_available',"]
["numeric_strategy='mean',"]
['target_variable=None)),']
["('new_levels1',"]
['New_Catagorical_Le...']
["('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),"]
["('P_transform', Empty()), ('pt_target', Empty()),"]
["('binn', Empty()), ('rem_outliers', Empty()),"]
["('cluster_all', Empty()), ('dummy', Dummify(target='deposit')),"]
["('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),"]
["('feature_select', Empty()), ('fix_multi', Empty()),"]
["('dfs', Empty()), ('pca', Empty())],"]
["verbose=False), GradientBoostingClassifier(ccp_alpha=0.0, criterion='friedman_mse', init=None,"]
["learning_rate=0.1, loss='deviance', max_depth=3,"]
['max_features=None, max_leaf_nodes=None,']
['min_impurity_decrease=0

['2020-07-29 08', '29', '51,888', 'INFO', 'Evaluating Metrics']
['2020-07-29 08', '29', '52,380', 'INFO', 'Compiling Metrics']
['2020-07-29 08', '29', '52,401', 'INFO', 'Calculating mean and std']
['2020-07-29 08', '29', '52,402', 'INFO', 'Creating metrics dataframe']
['2020-07-29 08', '29', '52,418', 'INFO', 'Creating MLFlow logs']
['2020-07-29 08', '29', '52,683', 'INFO', 'Initializing save_model()']
['2020-07-29 08', '29', '52,683', 'INFO', "save_model(model=KNeighborsClassifier(algorithm='auto', leaf_size=30, metric='minkowski',"]
['metric_params=None, n_jobs=-1, n_neighbors=5, p=2,']
["weights='uniform'), model_name=Trained Model, verbose=False)"]
['2020-07-29 08', '29', '52,684', 'INFO', 'Appending prep pipeline']
['2020-07-29 08', '29', '52,719', 'INFO', 'Trained Model.pkl saved in current working directory']
['2020-07-29 08', '29', '52,729', 'INFO', '[Pipeline(memory=None,']
["steps=[('dtypes',"]
['DataTypes_Auto_infer(categorical_features=[],']
['display_types=True, features_t

['2020-07-29 08', '30', '36,480', 'INFO', 'save_model() succesfully completed......................................']
['2020-07-29 08', '30', '36,587', 'INFO', 'Initializing Ada Boost Classifier']
['2020-07-29 08', '30', '36,595', 'INFO', 'Initializing Fold 1']
['2020-07-29 08', '30', '36,603', 'INFO', 'Fitting Model']
['2020-07-29 08', '30', '36,766', 'INFO', 'Evaluating Metrics']
['2020-07-29 08', '30', '36,799', 'INFO', 'Compiling Metrics']
['2020-07-29 08', '30', '36,807', 'INFO', 'Initializing Fold 2']
['2020-07-29 08', '30', '36,816', 'INFO', 'Fitting Model']
['2020-07-29 08', '30', '36,974', 'INFO', 'Evaluating Metrics']
['2020-07-29 08', '30', '37,005', 'INFO', 'Compiling Metrics']
['2020-07-29 08', '30', '37,012', 'INFO', 'Initializing Fold 3']
['2020-07-29 08', '30', '37,019', 'INFO', 'Fitting Model']
['2020-07-29 08', '30', '37,168', 'INFO', 'Evaluating Metrics']
['2020-07-29 08', '30', '37,198', 'INFO', 'Compiling Metrics']
['2020-07-29 08', '30', '37,204', 'INFO', 'Initial

['display_types=True, features_todrop=[],']
["ml_usecase='classification',"]
["numerical_features=[], target='deposit',"]
['time_features=[])),']
["('imputer',"]
["Simple_Imputer(categorical_strategy='not_available',"]
["numeric_strategy='mean',"]
['target_variable=None)),']
["('new_levels1',"]
['New_Catagorical_Le...']
["('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),"]
["('P_transform', Empty()), ('pt_target', Empty()),"]
["('binn', Empty()), ('rem_outliers', Empty()),"]
["('cluster_all', Empty()), ('dummy', Dummify(target='deposit')),"]
["('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),"]
["('feature_select', Empty()), ('fix_multi', Empty()),"]
["('dfs', Empty()), ('pca', Empty())],"]
["verbose=False), DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',"]
['max_depth=None, max_features=None, max_leaf_nodes=None,']
['min_impurity_decrease=0.0, min_impurity_split=None,']
['min_samples_leaf=1, min_samples_split=2,']
["min_weight_fr

['max_features=None,']
['max_leaf_nodes=None,']
['min_impurity_decrease=0.0,']
['min_impurity_split=None,']
['min_samples_leaf=1,']
['min_samples_split=2,']
['min_weight_fraction_leaf=0.0,']
["presort='deprecated',"]
['random_state=123,']
["splitter='best'),"]
['bootstrap=True, bootstrap_features=False, max_features=1.0,']
['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']
['random_state=123, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']
['2020-07-29 08', '33', '23,619', 'INFO', 'Appending prep pipeline']
['2020-07-29 08', '33', '23,633', 'INFO', 'Trained Model.pkl saved in current working directory']
['2020-07-29 08', '33', '23,638', 'INFO', '[Pipeline(memory=None,']
["steps=[('dtypes',"]
['DataTypes_Auto_infer(categorical_features=[],']
['display_types=True, features_todrop=[],']
["ml_usecase='classification',"]
["numerical_features=[], target='deposit',"]
['time_features=[])),']
["('imputer',"]
["Simple_Imputer(categorical_strategy='not_avai

['2020-07-29 08', '33', '32,760', 'INFO', 'Base layer complete']
['2020-07-29 08', '33', '32,913', 'INFO', 'Defining folds']
['2020-07-29 08', '33', '32,915', 'INFO', 'Initializing Fold 1']
['2020-07-29 08', '33', '32,921', 'INFO', 'Fitting Model']
['2020-07-29 08', '33', '33,034', 'INFO', 'Evaluating Metrics']
['2020-07-29 08', '33', '33,268', 'INFO', 'Compiling Metrics']
['2020-07-29 08', '33', '33,288', 'INFO', 'Initializing Fold 2']
['2020-07-29 08', '33', '33,294', 'INFO', 'Fitting Model']
['2020-07-29 08', '33', '33,407', 'INFO', 'Evaluating Metrics']
['2020-07-29 08', '33', '33,632', 'INFO', 'Compiling Metrics']
['2020-07-29 08', '33', '33,651', 'INFO', 'Initializing Fold 3']
['2020-07-29 08', '33', '33,658', 'INFO', 'Fitting Model']
['2020-07-29 08', '33', '33,768', 'INFO', 'Evaluating Metrics']
['2020-07-29 08', '33', '34,003', 'INFO', 'Compiling Metrics']
['2020-07-29 08', '33', '34,021', 'INFO', 'Initializing Fold 4']
['2020-07-29 08', '33', '34,028', 'INFO', 'Fitting Model'

["numeric_strategy='mean',"]
['target_variable=None)),']
["('new_levels1',"]
['New_Catagorical_Le...']
["('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),"]
["('P_transform', Empty()), ('pt_target', Empty()),"]
["('binn', Empty()), ('rem_outliers', Empty()),"]
["('cluster_all', Empty()), ('dummy', Dummify(target='deposit')),"]
["('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),"]
["('feature_select', Empty()), ('fix_multi', Empty()),"]
["('dfs', Empty()), ('pca', Empty())],"]
["verbose=False), DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',"]
['max_depth=None, max_features=None, max_leaf_nodes=None,']
['min_impurity_decrease=0.0, min_impurity_split=None,']
['min_samples_leaf=1, min_samples_split=2,']
["min_weight_fraction_leaf=0.0, presort='deprecated',"]
["random_state=123, splitter='best')]"]
['2020-07-29 08', '33', '49,971', 'INFO', 'save_model() succesfully completed......................................']
['2020-07-29 08', '3

['2020-07-29 08', '41', '49,556', 'INFO', 'Importing untrained models']
['2020-07-29 08', '41', '49,557', 'INFO', 'Import successful']
['2020-07-29 08', '41', '49,565', 'INFO', 'Defining folds']
['2020-07-29 08', '41', '49,565', 'INFO', 'Declaring metric variables']
['2020-07-29 08', '41', '49,565', 'INFO', 'Initializing Linear Regression']
['2020-07-29 08', '41', '49,572', 'INFO', 'Initializing Fold 1']
['2020-07-29 08', '41', '49,578', 'INFO', 'Fitting Model']
['2020-07-29 08', '41', '49,582', 'INFO', 'Evaluating Metrics']
['2020-07-29 08', '41', '49,584', 'INFO', 'No inverse transformer found']
['2020-07-29 08', '41', '49,584', 'INFO', 'Compiling Metrics']
['2020-07-29 08', '41', '49,600', 'INFO', 'Initializing Fold 2']
['2020-07-29 08', '41', '49,605', 'INFO', 'Fitting Model']
['2020-07-29 08', '41', '49,609', 'INFO', 'Evaluating Metrics']
['2020-07-29 08', '41', '49,611', 'INFO', 'No inverse transformer found']
['2020-07-29 08', '41', '49,611', 'INFO', 'Compiling Metrics']
['2020-

['2020-07-29 08', '41', '52,792', 'INFO', 'Calculating mean and std']
['2020-07-29 08', '41', '52,793', 'INFO', 'Creating metrics dataframe']
['2020-07-29 08', '41', '52,808', 'INFO', 'Creating MLFlow logs']
['2020-07-29 08', '41', '52,971', 'INFO', 'Initializing save_model()']
['2020-07-29 08', '41', '52,971', 'INFO', 'save_model(model=PassiveAggressiveRegressor(C=1.0, average=False, early_stopping=False,']
['epsilon=0.1, fit_intercept=True,']
["loss='epsilon_insensitive', max_iter=1000,"]
['n_iter_no_change=5, random_state=123, shuffle=True,']
['tol=0.001, validation_fraction=0.1, verbose=0,']
['warm_start=False), model_name=Trained Model, verbose=False)']
['2020-07-29 08', '41', '52,971', 'INFO', 'Appending prep pipeline']
['2020-07-29 08', '41', '52,976', 'INFO', 'Trained Model.pkl saved in current working directory']
['2020-07-29 08', '41', '52,980', 'INFO', '[Pipeline(memory=None,']
["steps=[('dtypes',"]
['DataTypes_Auto_infer(categorical_features=[],']
['display_types=True, feat

['2020-07-29 08', '42', '05,400', 'INFO', 'Fitting Model']
['2020-07-29 08', '42', '05,416', 'INFO', 'Evaluating Metrics']
['2020-07-29 08', '42', '05,419', 'INFO', 'No inverse transformer found']
['2020-07-29 08', '42', '05,419', 'INFO', 'Compiling Metrics']
['2020-07-29 08', '42', '05,423', 'INFO', 'Calculating mean and std']
['2020-07-29 08', '42', '05,424', 'INFO', 'Creating metrics dataframe']
['2020-07-29 08', '42', '05,440', 'INFO', 'Creating MLFlow logs']
['2020-07-29 08', '42', '05,580', 'INFO', 'Initializing save_model()']
['2020-07-29 08', '42', '05,580', 'INFO', "save_model(model=AdaBoostRegressor(base_estimator=None, learning_rate=1.0, loss='linear',"]
['n_estimators=50, random_state=123), model_name=Trained Model, verbose=False)']
['2020-07-29 08', '42', '05,581', 'INFO', 'Appending prep pipeline']
['2020-07-29 08', '42', '05,587', 'INFO', 'Trained Model.pkl saved in current working directory']
['2020-07-29 08', '42', '05,592', 'INFO', '[Pipeline(memory=None,']
["steps=[(

['2020-07-29 08', '42', '18,363', 'INFO', 'No inverse transformation']
['2020-07-29 08', '42', '18,363', 'INFO', 'Compiling Metrics']
['2020-07-29 08', '42', '18,377', 'INFO', 'Initializing Fold 7']
['2020-07-29 08', '42', '18,379', 'INFO', 'Fitting Model']
['2020-07-29 08', '42', '18,477', 'INFO', 'Evaluating Metrics']
['2020-07-29 08', '42', '18,481', 'INFO', 'No inverse transformation']
['2020-07-29 08', '42', '18,481', 'INFO', 'Compiling Metrics']
['2020-07-29 08', '42', '18,494', 'INFO', 'Initializing Fold 8']
['2020-07-29 08', '42', '18,496', 'INFO', 'Fitting Model']
['2020-07-29 08', '42', '18,582', 'INFO', 'Evaluating Metrics']
['2020-07-29 08', '42', '18,586', 'INFO', 'No inverse transformation']
['2020-07-29 08', '42', '18,586', 'INFO', 'Compiling Metrics']
['2020-07-29 08', '42', '18,599', 'INFO', 'Initializing Fold 9']
['2020-07-29 08', '42', '18,601', 'INFO', 'Fitting Model']
['2020-07-29 08', '42', '18,698', 'INFO', 'Evaluating Metrics']
['2020-07-29 08', '42', '18,703', 

['2020-07-29 08', '42', '25,445', 'INFO', 'Uploading results into container']
['2020-07-29 08', '42', '25,445', 'INFO', 'Uploading model into container']
['2020-07-29 08', '42', '25,445', 'INFO', 'create_model_container', '6']
['2020-07-29 08', '42', '25,445', 'INFO', 'master_model_container', '6']
['2020-07-29 08', '42', '25,445', 'INFO', 'display_container', '7']
['2020-07-29 08', '42', '25,446', 'INFO', "LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,"]
["importance_type='split', learning_rate=0.1, max_depth=-1,"]
['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']
['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']
['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']
['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']
['2020-07-29 08', '42', '25,446', 'INFO', 'create_model() succesfully completed......................................']
['2020-07-29 08', '42', '25,446', 'INFO', 'Initializing create_mo

['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']
['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']
['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']
['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']
['2020-07-29 08', '42', '33,774', 'INFO', 'create_model() succesfully completed......................................']
['2020-07-29 08', '42', '33,774', 'INFO', 'Initializing create_model()']
['2020-07-29 08', '42', '33,774', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=True)']
['2020-07-29 08', '42', '33,774', 'INFO', 'Checking exceptions']
['2020-07-29 08', '42', '33,774', 'INFO', 'Preloading libraries']
['2020-07-29 08', '42', '33,774', 'INFO', 'Preparing display monitor']
['2020-07-29 08', '42', '33,786', 'INFO', 'Copying training dataset']
['2020-07-29 08', '42', '33,787', 'INFO', 'Importing libraries']
['2020-07-29 08', '42', '33,788

["steps=[('dtypes',"]
['DataTypes_Auto_infer(categorical_features=[],']
['display_types=True, features_todrop=[],']
["ml_usecase='regression',"]
["numerical_features=[], target='charges',"]
['time_features=[])),']
["('imputer',"]
["Simple_Imputer(categorical_strategy='not_available',"]
["numeric_strategy='mean',"]
['target_variable=None)),']
["('new_levels1',"]
['New_Catagorical_Levels...']
["('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),"]
["('P_transform', Empty()), ('pt_target', Empty()),"]
["('binn', Empty()), ('rem_outliers', Empty()),"]
["('cluster_all', Empty()), ('dummy', Dummify(target='charges')),"]
["('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),"]
["('feature_select', Empty()), ('fix_multi', Empty()),"]
["('dfs', Empty()), ('pca', Empty())],"]
["verbose=False), DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,"]
['max_features=None, max_leaf_nodes=None,']
['min_impurity_decrease=0.0, min_impurity_split=None,']
['min_sam

['max_samples=1.0, n_estimators=50, n_jobs=None, oob_score=False,']
['random_state=123, verbose=0, warm_start=False), None]']
['2020-07-29 08', '42', '58,871', 'INFO', 'save_model() succesfully completed......................................']
['2020-07-29 08', '42', '59,097', 'INFO', 'create_model_container', '15']
['2020-07-29 08', '42', '59,097', 'INFO', 'master_model_container', '15']
['2020-07-29 08', '42', '59,097', 'INFO', 'display_container', '16']
['2020-07-29 08', '42', '59,098', 'INFO', 'BaggingRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']
["criterion='mse',"]
['max_depth=None,']
['max_features=None,']
['max_leaf_nodes=None,']
['min_impurity_decrease=0.0,']
['min_impurity_split=None,']
['min_samples_leaf=1,']
['min_samples_split=2,']
['min_weight_fraction_leaf=0.0,']
["presort='deprecated',"]
['random_state=123,']
["splitter='best'),"]
['bootstrap=True, bootstrap_features=False, max_features=1.0,']
['max_samples=1.0, n_estimators=50, n_jobs=None, oob_score=

["verbose=False), AdaBoostRegressor(base_estimator=None, learning_rate=1.0, loss='linear',"]
['n_estimators=50, random_state=123), None]']
['2020-07-29 08', '43', '45,936', 'INFO', 'save_model() succesfully completed......................................']
['2020-07-29 08', '43', '46,042', 'INFO', 'Initializing Gradient Boosting Regressor']
['2020-07-29 08', '43', '46,047', 'INFO', 'Initializing Fold 1']
['2020-07-29 08', '43', '46,052', 'INFO', 'Fitting Model']
['2020-07-29 08', '43', '46,119', 'INFO', 'Evaluating Metrics']
['2020-07-29 08', '43', '46,121', 'INFO', 'No inverse transformer found']
['2020-07-29 08', '43', '46,121', 'INFO', 'Compiling Metrics']
['2020-07-29 08', '43', '46,127', 'INFO', 'Initializing Fold 2']
['2020-07-29 08', '43', '46,133', 'INFO', 'Fitting Model']
['2020-07-29 08', '43', '46,211', 'INFO', 'Evaluating Metrics']
['2020-07-29 08', '43', '46,213', 'INFO', 'No inverse transformer found']
['2020-07-29 08', '43', '46,213', 'INFO', 'Compiling Metrics']
['2020-

['max_features=None, max_leaf_nodes=None,']
['min_impurity_decrease=0.0, min_impurity_split=None,']
['min_samples_leaf=1, min_samples_split=2,']
['min_weight_fraction_leaf=0.0, n_estimators=100,']
["n_iter_no_change=None, presort='deprecated',"]
['random_state=123, subsample=1.0, tol=0.0001,']
["validation_fraction=0.1, verbose=0, warm_start=False), <catboost.core.CatBoostRegressor object at 0x00000236562B6E48>, RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',"]
["max_depth=None, max_features='auto', max_leaf_nodes=None,"]
['max_samples=None, min_impurity_decrease=0.0,']
['min_impurity_split=None, min_samples_leaf=1,']
['min_samples_split=2, min_weight_fraction_leaf=0.0,']
['n_estimators=100, n_jobs=-1, oob_score=False,']
["random_state=123, verbose=0, warm_start=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,"]
["importance_type='split', learning_rate=0.1, max_depth=-1,"]
['min_child_samples=20, min_child_weight=0.001, min_spli

["learning_rate=1.0, loss='linear', n_estimators=10,"]
['random_state=123), model_name=best-model, verbose=True)']
['2020-07-29 08', '44', '57,010', 'INFO', 'Appending prep pipeline']
['2020-07-29 08', '44', '57,026', 'INFO', 'best-model.pkl saved in current working directory']
['2020-07-29 08', '44', '57,034', 'INFO', '[Pipeline(memory=None,']
["steps=[('dtypes',"]
['DataTypes_Auto_infer(categorical_features=[],']
['display_types=True, features_todrop=[],']
["ml_usecase='regression',"]
["numerical_features=[], target='charges',"]
['time_features=[])),']
["('imputer',"]
["Simple_Imputer(categorical_strategy='not_available',"]
["numeric_strategy='mean',"]
['target_variable=None)),']
["('new_levels1',"]
['New_Catagorical_Levels...']
["('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),"]
["('P_transform', Empty()), ('pt_target', Empty()),"]
["('binn', Empty()), ('rem_outliers', Empty()),"]
["('cluster_all', Empty()), ('dummy', Dummify(target='charges')),"]
["('fix_perfect', 

['2020-07-29 09', '01', '29,229', 'INFO', 'Fitting PCA()']
['2020-07-29 09', '01', '29,234', 'INFO', 'Sorting dataframe']
['2020-07-29 09', '01', '29,235', 'INFO', 'Rendering Visual']
['2020-07-29 09', '01', '29,286', 'INFO', 'Visual Rendered Successfully']
['2020-07-29 09', '01', '29,286', 'INFO', 'plot_model() succesfully completed......................................']
['2020-07-29 09', '01', '29,292', 'INFO', 'Initializing plot_model()']
['2020-07-29 09', '01', '29,292', 'INFO', "plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,"]
["n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',"]
['random_state=123, tol=0.0001, verbose=0), plot=tsne, feature=None, label=False, save=False, system=True)']
['2020-07-29 09', '01', '29,292', 'INFO', 'Checking exceptions']
['2020-07-29 09', '01', '29,292', 'INFO', 'Importing libraries']
['2020-07-29 09', '01', '29,303', 'INFO', 'plot type', 'tsne']
['2020-07-29 09', '01', '29,303', 'INFO', 'I

# 11. MLFlow UI

In [21]:
!mlflow ui

Running the mlflow server failed. Please see the logs above for details.


# End
Thank you. For more information / tutorials on PyCaret, please visit https://www.pycaret.org