# Models of Original Research Paper

The repository of the original research paper contains all 49 models. In this Notebook we read in several of these models (saved in joblib files) to gain some more insights into the models of the original paper. We mainly focused on the AdaBoost Classifier models, as this was the best performing model according to the research paper.

In [1]:
pip install joblib

Note: you may need to restart the kernel to use updated packages.


In [144]:
import os
import joblib
import sklearn

## Trained Models

In [82]:
#GradientBoosting classifier
modeltrain1 = joblib.load('original_trained\PPMI-genetic_p1E2_omic_p1E4.trainedModel.joblib')
modeltrain1

In [97]:
#SVC
modeltrain2 = joblib.load('original_trained\PPMI-genetic_p1E4_omic_p1E5.trainedModel.joblib')
modeltrain2

In [100]:
#LinearDiscriminantAnalysis
modeltrain3 = joblib.load('original_trained\PPMI-genetic_p1E4_omic_p1E7.trainedModel.joblib')
modeltrain3

In [106]:
#AdaBoost classifier
modeltrain4 = joblib.load('original_trained\PPMI-genetic_p1E5_omic_p1E2.trainedModel.joblib')
modeltrain4.n_estimators

50

In [123]:
#AdaBoost classifier
modeltrain5 = joblib.load('original_trained\PPMI-genetic_p1E5_omic_p1E4.trainedModel.joblib')
modeltrain5.n_estimators

50

In [136]:
#QuadraticDiscriminantAnalysis
modeltrain6 = joblib.load('original_trained\PPMI-genetic_p1E8_omic_p1E8.trainedModel.joblib')
modeltrain6

https://scikit-learn.org/stable/model_persistence.html#security-maintainability-limitations


## Tuned Models

In [75]:
# AdaBooster
modeltune1 = joblib.load('original_tuned\PPMI-genetic_p1E5_omic_p1E2.tunedModel.joblib')

In [76]:
modeltune1.n_estimators

551

In [77]:
modeltune1.estimators_

[DecisionTreeClassifier(max_depth=1, random_state=1658376856),
 DecisionTreeClassifier(max_depth=1, random_state=1746037600),
 DecisionTreeClassifier(max_depth=1, random_state=1105651351),
 DecisionTreeClassifier(max_depth=1, random_state=1539524900),
 DecisionTreeClassifier(max_depth=1, random_state=242580344),
 DecisionTreeClassifier(max_depth=1, random_state=1447303150),
 DecisionTreeClassifier(max_depth=1, random_state=19279710),
 DecisionTreeClassifier(max_depth=1, random_state=1706137340),
 DecisionTreeClassifier(max_depth=1, random_state=488420485),
 DecisionTreeClassifier(max_depth=1, random_state=577474134),
 DecisionTreeClassifier(max_depth=1, random_state=51376458),
 DecisionTreeClassifier(max_depth=1, random_state=18073300),
 DecisionTreeClassifier(max_depth=1, random_state=1249559522),
 DecisionTreeClassifier(max_depth=1, random_state=1221908557),
 DecisionTreeClassifier(max_depth=1, random_state=1125490551),
 DecisionTreeClassifier(max_depth=1, random_state=517139994),
 D

In [78]:
modeltune1.n_features_in_

673

In [147]:
modeltune1.learning_rate

1.0

In [66]:
#BaggingClassifier
#modeltune2 = joblib.load('original_tuned\PPMI-genetic_p1E4_omic_p1E6.tunedModel.joblib')
#modeltune2

In [37]:
#LinearDiscriminantAnalysis
modeltune3 = joblib.load('original_tuned\PPMI-genetic_p1E4_omic_p1E7.tunedModel.joblib')
modeltune3

In [36]:
#GradientBoosting classifier
modeltune4 = joblib.load('original_tuned\PPMI-genetic_p1E5_omic_p1E3.tunedModel.joblib')
modeltune4

In [138]:
#AdaBoost classifier
modeltune5 = joblib.load('original_tuned\PPMI-genetic_p1E5_omic_p1E4.tunedModel.joblib')
modeltune5.n_estimators

904

In [139]:
modeltune5.estimators_

[DecisionTreeClassifier(max_depth=1, random_state=560569298),
 DecisionTreeClassifier(max_depth=1, random_state=894170006),
 DecisionTreeClassifier(max_depth=1, random_state=1265984553),
 DecisionTreeClassifier(max_depth=1, random_state=1611067305),
 DecisionTreeClassifier(max_depth=1, random_state=1260423823),
 DecisionTreeClassifier(max_depth=1, random_state=233196491),
 DecisionTreeClassifier(max_depth=1, random_state=182294719),
 DecisionTreeClassifier(max_depth=1, random_state=392982206),
 DecisionTreeClassifier(max_depth=1, random_state=1810635925),
 DecisionTreeClassifier(max_depth=1, random_state=482591383),
 DecisionTreeClassifier(max_depth=1, random_state=911932643),
 DecisionTreeClassifier(max_depth=1, random_state=2086266736),
 DecisionTreeClassifier(max_depth=1, random_state=1679904360),
 DecisionTreeClassifier(max_depth=1, random_state=1574946850),
 DecisionTreeClassifier(max_depth=1, random_state=384254926),
 DecisionTreeClassifier(max_depth=1, random_state=116216436),
 

In [140]:
modeltune5.estimators_[0].max_features_

111

In [141]:
modeltune5.estimators_[0].classes_

array([0, 1], dtype=int64)

In [142]:
modeltune5.n_classes_

2

In [69]:
modeltune5.estimator_weights_

array([1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1.,
       1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1.,
       1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1.,
       1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1.,
       1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1.,
       1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1.,
       1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1.,
       1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1.,
       1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1.,
       1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1.,
       1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1.,
       1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1.,
       1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1., 1.,
       1., 1., 1., 1., 1.

In [71]:
modeltune5.n_features_in_

111

In [63]:
#MLP classifier
modeltune6 = joblib.load('original_tuned\PPMI-genetic_p1E5_omic_p1E7.tunedModel.joblib')
modeltune6

In [62]:
#LogisticRegression
modeltune7 = joblib.load('original_tuned\PPMI-genetic_p1E5_omic_p1E8.tunedModel.joblib')
modeltune7

In [61]:
#SVC
modeltune8 = joblib.load('original_tuned\PPMI-genetic_p1E4_omic_p1E5.tunedModel.joblib')
modeltune8

In [12]:
import random
randomlist = []
for i in range(0,673):
    n = random.randint(1,30)
    randomlist.append(n)

In [13]:
model.predict([randomlist])

array([0], dtype=int64)

In [14]:
model.estimators_

[DecisionTreeClassifier(max_depth=1, random_state=1658376856),
 DecisionTreeClassifier(max_depth=1, random_state=1746037600),
 DecisionTreeClassifier(max_depth=1, random_state=1105651351),
 DecisionTreeClassifier(max_depth=1, random_state=1539524900),
 DecisionTreeClassifier(max_depth=1, random_state=242580344),
 DecisionTreeClassifier(max_depth=1, random_state=1447303150),
 DecisionTreeClassifier(max_depth=1, random_state=19279710),
 DecisionTreeClassifier(max_depth=1, random_state=1706137340),
 DecisionTreeClassifier(max_depth=1, random_state=488420485),
 DecisionTreeClassifier(max_depth=1, random_state=577474134),
 DecisionTreeClassifier(max_depth=1, random_state=51376458),
 DecisionTreeClassifier(max_depth=1, random_state=18073300),
 DecisionTreeClassifier(max_depth=1, random_state=1249559522),
 DecisionTreeClassifier(max_depth=1, random_state=1221908557),
 DecisionTreeClassifier(max_depth=1, random_state=1125490551),
 DecisionTreeClassifier(max_depth=1, random_state=517139994),
 D