In [1]:
import numpy as np
import pandas as pd
from sklearn.preprocessing import StandardScaler
from deepforest import CascadeForestClassifier #import deep forest package
from sklearn.metrics import f1_score,precision_score,recall_score,accuracy_score,roc_auc_score

# This quick tutorial shows how to load and use an already-trained deep forest model

## Open your dataset

In [2]:
# Read the shuffled training and test tables (paths are relative to the
# notebook's working directory).
df_train, df_test = (
    pd.read_csv(csv_name) for csv_name in ("train_shuffle.csv", "test_shuffle.csv")
)

# The class label is stored at positional column 769 of both tables; pull it
# out of each table as a NumPy array.
train_label, test_label = (
    frame.iloc[:, 769].values for frame in (df_train, df_test)
)

In [3]:
# Show the training label array (the notebook repr abbreviates long arrays).
train_label

array([1, 1, 0, ..., 0, 0, 1])

## Get the extracted features (FEGS+BLOSUM62+Binary profile)

In [5]:
# Positional column ranges of the three descriptor groups inside the CSV
# tables (end index exclusive).
FEGS_COLS = slice(770, 1348)
BLOSUM_COLS = slice(1348, 2348)
BINARY_COLS = slice(2348, 3348)


def _split_feature_groups(df):
    """Slice one table into its FEGS, BLOSUM62 and binary-profile arrays.

    Parameters
    ----------
    df : pandas.DataFrame
        Table holding the descriptor columns at the positions given by
        ``FEGS_COLS``, ``BLOSUM_COLS`` and ``BINARY_COLS``.

    Returns
    -------
    tuple of numpy.ndarray
        ``(fegs, blosum, binary)``, each with one row per row of ``df``.

    Raises
    ------
    ValueError
        If ``df`` has fewer columns than the last range requires.
    """
    n_required = BINARY_COLS.stop
    # ``.iloc`` silently clips out-of-range slices, which would yield a
    # narrower feature matrix without any error; fail loudly instead.
    if df.shape[1] < n_required:
        raise ValueError(
            "expected at least %d columns, got %d" % (n_required, df.shape[1])
        )
    return tuple(
        df.iloc[:, cols].values for cols in (FEGS_COLS, BLOSUM_COLS, BINARY_COLS)
    )


# Training split: keep the individual groups and their column-wise concatenation.
train_FEGS, train_BLOSUM, train_Binary = _split_feature_groups(df_train)
train_FEGS_BLOSUM_Binary = np.concatenate((train_FEGS, train_BLOSUM, train_Binary), axis=1)

# Test split: same column layout, same group order.
test_FEGS, test_BLOSUM, test_Binary = _split_feature_groups(df_test)
test_FEGS_BLOSUM_Binary = np.concatenate((test_FEGS, test_BLOSUM, test_Binary), axis=1)

In [6]:
# Fit the scaler on the training matrix only, then apply that same fitted
# transform to both the training and the test matrix.
standardScaler = StandardScaler().fit(train_FEGS_BLOSUM_Binary)
train_FEGS_BLOSUM_Binary_std, test_FEGS_BLOSUM_Binary_std = map(
    standardScaler.transform,
    (train_FEGS_BLOSUM_Binary, test_FEGS_BLOSUM_Binary),
)

In [8]:
pwd  # IPython automagic (%pwd): prints the working directory that the relative paths in this notebook resolve against

'/home/yaolt/pythoncode/Anticancer/main'

## Import the model

In [9]:
# Create an empty CascadeForestClassifier and load the saved model from the
# "model/FEGS_BLOSUM_Binary" directory (relative to the working directory).
# NOTE(review): loading presumably unpickles files from that directory — only
# load model directories from a trusted source, and with library versions
# matching the ones used when the model was saved — TODO confirm.
model_FEGS_BLOSUM_Binary = CascadeForestClassifier()
model_FEGS_BLOSUM_Binary.load("model/FEGS_BLOSUM_Binary")

https://scikit-learn.org/stable/modules/model_persistence.html#security-maintainability-limitations


## Prediction 

In [11]:
# Run the loaded model on the standardized test features and keep its predictions.
y_pred = model_FEGS_BLOSUM_Binary.predict(test_FEGS_BLOSUM_Binary_std)

[2022-09-01 20:19:40.323] Start to evalute the model:
[2022-09-01 20:19:40.345] Evaluating cascade layer = 0 
[2022-09-01 20:19:40.578] Evaluating cascade layer = 1 
[2022-09-01 20:19:40.795] Evaluating cascade layer = 2 


In [12]:
# Show the predictions returned by the model for the test set.
y_pred

array([1, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 1,
       0, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0,
       0, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 0, 1,
       0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0,
       0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1,
       0, 0, 0, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1,
       0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1, 1, 0, 1, 1, 1, 0,
       0, 0, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 1,
       1, 1, 0, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1,
       1, 1, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0,
       0, 1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1,
       0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 1,
       1, 1, 1, 0, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 1, 1,
       1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 0, 1, 0,