# Download testing data and unzip models.zip


In [1]:
# # find the share link of the file/folder on Google Drive
# file_share_links = [
#                     "https://drive.google.com/file/d/1pP81aU-10NWzVNbNnQUDvCeSrBLOkcWw/view?usp=sharing",   #sample_submission.csv
#                     "https://drive.google.com/file/d/1UEZzWcKk_QaHWzDMl6XdWGJLgkhiguj-/view?usp=sharing",   #test.csv
#                     "https://drive.google.com/file/d/1L7AYTx15-AQ2nXAuXm7hLC9HDvpKJCGw/view?usp=sharing",   #train.csv
#                     "", #models.zip
# ]

# for file_share_link in file_share_links:
#     # extract the ID of the file
#     file_id = file_share_link[file_share_link.find("d/") + 2: file_share_link.find('/view')]
#     print(file_id)

#     # append the id to this REST command
#     file_download_link = "https://docs.google.com/uc?export=download&id=" + file_id
#     print(file_download_link)


In [2]:
# !wget -O sample_submission.csv "https://docs.google.com/uc?export=download&id=1pP81aU-10NWzVNbNnQUDvCeSrBLOkcWw"
# !wget -O test.csv "https://docs.google.com/uc?export=download&id=1UEZzWcKk_QaHWzDMl6XdWGJLgkhiguj-"
# !wget -O train.csv "https://docs.google.com/uc?export=download&id=1L7AYTx15-AQ2nXAuXm7hLC9HDvpKJCGw"


## Upload trained `models.zip`

In [3]:
# # You need to upload the `models.zip` to Colab first
# !unzip -n models.zip

# Setup

In [4]:
import os
import time
from typing import Iterable

import numpy as np
import pandas as pd

# save scikit-learn model
from joblib import dump, load
# import pickle

import glob



# Functions

## def loadModels()

In [5]:
def loadModels(model_paths: Iterable[str]) -> list:
    """Load every serialized model listed in ``model_paths``.

    Parameters
    ----------
    model_paths
        Paths of the model files to read with ``joblib.load``. A single path
        passed as ``str`` or ``os.PathLike`` is treated as a one-element
        collection instead of being iterated character by character.

    Returns
    -------
    list
        The loaded objects, in the same order as ``model_paths``.
    """
    if isinstance(model_paths, (str, os.PathLike)):
        model_paths = [model_paths]

    # NOTE(review): joblib.load unpickles the file, which can execute arbitrary
    # code -- only point this at model files from a trusted source.
    return [load(model_path) for model_path in model_paths]

## def saveResult()

Format:

| id | label  |
|----|--------|
| xx | 0 or 1 |
| xx | 0 or 1 |
| xx | 0 or 1 |

In [6]:
def saveResult(df_result: pd.DataFrame,
               csv_name: str,
               label_name: str = 'label',
               folder: str = 'results'
               ) -> None:
    """Write the prediction column of ``df_result`` to ``<folder>/<csv_name>.csv``.

    The CSV holds the frame's index followed by the ``label_name`` column:

    | id | label |
    |----|-------|
    | xx | 0 or 1|

    Parameters
    ----------
    df_result
        Frame containing the predictions. Its index is written as the first
        CSV column, so the header of that column is the index name.
    csv_name
        Output file name without the ``.csv`` extension.
    label_name
        Name of the column to export.
    folder
        Destination directory; created (including parents) when missing.
        An empty string writes into the current working directory.
    """
    # exist_ok avoids the check-then-create race; the guard skips makedirs('')
    # which would raise for the "current directory" case.
    if folder:
        os.makedirs(folder, exist_ok=True)

    # Double brackets keep a one-column DataFrame so the header row is written.
    csv_path = os.path.join(folder, f'{csv_name}.csv')
    df_result[[label_name]].to_csv(csv_path, index=True)


## def testModel()

In [7]:
def testModel(model, 
               x_test: np.array
              ) -> list:
    """return prediction `pred_y` list"""

    print(model)
    print(model.__class__.__name__)

    # For testing data
    print('>>> For testing data')
    pred_y = model.predict(x_test)
    # pred_y_list.append(pred_y)
    print('pred_y[:5] =', pred_y[:5])

    # result = np.insert(x_test, 1, pred_y, axis=1)
    # print(result)
    # saveResult()
    # print('>>> Prediction result saved')
    print('=========================\n')

    return pred_y


# Run

## Load test data

In [8]:
# Folder layout. An empty `folder_data` means test.csv sits in the working directory.
folder_results = 'results'
folder_data = ''
folder_models = 'models'

path_test = os.path.join(folder_data, 'test.csv')

# Sorted so the models are always evaluated in the same order.
path_models = sorted(glob.glob(os.path.join(folder_models, '*.joblib')))

# Read the test set as a structured array: the CSV header row supplies the
# field names and every column is parsed as float.
test = np.genfromtxt(path_test, delimiter=',', names=True, dtype=float)

row_index_name = 'id'
label_name = 'label'
# Every column that is neither the row id nor the label is a model input.
feature_names = [name for name in test.dtype.names
                 if name not in (label_name, row_index_name)]

# View
print(f'row_index_name: {row_index_name}')
print(f'label_name: {label_name}')
print(f'feature columns: {feature_names}')

print('test.shape =', test.shape)


row_index_name: id
label_name: label
feature columns: ['MO_HLADR_MFI_cellsul', 'Neu_CD64MFI_cellsul', 'CD3T_cellsul', 'CD8T_cellsul', 'CD4T_cellsul', 'NK_cellsul', 'CD19_cellsul', 'CD45_cellsul', 'Age', 'Sex_0M1F', 'Mono_CD64MFI_cellsul']
test.shape = (59,)


In [9]:
# Convert the structured NumPy array into a DataFrame.
df_test = pd.DataFrame(test)

if row_index_name:
    # Use the id column as the index; it was parsed as float, so cast it back to int.
    df_test = df_test.set_index(row_index_name)
    df_test.index = df_test.index.astype(int)

display(df_test.head(3))
display(df_test.describe())
# DataFrame.info() prints its report itself and returns None, so wrapping it
# in display() only adds a stray "None" to the output.
df_test.info()


Unnamed: 0_level_0,MO_HLADR_MFI_cellsul,Neu_CD64MFI_cellsul,CD3T_cellsul,CD8T_cellsul,CD4T_cellsul,NK_cellsul,CD19_cellsul,CD45_cellsul,Age,Sex_0M1F,Mono_CD64MFI_cellsul
id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1
0,2843.0,156.0,1358.52,730.78,637.85,127.06,94.82,1588.62,45.0,1.0,3256.0
1,437.0,137.0,509.43,268.05,243.07,390.86,98.24,1002.76,51.0,1.0,491.0
2,826.0,82.0,1232.22,493.42,744.08,516.28,320.15,2200.58,32.0,0.0,1381.0


Unnamed: 0,MO_HLADR_MFI_cellsul,Neu_CD64MFI_cellsul,CD3T_cellsul,CD8T_cellsul,CD4T_cellsul,NK_cellsul,CD19_cellsul,CD45_cellsul,Age,Sex_0M1F,Mono_CD64MFI_cellsul
count,59.0,59.0,59.0,59.0,59.0,59.0,59.0,59.0,59.0,59.0,59.0
mean,1212.423729,206.491525,1085.340508,546.220339,523.237966,226.820339,115.048983,1439.65339,41.186441,0.355932,1971.220339
std,772.139285,248.195027,564.337155,342.37002,271.730902,189.056327,87.200827,689.02181,9.438503,0.482905,1137.384129
min,82.0,24.0,258.01,114.98,80.39,17.72,2.96,314.25,15.0,0.0,371.0
25%,696.5,65.0,629.89,268.3,336.955,88.33,59.5,914.84,34.5,0.0,1283.5
50%,1010.0,114.0,1025.32,433.61,511.0,174.86,98.24,1378.32,42.0,0.0,1701.0
75%,1623.0,232.0,1495.395,751.38,676.53,318.14,143.56,1855.05,49.0,1.0,2375.0
max,4195.0,1141.0,2771.2,1738.55,1225.68,956.78,501.91,3355.86,62.0,1.0,6788.0


<class 'pandas.core.frame.DataFrame'>
Int64Index: 59 entries, 0 to 58
Data columns (total 11 columns):
 #   Column                Non-Null Count  Dtype  
---  ------                --------------  -----  
 0   MO_HLADR_MFI_cellsul  59 non-null     float64
 1   Neu_CD64MFI_cellsul   59 non-null     float64
 2   CD3T_cellsul          59 non-null     float64
 3   CD8T_cellsul          59 non-null     float64
 4   CD4T_cellsul          59 non-null     float64
 5   NK_cellsul            59 non-null     float64
 6   CD19_cellsul          59 non-null     float64
 7   CD45_cellsul          59 non-null     float64
 8   Age                   59 non-null     float64
 9   Sex_0M1F              59 non-null     float64
 10  Mono_CD64MFI_cellsul  59 non-null     float64
dtypes: float64(11)
memory usage: 5.5 KB


None

## Load and test models

In [10]:
# Load every saved model, predict the test set with each one, and export one
# results CSV per model.
models = loadModels(path_models)

for model, path in zip(models, path_models):
    # The models emit float class labels (0. / 1.); store them as integers.
    pred_y = testModel(model, df_test[feature_names]).astype(int)

    # Work on a copy so `df_test` stays label-free for the next model.
    df_result = df_test.copy()
    df_result.insert(loc=0, column=label_name, value=pred_y)
    # Preview only: rendering the full frame for every model floods the output.
    display(df_result.head(10))

    # Name the CSV after the model file, e.g. 'models/foo.joblib' -> 'foo',
    # without assuming a particular path separator.
    csv_name = os.path.splitext(os.path.basename(path))[0]
    saveResult(df_result, csv_name, label_name, folder_results)

DecisionTreeClassifier(criterion='entropy', max_depth=10)
DecisionTreeClassifier
>>> For testing data
pred_y[:5] = [0. 0. 0. 0. 0.]



Unnamed: 0_level_0,label,MO_HLADR_MFI_cellsul,Neu_CD64MFI_cellsul,CD3T_cellsul,CD8T_cellsul,CD4T_cellsul,NK_cellsul,CD19_cellsul,CD45_cellsul,Age,Sex_0M1F,Mono_CD64MFI_cellsul
id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
0,0,2843.0,156.0,1358.52,730.78,637.85,127.06,94.82,1588.62,45.0,1.0,3256.0
1,0,437.0,137.0,509.43,268.05,243.07,390.86,98.24,1002.76,51.0,1.0,491.0
2,0,826.0,82.0,1232.22,493.42,744.08,516.28,320.15,2200.58,32.0,0.0,1381.0
3,0,861.0,50.0,1512.86,925.51,590.07,380.25,25.8,1929.1,50.0,0.0,1377.0
4,0,1160.0,157.0,890.42,403.91,489.53,266.92,87.63,1251.52,43.0,0.0,1844.0
5,1,867.0,85.0,1662.11,865.5,804.14,220.68,92.58,2063.11,44.0,1.0,986.0
6,0,1330.0,114.0,1307.95,710.86,607.96,271.01,214.49,1855.05,31.0,0.0,2077.0
7,0,494.0,48.0,1522.39,618.19,911.49,338.85,104.45,2013.05,36.0,1.0,1409.0
8,0,2119.0,73.0,1219.66,732.14,468.48,71.54,83.08,1378.32,45.0,1.0,2403.0
9,0,2052.0,39.0,1223.65,642.55,565.39,323.67,153.64,1711.88,36.0,0.0,1701.0


DecisionTreeClassifier(criterion='entropy', max_depth=15)
DecisionTreeClassifier
>>> For testing data
pred_y[:5] = [0. 0. 0. 0. 0.]



Unnamed: 0_level_0,label,MO_HLADR_MFI_cellsul,Neu_CD64MFI_cellsul,CD3T_cellsul,CD8T_cellsul,CD4T_cellsul,NK_cellsul,CD19_cellsul,CD45_cellsul,Age,Sex_0M1F,Mono_CD64MFI_cellsul
id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
0,0,2843.0,156.0,1358.52,730.78,637.85,127.06,94.82,1588.62,45.0,1.0,3256.0
1,0,437.0,137.0,509.43,268.05,243.07,390.86,98.24,1002.76,51.0,1.0,491.0
2,0,826.0,82.0,1232.22,493.42,744.08,516.28,320.15,2200.58,32.0,0.0,1381.0
3,0,861.0,50.0,1512.86,925.51,590.07,380.25,25.8,1929.1,50.0,0.0,1377.0
4,0,1160.0,157.0,890.42,403.91,489.53,266.92,87.63,1251.52,43.0,0.0,1844.0
5,1,867.0,85.0,1662.11,865.5,804.14,220.68,92.58,2063.11,44.0,1.0,986.0
6,0,1330.0,114.0,1307.95,710.86,607.96,271.01,214.49,1855.05,31.0,0.0,2077.0
7,0,494.0,48.0,1522.39,618.19,911.49,338.85,104.45,2013.05,36.0,1.0,1409.0
8,0,2119.0,73.0,1219.66,732.14,468.48,71.54,83.08,1378.32,45.0,1.0,2403.0
9,0,2052.0,39.0,1223.65,642.55,565.39,323.67,153.64,1711.88,36.0,0.0,1701.0


DecisionTreeClassifier(criterion='entropy', max_depth=20)
DecisionTreeClassifier
>>> For testing data
pred_y[:5] = [0. 1. 0. 0. 0.]



Unnamed: 0_level_0,label,MO_HLADR_MFI_cellsul,Neu_CD64MFI_cellsul,CD3T_cellsul,CD8T_cellsul,CD4T_cellsul,NK_cellsul,CD19_cellsul,CD45_cellsul,Age,Sex_0M1F,Mono_CD64MFI_cellsul
id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
0,0,2843.0,156.0,1358.52,730.78,637.85,127.06,94.82,1588.62,45.0,1.0,3256.0
1,1,437.0,137.0,509.43,268.05,243.07,390.86,98.24,1002.76,51.0,1.0,491.0
2,0,826.0,82.0,1232.22,493.42,744.08,516.28,320.15,2200.58,32.0,0.0,1381.0
3,0,861.0,50.0,1512.86,925.51,590.07,380.25,25.8,1929.1,50.0,0.0,1377.0
4,0,1160.0,157.0,890.42,403.91,489.53,266.92,87.63,1251.52,43.0,0.0,1844.0
5,1,867.0,85.0,1662.11,865.5,804.14,220.68,92.58,2063.11,44.0,1.0,986.0
6,0,1330.0,114.0,1307.95,710.86,607.96,271.01,214.49,1855.05,31.0,0.0,2077.0
7,0,494.0,48.0,1522.39,618.19,911.49,338.85,104.45,2013.05,36.0,1.0,1409.0
8,0,2119.0,73.0,1219.66,732.14,468.48,71.54,83.08,1378.32,45.0,1.0,2403.0
9,0,2052.0,39.0,1223.65,642.55,565.39,323.67,153.64,1711.88,36.0,0.0,1701.0


DecisionTreeClassifier(criterion='entropy', max_depth=5)
DecisionTreeClassifier
>>> For testing data
pred_y[:5] = [0. 1. 0. 0. 0.]



Unnamed: 0_level_0,label,MO_HLADR_MFI_cellsul,Neu_CD64MFI_cellsul,CD3T_cellsul,CD8T_cellsul,CD4T_cellsul,NK_cellsul,CD19_cellsul,CD45_cellsul,Age,Sex_0M1F,Mono_CD64MFI_cellsul
id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
0,0,2843.0,156.0,1358.52,730.78,637.85,127.06,94.82,1588.62,45.0,1.0,3256.0
1,1,437.0,137.0,509.43,268.05,243.07,390.86,98.24,1002.76,51.0,1.0,491.0
2,0,826.0,82.0,1232.22,493.42,744.08,516.28,320.15,2200.58,32.0,0.0,1381.0
3,0,861.0,50.0,1512.86,925.51,590.07,380.25,25.8,1929.1,50.0,0.0,1377.0
4,0,1160.0,157.0,890.42,403.91,489.53,266.92,87.63,1251.52,43.0,0.0,1844.0
5,1,867.0,85.0,1662.11,865.5,804.14,220.68,92.58,2063.11,44.0,1.0,986.0
6,0,1330.0,114.0,1307.95,710.86,607.96,271.01,214.49,1855.05,31.0,0.0,2077.0
7,0,494.0,48.0,1522.39,618.19,911.49,338.85,104.45,2013.05,36.0,1.0,1409.0
8,0,2119.0,73.0,1219.66,732.14,468.48,71.54,83.08,1378.32,45.0,1.0,2403.0
9,0,2052.0,39.0,1223.65,642.55,565.39,323.67,153.64,1711.88,36.0,0.0,1701.0


DecisionTreeClassifier(max_depth=10)
DecisionTreeClassifier
>>> For testing data
pred_y[:5] = [0. 0. 0. 0. 1.]



Unnamed: 0_level_0,label,MO_HLADR_MFI_cellsul,Neu_CD64MFI_cellsul,CD3T_cellsul,CD8T_cellsul,CD4T_cellsul,NK_cellsul,CD19_cellsul,CD45_cellsul,Age,Sex_0M1F,Mono_CD64MFI_cellsul
id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
0,0,2843.0,156.0,1358.52,730.78,637.85,127.06,94.82,1588.62,45.0,1.0,3256.0
1,0,437.0,137.0,509.43,268.05,243.07,390.86,98.24,1002.76,51.0,1.0,491.0
2,0,826.0,82.0,1232.22,493.42,744.08,516.28,320.15,2200.58,32.0,0.0,1381.0
3,0,861.0,50.0,1512.86,925.51,590.07,380.25,25.8,1929.1,50.0,0.0,1377.0
4,1,1160.0,157.0,890.42,403.91,489.53,266.92,87.63,1251.52,43.0,0.0,1844.0
5,0,867.0,85.0,1662.11,865.5,804.14,220.68,92.58,2063.11,44.0,1.0,986.0
6,1,1330.0,114.0,1307.95,710.86,607.96,271.01,214.49,1855.05,31.0,0.0,2077.0
7,0,494.0,48.0,1522.39,618.19,911.49,338.85,104.45,2013.05,36.0,1.0,1409.0
8,0,2119.0,73.0,1219.66,732.14,468.48,71.54,83.08,1378.32,45.0,1.0,2403.0
9,0,2052.0,39.0,1223.65,642.55,565.39,323.67,153.64,1711.88,36.0,0.0,1701.0


DecisionTreeClassifier(max_depth=15)
DecisionTreeClassifier
>>> For testing data
pred_y[:5] = [0. 0. 0. 0. 1.]



Unnamed: 0_level_0,label,MO_HLADR_MFI_cellsul,Neu_CD64MFI_cellsul,CD3T_cellsul,CD8T_cellsul,CD4T_cellsul,NK_cellsul,CD19_cellsul,CD45_cellsul,Age,Sex_0M1F,Mono_CD64MFI_cellsul
id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
0,0,2843.0,156.0,1358.52,730.78,637.85,127.06,94.82,1588.62,45.0,1.0,3256.0
1,0,437.0,137.0,509.43,268.05,243.07,390.86,98.24,1002.76,51.0,1.0,491.0
2,0,826.0,82.0,1232.22,493.42,744.08,516.28,320.15,2200.58,32.0,0.0,1381.0
3,0,861.0,50.0,1512.86,925.51,590.07,380.25,25.8,1929.1,50.0,0.0,1377.0
4,1,1160.0,157.0,890.42,403.91,489.53,266.92,87.63,1251.52,43.0,0.0,1844.0
5,0,867.0,85.0,1662.11,865.5,804.14,220.68,92.58,2063.11,44.0,1.0,986.0
6,1,1330.0,114.0,1307.95,710.86,607.96,271.01,214.49,1855.05,31.0,0.0,2077.0
7,0,494.0,48.0,1522.39,618.19,911.49,338.85,104.45,2013.05,36.0,1.0,1409.0
8,0,2119.0,73.0,1219.66,732.14,468.48,71.54,83.08,1378.32,45.0,1.0,2403.0
9,1,2052.0,39.0,1223.65,642.55,565.39,323.67,153.64,1711.88,36.0,0.0,1701.0


DecisionTreeClassifier(max_depth=20)
DecisionTreeClassifier
>>> For testing data
pred_y[:5] = [0. 0. 0. 0. 0.]



Unnamed: 0_level_0,label,MO_HLADR_MFI_cellsul,Neu_CD64MFI_cellsul,CD3T_cellsul,CD8T_cellsul,CD4T_cellsul,NK_cellsul,CD19_cellsul,CD45_cellsul,Age,Sex_0M1F,Mono_CD64MFI_cellsul
id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
0,0,2843.0,156.0,1358.52,730.78,637.85,127.06,94.82,1588.62,45.0,1.0,3256.0
1,0,437.0,137.0,509.43,268.05,243.07,390.86,98.24,1002.76,51.0,1.0,491.0
2,0,826.0,82.0,1232.22,493.42,744.08,516.28,320.15,2200.58,32.0,0.0,1381.0
3,0,861.0,50.0,1512.86,925.51,590.07,380.25,25.8,1929.1,50.0,0.0,1377.0
4,0,1160.0,157.0,890.42,403.91,489.53,266.92,87.63,1251.52,43.0,0.0,1844.0
5,0,867.0,85.0,1662.11,865.5,804.14,220.68,92.58,2063.11,44.0,1.0,986.0
6,0,1330.0,114.0,1307.95,710.86,607.96,271.01,214.49,1855.05,31.0,0.0,2077.0
7,1,494.0,48.0,1522.39,618.19,911.49,338.85,104.45,2013.05,36.0,1.0,1409.0
8,0,2119.0,73.0,1219.66,732.14,468.48,71.54,83.08,1378.32,45.0,1.0,2403.0
9,0,2052.0,39.0,1223.65,642.55,565.39,323.67,153.64,1711.88,36.0,0.0,1701.0


DecisionTreeClassifier(max_depth=5)
DecisionTreeClassifier
>>> For testing data
pred_y[:5] = [0. 1. 0. 0. 0.]



Unnamed: 0_level_0,label,MO_HLADR_MFI_cellsul,Neu_CD64MFI_cellsul,CD3T_cellsul,CD8T_cellsul,CD4T_cellsul,NK_cellsul,CD19_cellsul,CD45_cellsul,Age,Sex_0M1F,Mono_CD64MFI_cellsul
id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
0,0,2843.0,156.0,1358.52,730.78,637.85,127.06,94.82,1588.62,45.0,1.0,3256.0
1,1,437.0,137.0,509.43,268.05,243.07,390.86,98.24,1002.76,51.0,1.0,491.0
2,0,826.0,82.0,1232.22,493.42,744.08,516.28,320.15,2200.58,32.0,0.0,1381.0
3,0,861.0,50.0,1512.86,925.51,590.07,380.25,25.8,1929.1,50.0,0.0,1377.0
4,0,1160.0,157.0,890.42,403.91,489.53,266.92,87.63,1251.52,43.0,0.0,1844.0
5,0,867.0,85.0,1662.11,865.5,804.14,220.68,92.58,2063.11,44.0,1.0,986.0
6,0,1330.0,114.0,1307.95,710.86,607.96,271.01,214.49,1855.05,31.0,0.0,2077.0
7,1,494.0,48.0,1522.39,618.19,911.49,338.85,104.45,2013.05,36.0,1.0,1409.0
8,0,2119.0,73.0,1219.66,732.14,468.48,71.54,83.08,1378.32,45.0,1.0,2403.0
9,0,2052.0,39.0,1223.65,642.55,565.39,323.67,153.64,1711.88,36.0,0.0,1701.0


KNeighborsClassifier(n_neighbors=11)
KNeighborsClassifier
>>> For testing data
pred_y[:5] = [0. 0. 0. 0. 0.]



Unnamed: 0_level_0,label,MO_HLADR_MFI_cellsul,Neu_CD64MFI_cellsul,CD3T_cellsul,CD8T_cellsul,CD4T_cellsul,NK_cellsul,CD19_cellsul,CD45_cellsul,Age,Sex_0M1F,Mono_CD64MFI_cellsul
id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
0,0,2843.0,156.0,1358.52,730.78,637.85,127.06,94.82,1588.62,45.0,1.0,3256.0
1,0,437.0,137.0,509.43,268.05,243.07,390.86,98.24,1002.76,51.0,1.0,491.0
2,0,826.0,82.0,1232.22,493.42,744.08,516.28,320.15,2200.58,32.0,0.0,1381.0
3,0,861.0,50.0,1512.86,925.51,590.07,380.25,25.8,1929.1,50.0,0.0,1377.0
4,0,1160.0,157.0,890.42,403.91,489.53,266.92,87.63,1251.52,43.0,0.0,1844.0
5,0,867.0,85.0,1662.11,865.5,804.14,220.68,92.58,2063.11,44.0,1.0,986.0
6,0,1330.0,114.0,1307.95,710.86,607.96,271.01,214.49,1855.05,31.0,0.0,2077.0
7,0,494.0,48.0,1522.39,618.19,911.49,338.85,104.45,2013.05,36.0,1.0,1409.0
8,0,2119.0,73.0,1219.66,732.14,468.48,71.54,83.08,1378.32,45.0,1.0,2403.0
9,0,2052.0,39.0,1223.65,642.55,565.39,323.67,153.64,1711.88,36.0,0.0,1701.0


KNeighborsClassifier(n_neighbors=1)
KNeighborsClassifier
>>> For testing data
pred_y[:5] = [1. 0. 0. 0. 0.]



Unnamed: 0_level_0,label,MO_HLADR_MFI_cellsul,Neu_CD64MFI_cellsul,CD3T_cellsul,CD8T_cellsul,CD4T_cellsul,NK_cellsul,CD19_cellsul,CD45_cellsul,Age,Sex_0M1F,Mono_CD64MFI_cellsul
id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
0,1,2843.0,156.0,1358.52,730.78,637.85,127.06,94.82,1588.62,45.0,1.0,3256.0
1,0,437.0,137.0,509.43,268.05,243.07,390.86,98.24,1002.76,51.0,1.0,491.0
2,0,826.0,82.0,1232.22,493.42,744.08,516.28,320.15,2200.58,32.0,0.0,1381.0
3,0,861.0,50.0,1512.86,925.51,590.07,380.25,25.8,1929.1,50.0,0.0,1377.0
4,0,1160.0,157.0,890.42,403.91,489.53,266.92,87.63,1251.52,43.0,0.0,1844.0
5,0,867.0,85.0,1662.11,865.5,804.14,220.68,92.58,2063.11,44.0,1.0,986.0
6,0,1330.0,114.0,1307.95,710.86,607.96,271.01,214.49,1855.05,31.0,0.0,2077.0
7,0,494.0,48.0,1522.39,618.19,911.49,338.85,104.45,2013.05,36.0,1.0,1409.0
8,0,2119.0,73.0,1219.66,732.14,468.48,71.54,83.08,1378.32,45.0,1.0,2403.0
9,0,2052.0,39.0,1223.65,642.55,565.39,323.67,153.64,1711.88,36.0,0.0,1701.0


KNeighborsClassifier(n_neighbors=3)
KNeighborsClassifier
>>> For testing data
pred_y[:5] = [0. 0. 0. 0. 0.]



Unnamed: 0_level_0,label,MO_HLADR_MFI_cellsul,Neu_CD64MFI_cellsul,CD3T_cellsul,CD8T_cellsul,CD4T_cellsul,NK_cellsul,CD19_cellsul,CD45_cellsul,Age,Sex_0M1F,Mono_CD64MFI_cellsul
id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
0,0,2843.0,156.0,1358.52,730.78,637.85,127.06,94.82,1588.62,45.0,1.0,3256.0
1,0,437.0,137.0,509.43,268.05,243.07,390.86,98.24,1002.76,51.0,1.0,491.0
2,0,826.0,82.0,1232.22,493.42,744.08,516.28,320.15,2200.58,32.0,0.0,1381.0
3,0,861.0,50.0,1512.86,925.51,590.07,380.25,25.8,1929.1,50.0,0.0,1377.0
4,0,1160.0,157.0,890.42,403.91,489.53,266.92,87.63,1251.52,43.0,0.0,1844.0
5,0,867.0,85.0,1662.11,865.5,804.14,220.68,92.58,2063.11,44.0,1.0,986.0
6,0,1330.0,114.0,1307.95,710.86,607.96,271.01,214.49,1855.05,31.0,0.0,2077.0
7,0,494.0,48.0,1522.39,618.19,911.49,338.85,104.45,2013.05,36.0,1.0,1409.0
8,0,2119.0,73.0,1219.66,732.14,468.48,71.54,83.08,1378.32,45.0,1.0,2403.0
9,0,2052.0,39.0,1223.65,642.55,565.39,323.67,153.64,1711.88,36.0,0.0,1701.0


KNeighborsClassifier(n_neighbors=9)
KNeighborsClassifier
>>> For testing data
pred_y[:5] = [0. 0. 0. 0. 0.]



Unnamed: 0_level_0,label,MO_HLADR_MFI_cellsul,Neu_CD64MFI_cellsul,CD3T_cellsul,CD8T_cellsul,CD4T_cellsul,NK_cellsul,CD19_cellsul,CD45_cellsul,Age,Sex_0M1F,Mono_CD64MFI_cellsul
id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
0,0,2843.0,156.0,1358.52,730.78,637.85,127.06,94.82,1588.62,45.0,1.0,3256.0
1,0,437.0,137.0,509.43,268.05,243.07,390.86,98.24,1002.76,51.0,1.0,491.0
2,0,826.0,82.0,1232.22,493.42,744.08,516.28,320.15,2200.58,32.0,0.0,1381.0
3,0,861.0,50.0,1512.86,925.51,590.07,380.25,25.8,1929.1,50.0,0.0,1377.0
4,0,1160.0,157.0,890.42,403.91,489.53,266.92,87.63,1251.52,43.0,0.0,1844.0
5,0,867.0,85.0,1662.11,865.5,804.14,220.68,92.58,2063.11,44.0,1.0,986.0
6,0,1330.0,114.0,1307.95,710.86,607.96,271.01,214.49,1855.05,31.0,0.0,2077.0
7,0,494.0,48.0,1522.39,618.19,911.49,338.85,104.45,2013.05,36.0,1.0,1409.0
8,0,2119.0,73.0,1219.66,732.14,468.48,71.54,83.08,1378.32,45.0,1.0,2403.0
9,0,2052.0,39.0,1223.65,642.55,565.39,323.67,153.64,1711.88,36.0,0.0,1701.0


RandomForestClassifier(n_estimators=150)
RandomForestClassifier
>>> For testing data
pred_y[:5] = [0. 0. 0. 0. 0.]



Unnamed: 0_level_0,label,MO_HLADR_MFI_cellsul,Neu_CD64MFI_cellsul,CD3T_cellsul,CD8T_cellsul,CD4T_cellsul,NK_cellsul,CD19_cellsul,CD45_cellsul,Age,Sex_0M1F,Mono_CD64MFI_cellsul
id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
0,0,2843.0,156.0,1358.52,730.78,637.85,127.06,94.82,1588.62,45.0,1.0,3256.0
1,0,437.0,137.0,509.43,268.05,243.07,390.86,98.24,1002.76,51.0,1.0,491.0
2,0,826.0,82.0,1232.22,493.42,744.08,516.28,320.15,2200.58,32.0,0.0,1381.0
3,0,861.0,50.0,1512.86,925.51,590.07,380.25,25.8,1929.1,50.0,0.0,1377.0
4,0,1160.0,157.0,890.42,403.91,489.53,266.92,87.63,1251.52,43.0,0.0,1844.0
5,0,867.0,85.0,1662.11,865.5,804.14,220.68,92.58,2063.11,44.0,1.0,986.0
6,0,1330.0,114.0,1307.95,710.86,607.96,271.01,214.49,1855.05,31.0,0.0,2077.0
7,0,494.0,48.0,1522.39,618.19,911.49,338.85,104.45,2013.05,36.0,1.0,1409.0
8,0,2119.0,73.0,1219.66,732.14,468.48,71.54,83.08,1378.32,45.0,1.0,2403.0
9,0,2052.0,39.0,1223.65,642.55,565.39,323.67,153.64,1711.88,36.0,0.0,1701.0


RandomForestClassifier(n_estimators=200)
RandomForestClassifier
>>> For testing data
pred_y[:5] = [0. 0. 0. 0. 0.]



Unnamed: 0_level_0,label,MO_HLADR_MFI_cellsul,Neu_CD64MFI_cellsul,CD3T_cellsul,CD8T_cellsul,CD4T_cellsul,NK_cellsul,CD19_cellsul,CD45_cellsul,Age,Sex_0M1F,Mono_CD64MFI_cellsul
id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
0,0,2843.0,156.0,1358.52,730.78,637.85,127.06,94.82,1588.62,45.0,1.0,3256.0
1,0,437.0,137.0,509.43,268.05,243.07,390.86,98.24,1002.76,51.0,1.0,491.0
2,0,826.0,82.0,1232.22,493.42,744.08,516.28,320.15,2200.58,32.0,0.0,1381.0
3,0,861.0,50.0,1512.86,925.51,590.07,380.25,25.8,1929.1,50.0,0.0,1377.0
4,0,1160.0,157.0,890.42,403.91,489.53,266.92,87.63,1251.52,43.0,0.0,1844.0
5,0,867.0,85.0,1662.11,865.5,804.14,220.68,92.58,2063.11,44.0,1.0,986.0
6,0,1330.0,114.0,1307.95,710.86,607.96,271.01,214.49,1855.05,31.0,0.0,2077.0
7,0,494.0,48.0,1522.39,618.19,911.49,338.85,104.45,2013.05,36.0,1.0,1409.0
8,0,2119.0,73.0,1219.66,732.14,468.48,71.54,83.08,1378.32,45.0,1.0,2403.0
9,0,2052.0,39.0,1223.65,642.55,565.39,323.67,153.64,1711.88,36.0,0.0,1701.0


RandomForestClassifier(n_estimators=250)
RandomForestClassifier
>>> For testing data
pred_y[:5] = [0. 0. 0. 0. 0.]



Unnamed: 0_level_0,label,MO_HLADR_MFI_cellsul,Neu_CD64MFI_cellsul,CD3T_cellsul,CD8T_cellsul,CD4T_cellsul,NK_cellsul,CD19_cellsul,CD45_cellsul,Age,Sex_0M1F,Mono_CD64MFI_cellsul
id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
0,0,2843.0,156.0,1358.52,730.78,637.85,127.06,94.82,1588.62,45.0,1.0,3256.0
1,0,437.0,137.0,509.43,268.05,243.07,390.86,98.24,1002.76,51.0,1.0,491.0
2,0,826.0,82.0,1232.22,493.42,744.08,516.28,320.15,2200.58,32.0,0.0,1381.0
3,0,861.0,50.0,1512.86,925.51,590.07,380.25,25.8,1929.1,50.0,0.0,1377.0
4,0,1160.0,157.0,890.42,403.91,489.53,266.92,87.63,1251.52,43.0,0.0,1844.0
5,0,867.0,85.0,1662.11,865.5,804.14,220.68,92.58,2063.11,44.0,1.0,986.0
6,0,1330.0,114.0,1307.95,710.86,607.96,271.01,214.49,1855.05,31.0,0.0,2077.0
7,0,494.0,48.0,1522.39,618.19,911.49,338.85,104.45,2013.05,36.0,1.0,1409.0
8,0,2119.0,73.0,1219.66,732.14,468.48,71.54,83.08,1378.32,45.0,1.0,2403.0
9,0,2052.0,39.0,1223.65,642.55,565.39,323.67,153.64,1711.88,36.0,0.0,1701.0


RandomForestClassifier(n_estimators=300)
RandomForestClassifier
>>> For testing data
pred_y[:5] = [0. 0. 0. 0. 0.]



Unnamed: 0_level_0,label,MO_HLADR_MFI_cellsul,Neu_CD64MFI_cellsul,CD3T_cellsul,CD8T_cellsul,CD4T_cellsul,NK_cellsul,CD19_cellsul,CD45_cellsul,Age,Sex_0M1F,Mono_CD64MFI_cellsul
id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
0,0,2843.0,156.0,1358.52,730.78,637.85,127.06,94.82,1588.62,45.0,1.0,3256.0
1,0,437.0,137.0,509.43,268.05,243.07,390.86,98.24,1002.76,51.0,1.0,491.0
2,0,826.0,82.0,1232.22,493.42,744.08,516.28,320.15,2200.58,32.0,0.0,1381.0
3,0,861.0,50.0,1512.86,925.51,590.07,380.25,25.8,1929.1,50.0,0.0,1377.0
4,0,1160.0,157.0,890.42,403.91,489.53,266.92,87.63,1251.52,43.0,0.0,1844.0
5,0,867.0,85.0,1662.11,865.5,804.14,220.68,92.58,2063.11,44.0,1.0,986.0
6,0,1330.0,114.0,1307.95,710.86,607.96,271.01,214.49,1855.05,31.0,0.0,2077.0
7,0,494.0,48.0,1522.39,618.19,911.49,338.85,104.45,2013.05,36.0,1.0,1409.0
8,0,2119.0,73.0,1219.66,732.14,468.48,71.54,83.08,1378.32,45.0,1.0,2403.0
9,0,2052.0,39.0,1223.65,642.55,565.39,323.67,153.64,1711.88,36.0,0.0,1701.0


# Compress `results/` folder


In [11]:
# Recursively archive the results folder as `<folder_results>.<YYYYMMDD>.<HH>h<MM>m.zip`;
# the timestamp is taken in the Asia/Hong_Kong time zone.
!zip -r {folder_results}."$(TZ=':Asia/Hong_Kong' date +"%Y%m%d.%Hh%Mm")".zip {folder_results}

  adding: results/ (stored 0%)
  adding: results/rforest_250estimators_1.000acc.csv (deflated 55%)
  adding: results/knn_9n_1.000acc.csv (deflated 55%)
  adding: results/dectree_entropy_10depth_0.714acc.csv (deflated 54%)
  adding: results/dectree_entropy_15depth_0.714acc.csv (deflated 54%)
  adding: results/dectree_entropy_20depth_0.714acc.csv (deflated 54%)
  adding: results/knn_3n_0.857acc.csv (deflated 55%)
  adding: results/dectree_gini_5depth_1.000acc.csv (deflated 54%)
  adding: results/rforest_200estimators_1.000acc.csv (deflated 55%)
  adding: results/knn_1n_0.857acc.csv (deflated 55%)
  adding: results/rforest_150estimators_1.000acc.csv (deflated 55%)
  adding: results/dectree_entropy_5depth_1.000acc.csv (deflated 54%)
  adding: results/knn_11n_1.000acc.csv (deflated 56%)
  adding: results/dectree_gini_15depth_0.857acc.csv (deflated 54%)
  adding: results/dectree_gini_10depth_0.857acc.csv (deflated 54%)
  adding: results/dectree_gini_20depth_1.000acc.csv (defla

In [12]:
# Print the current Asia/Hong_Kong timestamp in the `YYYYMMDD.HHhMMm` format used for the archive name.
!echo "$(TZ=':Asia/Hong_Kong' date +"%Y%m%d.%Hh%Mm")"

20220405.19h49m


In [13]:
# !rm results/*.csv