# Drug Discovery, FAST-AI Tabular Model test


## DATASETS:
(a) Carbonic Anhydrase II (ChEMBL205), a protein lyase,  
(b) Cyclin-dependent kinase 2 (CHEMBL301), a protein kinase,  
(c) ether-a-go-go-related gene potassium channel 1 (HERG) (CHEMBL240), a voltage-gated ion channel,  
(d) Dopamine D4 receptor (CHEMBL219), a monoamine GPCR,  
(e) Coagulation factor X (CHEMBL244), a serine protease,  
(f) Cannabinoid CB1 receptor (CHEMBL218), a lipid-like GPCR and  
(g) Cytochrome P450 19A1 (CHEMBL1978), a cytochrome P450.  
The activity classes were selected based on data availability and as representatives of therapeutically important target classes or as anti-targets.

In [1]:
!nvidia-smi

Fri Apr  8 15:09:02 2022       
+-----------------------------------------------------------------------------+
| NVIDIA-SMI 450.156.00   Driver Version: 450.156.00   CUDA Version: 11.0     |
|-------------------------------+----------------------+----------------------+
| GPU  Name        Persistence-M| Bus-Id        Disp.A | Volatile Uncorr. ECC |
| Fan  Temp  Perf  Pwr:Usage/Cap|         Memory-Usage | GPU-Util  Compute M. |
|                               |                      |               MIG M. |
|   0  Tesla V100-DGXS...  On   | 00000000:07:00.0 Off |                    0 |
| N/A   38C    P0    54W / 300W |   8724MiB / 32505MiB |      0%      Default |
|                               |                      |                  N/A |
+-------------------------------+----------------------+----------------------+
|   1  Tesla V100-DGXS...  On   | 00000000:08:00.0 Off |                    0 |
| N/A   40C    P0    53W / 300W |   7050MiB / 32508MiB |      0%      Default |
|       

In [2]:
# Import
import pandas as pd
import numpy as np
from pathlib import Path

In [3]:
#%%capture
#!wget -c https://repo.continuum.io/miniconda/Miniconda3-latest-Linux-x86_64.sh
#!chmod +x Miniconda3-latest-Linux-x86_64.sh
#!time bash ./Miniconda3-latest-Linux-x86_64.sh -b -f -p /usr/local
#!time conda install -q -y -c conda-forge rdkit

In [4]:
from rdkit import Chem
from rdkit.Chem import AllChem

[15:09:03] Enabling RDKit 2019.09.3 jupyter extensions


In [5]:
top_mcc_scores = {
    
    'CHEMBL205': 0.862,
    'CHEMBL301': 0.926,
    'CHEMBL240': 0.884,
    'CHEMBL219': 0.887,
    'CHEMBL244': 0.983,
    'CHEMBL218': 0.941,
    'CHEMBL1978': 0.904}

In [6]:
path = Path('../dataset/13321_2017_226_MOESM1_ESM/')

In [7]:
#df.head()
list(path.iterdir())

[PosixPath('../dataset/13321_2017_226_MOESM1_ESM/mol_images'),
 PosixPath('../dataset/13321_2017_226_MOESM1_ESM/CHEMBL218'),
 PosixPath('../dataset/13321_2017_226_MOESM1_ESM/CHEMBL219'),
 PosixPath('../dataset/13321_2017_226_MOESM1_ESM/CHEMBL240'),
 PosixPath('../dataset/13321_2017_226_MOESM1_ESM/CHEMBL244'),
 PosixPath('../dataset/13321_2017_226_MOESM1_ESM/CHEMBL301'),
 PosixPath('../dataset/13321_2017_226_MOESM1_ESM/CHEMBL205'),
 PosixPath('../dataset/13321_2017_226_MOESM1_ESM/CHEMBL1978')]

In [8]:
dataset='CHEMBL205'

# TabularPandas

In [9]:
from sklearn.model_selection import train_test_split
from sklearn.metrics import auc,roc_auc_score,recall_score,precision_score,f1_score
from  sklearn.metrics import matthews_corrcoef
from sklearn.metrics import accuracy_score
from sklearn.model_selection import ParameterGrid

In [10]:
from fastai.tabular.all import *

In [11]:
def get_df(dataset, oversample = False):
    df = pd.read_csv(path/f'{dataset}/{dataset}_ecfp_512_activations_64.csv')
    X, y = df.drop(["CID", "SMILES", "Activity", 'Image', 'is_valid'], axis=1), df["Activity"]
    dep_var = ['Activity']
    cat_vars = X.columns
    cat_names = list(cat_vars)
    x_train, x_val = train_test_split(df.index, test_size=0.2, random_state=666, stratify=df['Activity'])
    df.loc[x_train, 'is_valid']=False
    df.loc[x_val, 'is_valid']=True
    if oversample:
        df = pd.concat([*[df.loc[(df.is_valid==False) & (df.Activity==1)]]*10, 
                            *[df.loc[(df.is_valid==False) & (df.Activity==0)]], 
                            df.loc[df.is_valid==True]], 
                            ignore_index=True)
    return df, dep_var, cat_vars, cat_names

In [12]:
df, dep_var, cat_vars, cat_names = get_df(dataset)

In [13]:
df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 17941 entries, 0 to 17940
Columns: 581 entries, CID to pca_63
dtypes: bool(1), float64(64), int64(513), object(3)
memory usage: 79.4+ MB


In [14]:
df.head()

Unnamed: 0,CID,SMILES,ECFP4_1,ECFP4_2,ECFP4_3,ECFP4_4,ECFP4_5,ECFP4_6,ECFP4_7,ECFP4_8,...,pca_54,pca_55,pca_56,pca_57,pca_58,pca_59,pca_60,pca_61,pca_62,pca_63
0,CHEMBL188002,S(=O)(=O)(N)c1cc(N/C(/S)=N\c2cc(C(=O)[O-])c(cc2)C=2c3c(OC4=CC(=O)C=CC=24)cc(O)cc3)ccc1,1,0,0,0,0,0,0,0,...,0.139053,-0.254431,0.414002,-0.016254,0.112134,0.111659,0.196388,-0.193955,0.004383,-0.429494
1,CHEMBL364127,Clc1ccc(cc1)C(=O)NC1Cc2cc(S(=O)(=O)N)ccc2C1,0,0,0,0,0,0,0,0,...,-0.001774,0.110718,0.005662,0.019671,0.170637,0.066581,0.245206,0.226241,0.06849,-0.025556
2,CHEMBL1683469,S(=O)(=O)(N)c1ccc(cc1)CNS(=O)(=O)CC12CCC(CC1=O)C2(C)C,0,0,0,0,0,0,0,0,...,-0.215584,0.272174,-0.173136,-0.261834,0.010428,-0.038368,0.184475,-0.12688,0.145626,0.179634
3,CHEMBL52564,Oc1ccccc1\C=C\C(=O)[O-],0,0,0,0,0,0,0,0,...,0.280948,-0.157399,-0.021701,0.064364,-0.219037,0.017443,-0.116238,0.05784,-0.238319,-0.199516
4,CHEMBL21427,OB(O)c1ccc(OC)cc1,1,0,0,0,0,0,0,0,...,-0.255639,0.419612,-0.214844,-0.029687,-0.507942,-0.045789,-0.219005,0.133554,-0.044429,-0.298659


In [15]:
train_idx = np.where(df.is_valid == False)[0]
valid_idx = np.where(df.is_valid == True)[0]
valid_idx

array([    5,    11,    13, ..., 17931, 17934, 17937])

In [16]:
def get_dls(df, dep_var, cat_vars, cat_names):
    train_idx = np.where(df.is_valid == False)[0]
    valid_idx = np.where(df.is_valid == True)[0]
    splits = (list(train_idx), list(valid_idx))
    procs = [Categorify, Normalize]
    to = TabularPandas(df, procs, cat_names=cat_names, y_names=dep_var, splits=splits, y_block = CategoryBlock(),
                      reduce_memory=True)
    to.show(3)
    to.items.head(3)
    dls = to.dataloaders(bs=32)
    return dls

In [17]:
dls = get_dls(df, dep_var, cat_vars, cat_names)

Unnamed: 0,ECFP4_1,ECFP4_2,ECFP4_3,ECFP4_4,ECFP4_5,ECFP4_6,ECFP4_7,ECFP4_8,ECFP4_9,ECFP4_10,ECFP4_11,ECFP4_12,ECFP4_13,ECFP4_14,ECFP4_15,ECFP4_16,ECFP4_17,ECFP4_18,ECFP4_19,ECFP4_20,ECFP4_21,ECFP4_22,ECFP4_23,ECFP4_24,ECFP4_25,ECFP4_26,ECFP4_27,ECFP4_28,ECFP4_29,ECFP4_30,ECFP4_31,ECFP4_32,ECFP4_33,ECFP4_34,ECFP4_35,ECFP4_36,ECFP4_37,ECFP4_38,ECFP4_39,ECFP4_40,ECFP4_41,ECFP4_42,ECFP4_43,ECFP4_44,ECFP4_45,ECFP4_46,ECFP4_47,ECFP4_48,ECFP4_49,ECFP4_50,ECFP4_51,ECFP4_52,ECFP4_53,ECFP4_54,ECFP4_55,ECFP4_56,ECFP4_57,ECFP4_58,ECFP4_59,ECFP4_60,ECFP4_61,ECFP4_62,ECFP4_63,ECFP4_64,ECFP4_65,ECFP4_66,ECFP4_67,ECFP4_68,ECFP4_69,ECFP4_70,ECFP4_71,ECFP4_72,ECFP4_73,ECFP4_74,ECFP4_75,ECFP4_76,ECFP4_77,ECFP4_78,ECFP4_79,ECFP4_80,ECFP4_81,ECFP4_82,ECFP4_83,ECFP4_84,ECFP4_85,ECFP4_86,ECFP4_87,ECFP4_88,ECFP4_89,ECFP4_90,ECFP4_91,ECFP4_92,ECFP4_93,ECFP4_94,ECFP4_95,ECFP4_96,ECFP4_97,ECFP4_98,ECFP4_99,ECFP4_100,ECFP4_101,ECFP4_102,ECFP4_103,ECFP4_104,ECFP4_105,ECFP4_106,ECFP4_107,ECFP4_108,ECFP4_109,ECFP4_110,ECFP4_111,ECFP4_112,ECFP4_113,ECFP4_114,ECFP4_115,ECFP4_116,ECFP4_117,ECFP4_118,ECFP4_119,ECFP4_120,ECFP4_121,ECFP4_122,ECFP4_123,ECFP4_124,ECFP4_125,ECFP4_126,ECFP4_127,ECFP4_128,ECFP4_129,ECFP4_130,ECFP4_131,ECFP4_132,ECFP4_133,ECFP4_134,ECFP4_135,ECFP4_136,ECFP4_137,ECFP4_138,ECFP4_139,ECFP4_140,ECFP4_141,ECFP4_142,ECFP4_143,ECFP4_144,ECFP4_145,ECFP4_146,ECFP4_147,ECFP4_148,ECFP4_149,ECFP4_150,ECFP4_151,ECFP4_152,ECFP4_153,ECFP4_154,ECFP4_155,ECFP4_156,ECFP4_157,ECFP4_158,ECFP4_159,ECFP4_160,ECFP4_161,ECFP4_162,ECFP4_163,ECFP4_164,ECFP4_165,ECFP4_166,ECFP4_167,ECFP4_168,ECFP4_169,ECFP4_170,ECFP4_171,ECFP4_172,ECFP4_173,ECFP4_174,ECFP4_175,ECFP4_176,ECFP4_177,ECFP4_178,ECFP4_179,ECFP4_180,ECFP4_181,ECFP4_182,ECFP4_183,ECFP4_184,ECFP4_185,ECFP4_186,ECFP4_187,ECFP4_188,ECFP4_189,ECFP4_190,ECFP4_191,ECFP4_192,ECFP4_193,ECFP4_194,ECFP4_195,ECFP4_196,ECFP4_197,ECFP4_198,ECFP4_199,ECFP4_200,ECFP4_201,ECFP4_202,ECFP4_203,ECFP4_204,ECFP4_205,ECFP4_206,ECFP4_207,ECFP4_208,ECFP4_209,ECFP4_210,ECFP4_211,ECFP4_212,ECFP4_213,ECFP4_214,ECFP4_215,ECFP4_216,ECFP4_217,ECFP4_218,ECFP4_219,ECFP4_220,ECFP4_221,ECFP4_222,ECFP4_223,ECFP4_224,ECFP4_225,ECFP4_226,ECFP4_227,ECFP4_228,ECFP4_229,ECFP4_230,ECFP4_231,ECFP4_232,ECFP4_233,ECFP4_234,ECFP4_235,ECFP4_236,ECFP4_237,ECFP4_238,ECFP4_239,ECFP4_240,ECFP4_241,ECFP4_242,ECFP4_243,ECFP4_244,ECFP4_245,ECFP4_246,ECFP4_247,ECFP4_248,ECFP4_249,ECFP4_250,ECFP4_251,ECFP4_252,ECFP4_253,ECFP4_254,ECFP4_255,ECFP4_256,ECFP4_257,ECFP4_258,ECFP4_259,ECFP4_260,ECFP4_261,ECFP4_262,ECFP4_263,ECFP4_264,ECFP4_265,ECFP4_266,ECFP4_267,ECFP4_268,ECFP4_269,ECFP4_270,ECFP4_271,ECFP4_272,ECFP4_273,ECFP4_274,ECFP4_275,ECFP4_276,ECFP4_277,ECFP4_278,ECFP4_279,ECFP4_280,ECFP4_281,ECFP4_282,ECFP4_283,ECFP4_284,ECFP4_285,ECFP4_286,ECFP4_287,ECFP4_288,ECFP4_289,ECFP4_290,ECFP4_291,ECFP4_292,ECFP4_293,ECFP4_294,ECFP4_295,ECFP4_296,ECFP4_297,ECFP4_298,ECFP4_299,ECFP4_300,ECFP4_301,ECFP4_302,ECFP4_303,ECFP4_304,ECFP4_305,ECFP4_306,ECFP4_307,ECFP4_308,ECFP4_309,ECFP4_310,ECFP4_311,ECFP4_312,ECFP4_313,ECFP4_314,ECFP4_315,ECFP4_316,ECFP4_317,ECFP4_318,ECFP4_319,ECFP4_320,ECFP4_321,ECFP4_322,ECFP4_323,ECFP4_324,ECFP4_325,ECFP4_326,ECFP4_327,ECFP4_328,ECFP4_329,ECFP4_330,ECFP4_331,ECFP4_332,ECFP4_333,ECFP4_334,ECFP4_335,ECFP4_336,ECFP4_337,ECFP4_338,ECFP4_339,ECFP4_340,ECFP4_341,ECFP4_342,ECFP4_343,ECFP4_344,ECFP4_345,ECFP4_346,ECFP4_347,ECFP4_348,ECFP4_349,ECFP4_350,ECFP4_351,ECFP4_352,ECFP4_353,ECFP4_354,ECFP4_355,ECFP4_356,ECFP4_357,ECFP4_358,ECFP4_359,ECFP4_360,ECFP4_361,ECFP4_362,ECFP4_363,ECFP4_364,ECFP4_365,ECFP4_366,ECFP4_367,ECFP4_368,ECFP4_369,ECFP4_370,ECFP4_371,ECFP4_372,ECFP4_373,ECFP4_374,ECFP4_375,ECFP4_376,ECFP4_377,ECFP4_378,ECFP4_379,ECFP4_380,ECFP4_381,ECFP4_382,ECFP4_383,ECFP4_384,ECFP4_385,ECFP4_386,ECFP4_387,ECFP4_388,ECFP4_389,ECFP4_390,ECFP4_391,ECFP4_392,ECFP4_393,ECFP4_394,ECFP4_395,ECFP4_396,ECFP4_397,ECFP4_398,ECFP4_399,ECFP4_400,ECFP4_401,ECFP4_402,ECFP4_403,ECFP4_404,ECFP4_405,ECFP4_406,ECFP4_407,ECFP4_408,ECFP4_409,ECFP4_410,ECFP4_411,ECFP4_412,ECFP4_413,ECFP4_414,ECFP4_415,ECFP4_416,ECFP4_417,ECFP4_418,ECFP4_419,ECFP4_420,ECFP4_421,ECFP4_422,ECFP4_423,ECFP4_424,ECFP4_425,ECFP4_426,ECFP4_427,ECFP4_428,ECFP4_429,ECFP4_430,ECFP4_431,ECFP4_432,ECFP4_433,ECFP4_434,ECFP4_435,ECFP4_436,ECFP4_437,ECFP4_438,ECFP4_439,ECFP4_440,ECFP4_441,ECFP4_442,ECFP4_443,ECFP4_444,ECFP4_445,ECFP4_446,ECFP4_447,ECFP4_448,ECFP4_449,ECFP4_450,ECFP4_451,ECFP4_452,ECFP4_453,ECFP4_454,ECFP4_455,ECFP4_456,ECFP4_457,ECFP4_458,ECFP4_459,ECFP4_460,ECFP4_461,ECFP4_462,ECFP4_463,ECFP4_464,ECFP4_465,ECFP4_466,ECFP4_467,ECFP4_468,ECFP4_469,ECFP4_470,ECFP4_471,ECFP4_472,ECFP4_473,ECFP4_474,ECFP4_475,ECFP4_476,ECFP4_477,ECFP4_478,ECFP4_479,ECFP4_480,ECFP4_481,ECFP4_482,ECFP4_483,ECFP4_484,ECFP4_485,ECFP4_486,ECFP4_487,ECFP4_488,ECFP4_489,ECFP4_490,ECFP4_491,ECFP4_492,ECFP4_493,ECFP4_494,ECFP4_495,ECFP4_496,ECFP4_497,ECFP4_498,ECFP4_499,ECFP4_500,ECFP4_501,ECFP4_502,ECFP4_503,ECFP4_504,ECFP4_505,ECFP4_506,ECFP4_507,ECFP4_508,ECFP4_509,ECFP4_510,ECFP4_511,ECFP4_512,pca_0,pca_1,pca_2,pca_3,pca_4,pca_5,pca_6,pca_7,pca_8,pca_9,pca_10,pca_11,pca_12,pca_13,pca_14,pca_15,pca_16,pca_17,pca_18,pca_19,pca_20,pca_21,pca_22,pca_23,pca_24,pca_25,pca_26,pca_27,pca_28,pca_29,pca_30,pca_31,pca_32,pca_33,pca_34,pca_35,pca_36,pca_37,pca_38,pca_39,pca_40,pca_41,pca_42,pca_43,pca_44,pca_45,pca_46,pca_47,pca_48,pca_49,pca_50,pca_51,pca_52,pca_53,pca_54,pca_55,pca_56,pca_57,pca_58,pca_59,pca_60,pca_61,pca_62,pca_63,Activity
0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,1,0,1,0,1,0,0,1,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,1,0,0,0,0,1,1,0,0,0,1,1,0,0,0,0,0,0,0,1,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,1,1,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,-2.58621,-10.225819,3.635715,-6.131528,-4.4481,-0.271146,-2.061514,0.656935,-1.278405,1.323977,-0.24571,-0.848637,-0.267102,0.840549,1.072798,-0.42052,-0.884244,0.132357,0.455445,-0.096275,-0.823238,0.290103,-0.0536,0.074537,0.380466,-0.216592,-0.185393,0.222247,-0.094523,0.098569,-0.449016,0.363437,0.282462,0.339721,-0.043617,0.132,-0.280592,-0.077076,0.189862,0.091102,0.040708,-0.288147,-0.090654,0.211012,0.294782,0.160358,-0.122637,0.113237,-0.076807,0.118681,-0.24904,0.050189,-0.171804,0.171463,0.139053,-0.254431,0.414002,-0.016254,0.112134,0.111659,0.196388,-0.193955,0.004383,-0.429494,1
1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,1,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,-9.816868,-18.622707,23.533211,-2.086306,4.083374,-1.902859,-0.34528,-3.000134,-0.599573,0.67915,-0.723131,-1.176993,0.01679,-1.370808,0.764996,1.442556,-1.926203,0.773776,-0.104462,-0.267454,-0.703544,-0.239739,0.192719,-0.222985,-0.231201,0.153058,0.097045,-0.012666,-0.16305,-0.151875,-0.239757,-0.212058,0.098664,-0.175905,-0.141147,-0.083352,0.10853,-0.310144,0.036012,-0.233646,0.378318,-0.009732,-0.097614,-0.203805,-0.045395,-0.161351,0.090067,0.077571,-0.208884,-0.117598,0.471341,0.025639,0.005718,-0.064647,-0.001774,0.110718,0.005662,0.019671,0.170637,0.066581,0.245206,0.226241,0.06849,-0.025556,1
2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,1,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,-11.547492,-17.93384,18.69618,-5.110664,1.468231,-2.254717,-1.461575,-1.878682,0.979978,-0.579781,-0.824583,-0.529804,-0.594658,-1.247169,1.200846,1.033458,-1.676035,0.79456,-0.091967,-0.417993,-0.291881,-0.062849,0.086349,-0.171252,-0.065032,-0.145549,0.214688,0.026512,-0.203051,-0.082079,0.148191,-0.042833,-0.436807,-0.065552,0.131823,-0.316843,0.07285,-0.217953,-0.168401,-0.28399,0.189408,-0.078982,-0.0115,-0.245735,-0.394431,0.089192,-0.074878,-0.1975,-0.072153,0.157782,0.111821,-0.174444,0.108647,0.10308,-0.215584,0.272174,-0.173136,-0.261834,0.010428,-0.038368,0.184475,-0.12688,0.145626,0.179634,1


In [18]:
dls.show_batch()

Unnamed: 0,ECFP4_1,ECFP4_2,ECFP4_3,ECFP4_4,ECFP4_5,ECFP4_6,ECFP4_7,ECFP4_8,ECFP4_9,ECFP4_10,ECFP4_11,ECFP4_12,ECFP4_13,ECFP4_14,ECFP4_15,ECFP4_16,ECFP4_17,ECFP4_18,ECFP4_19,ECFP4_20,ECFP4_21,ECFP4_22,ECFP4_23,ECFP4_24,ECFP4_25,ECFP4_26,ECFP4_27,ECFP4_28,ECFP4_29,ECFP4_30,ECFP4_31,ECFP4_32,ECFP4_33,ECFP4_34,ECFP4_35,ECFP4_36,ECFP4_37,ECFP4_38,ECFP4_39,ECFP4_40,ECFP4_41,ECFP4_42,ECFP4_43,ECFP4_44,ECFP4_45,ECFP4_46,ECFP4_47,ECFP4_48,ECFP4_49,ECFP4_50,ECFP4_51,ECFP4_52,ECFP4_53,ECFP4_54,ECFP4_55,ECFP4_56,ECFP4_57,ECFP4_58,ECFP4_59,ECFP4_60,ECFP4_61,ECFP4_62,ECFP4_63,ECFP4_64,ECFP4_65,ECFP4_66,ECFP4_67,ECFP4_68,ECFP4_69,ECFP4_70,ECFP4_71,ECFP4_72,ECFP4_73,ECFP4_74,ECFP4_75,ECFP4_76,ECFP4_77,ECFP4_78,ECFP4_79,ECFP4_80,ECFP4_81,ECFP4_82,ECFP4_83,ECFP4_84,ECFP4_85,ECFP4_86,ECFP4_87,ECFP4_88,ECFP4_89,ECFP4_90,ECFP4_91,ECFP4_92,ECFP4_93,ECFP4_94,ECFP4_95,ECFP4_96,ECFP4_97,ECFP4_98,ECFP4_99,ECFP4_100,ECFP4_101,ECFP4_102,ECFP4_103,ECFP4_104,ECFP4_105,ECFP4_106,ECFP4_107,ECFP4_108,ECFP4_109,ECFP4_110,ECFP4_111,ECFP4_112,ECFP4_113,ECFP4_114,ECFP4_115,ECFP4_116,ECFP4_117,ECFP4_118,ECFP4_119,ECFP4_120,ECFP4_121,ECFP4_122,ECFP4_123,ECFP4_124,ECFP4_125,ECFP4_126,ECFP4_127,ECFP4_128,ECFP4_129,ECFP4_130,ECFP4_131,ECFP4_132,ECFP4_133,ECFP4_134,ECFP4_135,ECFP4_136,ECFP4_137,ECFP4_138,ECFP4_139,ECFP4_140,ECFP4_141,ECFP4_142,ECFP4_143,ECFP4_144,ECFP4_145,ECFP4_146,ECFP4_147,ECFP4_148,ECFP4_149,ECFP4_150,ECFP4_151,ECFP4_152,ECFP4_153,ECFP4_154,ECFP4_155,ECFP4_156,ECFP4_157,ECFP4_158,ECFP4_159,ECFP4_160,ECFP4_161,ECFP4_162,ECFP4_163,ECFP4_164,ECFP4_165,ECFP4_166,ECFP4_167,ECFP4_168,ECFP4_169,ECFP4_170,ECFP4_171,ECFP4_172,ECFP4_173,ECFP4_174,ECFP4_175,ECFP4_176,ECFP4_177,ECFP4_178,ECFP4_179,ECFP4_180,ECFP4_181,ECFP4_182,ECFP4_183,ECFP4_184,ECFP4_185,ECFP4_186,ECFP4_187,ECFP4_188,ECFP4_189,ECFP4_190,ECFP4_191,ECFP4_192,ECFP4_193,ECFP4_194,ECFP4_195,ECFP4_196,ECFP4_197,ECFP4_198,ECFP4_199,ECFP4_200,ECFP4_201,ECFP4_202,ECFP4_203,ECFP4_204,ECFP4_205,ECFP4_206,ECFP4_207,ECFP4_208,ECFP4_209,ECFP4_210,ECFP4_211,ECFP4_212,ECFP4_213,ECFP4_214,ECFP4_215,ECFP4_216,ECFP4_217,ECFP4_218,ECFP4_219,ECFP4_220,ECFP4_221,ECFP4_222,ECFP4_223,ECFP4_224,ECFP4_225,ECFP4_226,ECFP4_227,ECFP4_228,ECFP4_229,ECFP4_230,ECFP4_231,ECFP4_232,ECFP4_233,ECFP4_234,ECFP4_235,ECFP4_236,ECFP4_237,ECFP4_238,ECFP4_239,ECFP4_240,ECFP4_241,ECFP4_242,ECFP4_243,ECFP4_244,ECFP4_245,ECFP4_246,ECFP4_247,ECFP4_248,ECFP4_249,ECFP4_250,ECFP4_251,ECFP4_252,ECFP4_253,ECFP4_254,ECFP4_255,ECFP4_256,ECFP4_257,ECFP4_258,ECFP4_259,ECFP4_260,ECFP4_261,ECFP4_262,ECFP4_263,ECFP4_264,ECFP4_265,ECFP4_266,ECFP4_267,ECFP4_268,ECFP4_269,ECFP4_270,ECFP4_271,ECFP4_272,ECFP4_273,ECFP4_274,ECFP4_275,ECFP4_276,ECFP4_277,ECFP4_278,ECFP4_279,ECFP4_280,ECFP4_281,ECFP4_282,ECFP4_283,ECFP4_284,ECFP4_285,ECFP4_286,ECFP4_287,ECFP4_288,ECFP4_289,ECFP4_290,ECFP4_291,ECFP4_292,ECFP4_293,ECFP4_294,ECFP4_295,ECFP4_296,ECFP4_297,ECFP4_298,ECFP4_299,ECFP4_300,ECFP4_301,ECFP4_302,ECFP4_303,ECFP4_304,ECFP4_305,ECFP4_306,ECFP4_307,ECFP4_308,ECFP4_309,ECFP4_310,ECFP4_311,ECFP4_312,ECFP4_313,ECFP4_314,ECFP4_315,ECFP4_316,ECFP4_317,ECFP4_318,ECFP4_319,ECFP4_320,ECFP4_321,ECFP4_322,ECFP4_323,ECFP4_324,ECFP4_325,ECFP4_326,ECFP4_327,ECFP4_328,ECFP4_329,ECFP4_330,ECFP4_331,ECFP4_332,ECFP4_333,ECFP4_334,ECFP4_335,ECFP4_336,ECFP4_337,ECFP4_338,ECFP4_339,ECFP4_340,ECFP4_341,ECFP4_342,ECFP4_343,ECFP4_344,ECFP4_345,ECFP4_346,ECFP4_347,ECFP4_348,ECFP4_349,ECFP4_350,ECFP4_351,ECFP4_352,ECFP4_353,ECFP4_354,ECFP4_355,ECFP4_356,ECFP4_357,ECFP4_358,ECFP4_359,ECFP4_360,ECFP4_361,ECFP4_362,ECFP4_363,ECFP4_364,ECFP4_365,ECFP4_366,ECFP4_367,ECFP4_368,ECFP4_369,ECFP4_370,ECFP4_371,ECFP4_372,ECFP4_373,ECFP4_374,ECFP4_375,ECFP4_376,ECFP4_377,ECFP4_378,ECFP4_379,ECFP4_380,ECFP4_381,ECFP4_382,ECFP4_383,ECFP4_384,ECFP4_385,ECFP4_386,ECFP4_387,ECFP4_388,ECFP4_389,ECFP4_390,ECFP4_391,ECFP4_392,ECFP4_393,ECFP4_394,ECFP4_395,ECFP4_396,ECFP4_397,ECFP4_398,ECFP4_399,ECFP4_400,ECFP4_401,ECFP4_402,ECFP4_403,ECFP4_404,ECFP4_405,ECFP4_406,ECFP4_407,ECFP4_408,ECFP4_409,ECFP4_410,ECFP4_411,ECFP4_412,ECFP4_413,ECFP4_414,ECFP4_415,ECFP4_416,ECFP4_417,ECFP4_418,ECFP4_419,ECFP4_420,ECFP4_421,ECFP4_422,ECFP4_423,ECFP4_424,ECFP4_425,ECFP4_426,ECFP4_427,ECFP4_428,ECFP4_429,ECFP4_430,ECFP4_431,ECFP4_432,ECFP4_433,ECFP4_434,ECFP4_435,ECFP4_436,ECFP4_437,ECFP4_438,ECFP4_439,ECFP4_440,ECFP4_441,ECFP4_442,ECFP4_443,ECFP4_444,ECFP4_445,ECFP4_446,ECFP4_447,ECFP4_448,ECFP4_449,ECFP4_450,ECFP4_451,ECFP4_452,ECFP4_453,ECFP4_454,ECFP4_455,ECFP4_456,ECFP4_457,ECFP4_458,ECFP4_459,ECFP4_460,ECFP4_461,ECFP4_462,ECFP4_463,ECFP4_464,ECFP4_465,ECFP4_466,ECFP4_467,ECFP4_468,ECFP4_469,ECFP4_470,ECFP4_471,ECFP4_472,ECFP4_473,ECFP4_474,ECFP4_475,ECFP4_476,ECFP4_477,ECFP4_478,ECFP4_479,ECFP4_480,ECFP4_481,ECFP4_482,ECFP4_483,ECFP4_484,ECFP4_485,ECFP4_486,ECFP4_487,ECFP4_488,ECFP4_489,ECFP4_490,ECFP4_491,ECFP4_492,ECFP4_493,ECFP4_494,ECFP4_495,ECFP4_496,ECFP4_497,ECFP4_498,ECFP4_499,ECFP4_500,ECFP4_501,ECFP4_502,ECFP4_503,ECFP4_504,ECFP4_505,ECFP4_506,ECFP4_507,ECFP4_508,ECFP4_509,ECFP4_510,ECFP4_511,ECFP4_512,pca_0,pca_1,pca_2,pca_3,pca_4,pca_5,pca_6,pca_7,pca_8,pca_9,pca_10,pca_11,pca_12,pca_13,pca_14,pca_15,pca_16,pca_17,pca_18,pca_19,pca_20,pca_21,pca_22,pca_23,pca_24,pca_25,pca_26,pca_27,pca_28,pca_29,pca_30,pca_31,pca_32,pca_33,pca_34,pca_35,pca_36,pca_37,pca_38,pca_39,pca_40,pca_41,pca_42,pca_43,pca_44,pca_45,pca_46,pca_47,pca_48,pca_49,pca_50,pca_51,pca_52,pca_53,pca_54,pca_55,pca_56,pca_57,pca_58,pca_59,pca_60,pca_61,pca_62,pca_63,Activity
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,11.901319,0.137827,-4.440769,-2.303982,5.95112,0.02069,1.03987,-1.45656,-0.091264,-0.90379,1.539176,-0.456045,-2.157402,-0.128602,0.247712,0.222864,0.047858,-0.012669,-0.241127,0.119103,-0.027785,-0.081928,0.972734,0.044087,-0.185951,0.392767,-0.557718,-0.184152,-0.247713,-0.076384,0.330611,-0.572002,-0.110822,-0.004289,-0.352498,-0.097663,0.187439,-0.533825,0.305859,0.13112,-0.49551,0.019136,0.379346,0.157979,0.253936,0.054228,-0.414509,-0.129695,0.291346,-0.221596,0.014415,0.092507,-0.310497,0.058637,0.128002,0.344395,-0.092279,0.063742,-0.244348,0.004872,0.08846,0.14404,0.107338,-0.010672,0
1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,1,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,1,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,1,1,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,1,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,35.123848,21.552345,8.326368,-16.103525,12.189694,-0.502858,-0.930966,-2.810736,4.158796,1.274666,-2.447943,-1.146399,-0.428574,-1.522284,-0.17972,-0.502181,0.686503,-0.499536,-0.987135,0.015067,0.234988,-0.932561,-0.044172,0.390815,-0.583491,0.207375,0.319875,-0.789718,0.181961,0.163525,0.388833,0.320521,0.149464,0.102339,0.235121,0.411945,-0.09871,-0.170372,-0.080277,0.093578,-0.332697,-0.341387,-0.036956,-0.534046,-0.09538,-0.217884,0.254418,0.061621,-0.26303,-0.287773,-0.096244,0.389921,0.25941,-0.096041,0.127104,0.146239,-0.096352,0.217282,-0.020972,0.191515,0.052849,-0.115789,-0.083292,0.053915,0
2,0,1,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,1,0,0,0,0,1,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,1,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,1,1,0,0,1,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,1,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,1,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,-13.604988,-4.547828,-6.757512,-0.605447,0.562819,-0.424089,-2.050209,0.375359,0.546383,-0.92878,-0.60156,0.041161,0.954839,0.057017,-0.076634,-0.245366,0.138476,0.388169,0.684716,0.2515,0.053033,-0.10902,-0.240786,0.001856,-0.493345,0.052208,-0.001903,-0.111213,-0.032079,0.082737,0.088589,0.020103,0.083638,0.063118,0.044766,-0.26313,0.050668,-0.01644,0.234661,-0.113008,-0.0241,0.039069,-0.0201,-0.384175,0.274372,0.129722,0.150643,0.271683,-0.191455,-0.026604,0.03123,0.042196,-0.115757,0.139354,-0.027834,-0.069195,-0.355866,-0.117907,0.125648,0.159373,-0.044221,0.186157,0.051054,-0.027499,0
3,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,6.346448,-1.347502,-5.182335,-0.64111,-1.269011,8.617794,2.053694,0.973009,-0.274762,-0.610885,0.088374,-0.212995,0.129832,0.121519,0.308648,0.051672,0.112547,0.036721,-0.221198,-0.372744,-0.170504,1.248227,0.009982,-0.182487,-0.397449,0.134227,0.386492,-0.501378,0.194421,0.175813,-0.305458,0.017968,0.130188,-0.07136,-0.259287,-0.091772,0.509661,0.186741,0.097508,0.080971,0.260713,0.254443,-0.019798,0.379957,-0.159857,0.327674,0.377874,0.034881,-0.073463,-0.024772,0.208265,-0.040244,0.032478,-0.108659,-0.001639,-0.027016,-0.124663,-0.299199,-0.124084,0.162663,-0.075197,-0.183758,-0.230197,0.16649,0
4,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,1,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,1,0,0,0,0,0,0,1,0,0,1,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,1,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,1,1,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,-3.288321,1.525151,-5.675885,-8.154809,-2.349339,-0.832282,0.077745,0.549485,-0.791112,0.326519,-1.041809,0.576592,0.44728,-0.497935,-0.197377,0.218716,-0.261239,-0.151923,0.081007,0.008075,0.274816,0.153122,0.227086,0.091392,0.234435,-0.100246,-0.332484,-0.005484,0.069106,-0.125468,-0.21932,-0.183024,-0.053025,-0.018175,-0.395375,0.066281,0.412718,0.031094,0.091517,-0.084378,-0.028094,0.074929,0.151782,-0.068698,-0.00054,-0.097804,0.161118,-0.024921,0.126029,-0.182819,0.012411,-0.035488,-0.057896,-0.178594,-0.173142,-0.011821,4.1e-05,0.03785,0.031097,-0.082569,-0.217732,-0.003232,-0.131287,-0.175186,0
5,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,1,1,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,1,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,5.143438,-1.685173,-5.052134,0.993202,-4.274637,2.957591,1.646269,-2.910197,0.113691,-0.612456,-0.757344,-0.655417,0.212439,-0.204333,-0.225868,0.401006,0.302253,0.409401,-0.652684,0.010502,0.497612,-0.199613,0.412294,-0.389625,0.162848,-0.085348,-0.181396,0.046018,0.060045,0.078338,0.187209,-0.108971,-0.078258,-0.435566,0.302018,-0.185886,0.263863,-0.05057,-0.042118,-0.591152,0.143984,-0.091273,-0.017517,0.216087,-0.080266,-0.151924,0.029174,0.060445,0.117174,0.037348,-0.261222,-0.06705,0.097431,0.029634,0.186692,-0.059184,0.114358,0.114099,-0.098122,0.054426,-0.178019,0.060755,0.099719,0.112055,0
6,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,1,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,3.420429,-2.605902,-2.663652,5.213378,1.75182,10.414148,-0.947383,-0.138187,0.470943,-1.009834,0.865182,-0.243266,-0.541311,-0.975099,-0.373232,-0.481736,0.699132,0.682152,0.51047,-0.600473,0.409066,0.415748,0.242636,-0.376788,0.056887,-0.122039,-0.109951,-0.035672,-0.209241,-0.118539,-0.451312,0.377405,0.005971,0.4172,-0.272161,-0.226298,0.237303,-0.182653,-0.494097,-0.129103,-0.220872,0.185632,-0.150899,-0.069222,0.152688,0.227641,-0.070709,-0.0662,-0.201589,-0.228943,0.090332,-0.035177,-0.201065,0.028515,-0.281152,-0.000506,0.059541,0.024493,0.093451,-0.137401,-0.354523,0.160384,0.125823,0.203885,0
7,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,1,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,-12.074063,-19.244139,15.966215,1.552936,2.430849,-1.479302,-2.580765,-0.8694,-0.880242,1.992702,-3.208631,-0.272389,-0.39409,-0.493837,1.099212,1.27255,-0.837854,-0.142678,0.391356,-0.871508,-0.596248,-0.589404,0.026399,-0.358893,-0.030805,-0.110807,0.317087,-0.030205,-0.424876,0.175907,-0.008915,0.270481,0.296331,0.19107,-0.328979,0.429721,0.356007,-0.435674,-0.286079,0.048925,0.110571,-0.298971,0.226076,0.020447,0.088923,-0.12052,0.132227,0.202616,0.119771,-0.405652,-0.099589,-0.229051,-0.250319,-0.058672,-0.208673,0.074361,0.226883,-0.145691,-0.066706,-0.157808,0.165128,-0.070568,0.067994,-0.024566,1
8,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,1,0,0,0,1,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,1,0,1,0,1,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,-18.824343,7.300288,1.56868,8.489171,-2.301176,-0.663879,0.553846,-1.073269,1.139462,-0.144241,-0.181974,-0.374884,0.20608,0.679143,0.281033,0.017418,-0.039458,-0.268324,-0.392473,-0.063548,-0.062858,0.25976,-0.097588,0.006421,-0.106823,-0.243264,0.384387,-0.181023,0.197804,0.069301,-0.183775,-0.029935,0.16637,-0.187105,0.130783,0.030762,-0.356215,0.130443,0.107814,-0.145924,0.024984,0.070763,-0.070342,-0.017636,0.094765,-0.147,-0.084744,-0.065531,-0.096231,-0.033839,0.114188,-0.011301,0.002563,-0.18235,-0.109505,-0.009277,0.023625,0.186918,-0.026002,0.014486,0.212605,-0.122834,0.118559,0.08965,0
9,1,1,1,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,-3.014035,-5.902528,-7.994674,0.603936,-2.76682,-3.130877,-0.17787,-2.142795,0.498921,0.016303,0.113204,-0.189486,-0.085036,0.168993,0.000184,0.577317,0.155549,0.221033,0.131059,0.22296,0.092432,0.160977,0.277692,0.089319,-0.049266,-0.025547,-0.010818,0.086399,-0.100417,0.095477,-0.119083,-0.084571,-0.096087,-0.116525,0.068228,0.28886,-0.192339,0.029426,0.094685,-0.21676,-0.229226,-0.189719,0.065834,0.01099,0.031185,0.055869,-0.033316,-0.045365,0.155304,0.067351,0.121697,0.074023,0.019039,0.041881,0.058868,0.105833,0.069157,0.098704,-0.023071,0.169958,0.107762,-0.00851,-0.142159,0.060089,0


# Loss function with weighted classes

In [19]:
def get_loss_func(df):
    TARGET = 'Activity'
    class_count_df = df.groupby(TARGET).count()
    n_0, n_1 = class_count_df.iloc[0, 0], class_count_df.iloc[1, 0]
    w_0 = (n_0 + n_1) / (2.0 * n_0)
    w_1 = (n_0 + n_1) / (2.0 * n_1)
    print(w_0)
    print(w_1)
    class_weights=torch.FloatTensor([w_0, w_1]).cuda()
    loss_func = CrossEntropyLossFlat(weight=class_weights)
    return loss_func

In [20]:
loss_func = get_loss_func(df)

0.55
5.5


# Train tabular DNN model

In [31]:
def train_model(dls, dataset, loss_func=loss_func, epochs=11, wd=0.0002, layers=[100,50]):
    
    print(f'Training model on dataset: {dataset}')
    print(f'Trained epochs: epochs={epochs}')
    
    learn = tabular_learner(dls, 
                            layers=layers,
                            wd=wd,
                            metrics=[accuracy, 
                            F1Score(), 
                            Precision(), 
                            Recall(), 
                            RocAucBinary(), 
                            MatthewsCorrCoef()])
    
    
    #print(f'Finding learning rate...')
    #lr_min, lr_steep = learn.lr_find(suggestions=True, show_plot=False)
    #print(f'Training model with learning rate: {lr_min}')
    learn.fit_one_cycle(epochs, 0.0003)
    
    
    return learn

In [32]:
train_model(dls, dataset, epochs=10)

Training model on dataset: CHEMBL205
Trained epochs: epochs=10
Finding learning rate...


Training model with learning rate: 0.006918309628963471


epoch,train_loss,valid_loss,accuracy,f1_score,precision_score,recall_score,roc_auc_score,matthews_corrcoef,time
0,0.137713,0.095587,0.968515,0.821485,0.846906,0.797546,0.979104,0.804673,01:35
1,0.106301,0.184123,0.94929,0.662963,0.836449,0.54908,0.980241,0.653343,01:35
2,0.063433,0.153224,0.961549,0.770764,0.84058,0.711656,0.981126,0.753034,01:36
3,0.026722,0.307125,0.939816,0.555556,0.84375,0.41411,0.980612,0.565952,01:34
4,0.035291,00:26,,,,,,,


KeyboardInterrupt: 

# Test parameters

In [23]:
from sklearn.model_selection import ParameterGrid

In [24]:
param_grid = {
    'layers': [[200,100], [300,150], [400, 200], [500,250], [600,300], [700, 350], [1000, 500]]
}
param_grid= ParameterGrid(param_grid)

In [25]:
def train_with_parameters ():
    datasets = ['CHEMBL205_cl', 'CHEMBL301_cl', 'CHEMBL218_cl', 
                'CHEMBL240_cl', 'CHEMBL219_cl', 
                'CHEMBL244_cl', 'CHEMBL1978_cl']
    i = 0
    
    
    df = pd.read_csv(path/f'{datasets[i]}_ecfp_512.csv')
        
    x_train, x_valid = train_test_split(df.index, test_size=0.2, random_state=42, stratify=df['Activity'])
    splits = (list(x_train), list(x_valid))
    procs = [Categorify]
        
    dep_var = ['Activity']
    X = df.drop(["CID", "SMILES", "Activity"], axis=1)
    cat_vars = X.columns
    cat_names = list(cat_vars)
    
    to = TabularPandas(df, 
                        procs,
                        cat_names=cat_names, 
                        y_names=dep_var, 
                        splits=splits, 
                        y_block = CategoryBlock())
    dls = to.dataloaders()
    
    for setting in param_grid:
        
        print(f"Training with layers: {setting['layers']}")
        learn = train_model(dls, datasets[i], layers=setting['layers'])
        

In [None]:
train_with_parameters()