# Drug Discovery, FAST-AI Tabular Model test


## DATASETS:
(a) Carbonic Anhydrase II (CHEMBL205), a protein lyase,  
(b) Cyclin-dependent kinase 2 (CHEMBL301), a protein kinase,  
(c) ether-a-go-go-related gene potassium channel 1 (HERG) (CHEMBL240), a voltage-gated ion channel,  
(d) Dopamine D4 receptor (CHEMBL219), a monoamine GPCR,  
(e) Coagulation factor X (CHEMBL244), a serine protease,  
(f) Cannabinoid CB1 receptor (CHEMBL218), a lipid-like GPCR and  
(g) Cytochrome P450 19A1 (CHEMBL1978), a cytochrome P450.  
The activity classes were selected based on data availability and as representatives of therapeutically important target classes or as anti-targets.

In [1]:
# Shell out to nvidia-smi to report the GPU, driver and CUDA version visible to this kernel.
!nvidia-smi

Wed Apr  6 15:46:15 2022       
+-----------------------------------------------------------------------------+
| NVIDIA-SMI 470.103.01   Driver Version: 470.103.01   CUDA Version: 11.4     |
|-------------------------------+----------------------+----------------------+
| GPU  Name        Persistence-M| Bus-Id        Disp.A | Volatile Uncorr. ECC |
| Fan  Temp  Perf  Pwr:Usage/Cap|         Memory-Usage | GPU-Util  Compute M. |
|                               |                      |               MIG M. |
|   0  NVIDIA GeForce ...  Off  | 00000000:01:00.0  On |                  N/A |
| 29%   60C    P0    69W / 240W |    649MiB /  8116MiB |      0%      Default |
|                               |                      |                  N/A |
+-------------------------------+----------------------+----------------------+
                                                                               
+---------------------------------------------------------------------------

In [2]:
# Import
import pandas as pd
import numpy as np
from pathlib import Path

In [3]:
# Optional environment setup, kept commented out: downloads Miniconda, installs it
# into /usr/local, then installs RDKit from conda-forge. Uncomment only on a machine
# where RDKit is not already available.
#%%capture
#!wget -c https://repo.continuum.io/miniconda/Miniconda3-latest-Linux-x86_64.sh
#!chmod +x Miniconda3-latest-Linux-x86_64.sh
#!time bash ./Miniconda3-latest-Linux-x86_64.sh -b -f -p /usr/local
#!time conda install -q -y -c conda-forge rdkit

In [4]:
from rdkit import Chem
from rdkit.Chem import AllChem

[15:46:15] Enabling RDKit 2019.09.3 jupyter extensions


In [5]:
# Top MCC score recorded for each ChEMBL target, keyed by target ID.
# NOTE(review): presumably reference values from the source publication - confirm provenance.
top_mcc_scores = dict(
    CHEMBL205=0.862,
    CHEMBL301=0.926,
    CHEMBL240=0.884,
    CHEMBL219=0.887,
    CHEMBL244=0.983,
    CHEMBL218=0.941,
    CHEMBL1978=0.904,
)

In [6]:
# Root folder of the dataset, relative to the notebook's working directory.
path = Path('../dataset/13321_2017_226_MOESM1_ESM/')

In [7]:
# List every entry directly under the dataset root (iteration order is whatever the OS returns).
list(path.iterdir())

[PosixPath('../dataset/13321_2017_226_MOESM1_ESM/CHEMBL205'),
 PosixPath('../dataset/13321_2017_226_MOESM1_ESM/.ipynb_checkpoints'),
 PosixPath('../dataset/13321_2017_226_MOESM1_ESM/CHEMBL301'),
 PosixPath('../dataset/13321_2017_226_MOESM1_ESM/CHEMBL218'),
 PosixPath('../dataset/13321_2017_226_MOESM1_ESM/CHEMBL219'),
 PosixPath('../dataset/13321_2017_226_MOESM1_ESM/CHEMBL244'),
 PosixPath('../dataset/13321_2017_226_MOESM1_ESM/mol_images'),
 PosixPath('../dataset/13321_2017_226_MOESM1_ESM/CHEMBL1978'),
 PosixPath('../dataset/13321_2017_226_MOESM1_ESM/CHEMBL240')]

In [8]:
# Target used for the rest of the notebook; passed to get_df() to select the folder and CSV.
dataset='CHEMBL205'

# TabularPandas

In [9]:
from sklearn.model_selection import train_test_split
from sklearn.metrics import auc,roc_auc_score,recall_score,precision_score,f1_score
from  sklearn.metrics import matthews_corrcoef
from sklearn.metrics import accuracy_score
from sklearn.model_selection import ParameterGrid

In [10]:
from fastai.tabular.all import *

In [11]:
def get_df(dataset, oversample=False, test_size=0.2, random_state=666, oversample_factor=10):
    """Load one target's table, flag a stratified validation split and optionally oversample.

    Reads ``<path>/<dataset>/<dataset>_cl-data-with-pca-activations.csv``, where ``path``
    is the notebook-level dataset root, and overwrites the ``is_valid`` column with a
    fresh stratified train/validation split.

    Args:
        dataset: Target identifier, used both as folder name and as file prefix
            (e.g. ``'CHEMBL205'``).
        oversample: When True, training rows with ``Activity == 1`` are repeated
            ``oversample_factor`` times. Validation rows are never duplicated.
        test_size: Fraction of rows assigned to the validation split.
        random_state: Seed forwarded to ``train_test_split``.
        oversample_factor: Number of copies of each active training row when
            ``oversample`` is True.

    Returns:
        Tuple ``(df, dep_var, cat_vars, cat_names)``:
        ``df`` is the frame with ``is_valid`` set; ``dep_var`` is ``['Activity']``;
        ``cat_vars`` is the pandas Index of feature columns; ``cat_names`` is the
        same labels as a plain list.

    Raises:
        ValueError: If ``oversample`` is True and ``oversample_factor`` is below 1.
        KeyError: If any of the CID / SMILES / Activity / Image / is_valid columns
            is missing from the CSV.
    """
    if oversample and oversample_factor < 1:
        raise ValueError("oversample_factor must be >= 1")

    # `path` is the dataset root defined at notebook level.
    df = pd.read_csv(path/f'{dataset}/{dataset}_cl-data-with-pca-activations.csv')

    dep_var = ['Activity']
    # Every column that is not an identifier, the label or bookkeeping is a feature.
    # Index.drop raises KeyError on a missing label just like DataFrame.drop, but
    # avoids copying the whole (very wide) frame only to read its column labels.
    # NOTE(review): this also returns the float-valued pca_* columns as categorical
    # names - confirm that is intended rather than passing them as continuous.
    cat_vars = df.columns.drop(["CID", "SMILES", "Activity", 'Image', 'is_valid'])
    cat_names = list(cat_vars)

    # Stratify on the label so both splits keep the same active/inactive ratio.
    _, valid_rows = train_test_split(
        df.index,
        test_size=test_size,
        random_state=random_state,
        stratify=df['Activity'],
    )
    # Train and validation rows together cover the whole index, so a single
    # membership mask sets every row and guarantees a boolean column.
    df['is_valid'] = df.index.isin(valid_rows)

    if oversample:
        in_train = ~df['is_valid']
        actives = df.loc[in_train & (df['Activity'] == 1)]
        inactives = df.loc[in_train & (df['Activity'] == 0)]
        held_out = df.loc[df['is_valid']]
        # Order is preserved: repeated actives, then inactives, then validation rows.
        df = pd.concat(
            [*[actives] * oversample_factor, inactives, held_out],
            ignore_index=True,
        )
    return df, dep_var, cat_vars, cat_names

In [12]:
# Load the selected target's table plus the label name and the feature-column names.
df, dep_var, cat_vars, cat_names = get_df(dataset)

In [13]:
# Summarise row count, column count, dtypes and memory footprint.
df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 17941 entries, 0 to 17940
Columns: 1157 entries, CID to pca_127
dtypes: bool(1), float64(128), int64(1025), object(3)
memory usage: 158.2+ MB


In [14]:
# Preview the first rows of the loaded frame.
df.head()

Unnamed: 0,CID,SMILES,ECFP4_1,ECFP4_2,ECFP4_3,ECFP4_4,ECFP4_5,ECFP4_6,ECFP4_7,ECFP4_8,...,pca_118,pca_119,pca_120,pca_121,pca_122,pca_123,pca_124,pca_125,pca_126,pca_127
0,CHEMBL188002,S(=O)(=O)(N)c1cc(N/C(/S)=N\c2cc(C(=O)[O-])c(cc2)C=2c3c(OC4=CC(=O)C=CC=24)cc(O)cc3)ccc1,0,0,0,0,0,0,0,0,...,0.098678,0.060415,-0.061614,-0.131339,0.031808,0.049131,0.018394,-0.004024,-0.189193,0.033769
1,CHEMBL364127,Clc1ccc(cc1)C(=O)NC1Cc2cc(S(=O)(=O)N)ccc2C1,0,0,0,0,0,0,0,0,...,0.006445,0.07649,-0.005898,0.047445,-0.09457,-0.036108,-0.108462,0.026409,-0.061849,-0.083877
2,CHEMBL1683469,S(=O)(=O)(N)c1ccc(cc1)CNS(=O)(=O)CC12CCC(CC1=O)C2(C)C,0,0,0,0,0,0,0,0,...,0.075003,0.126251,0.045264,0.073885,-0.044814,0.0766,-0.085974,0.083727,0.023021,0.14059
3,CHEMBL52564,Oc1ccccc1\C=C\C(=O)[O-],0,0,0,0,0,0,0,0,...,-0.119512,-0.243272,-0.035284,-0.169405,-0.165121,0.077793,0.002286,0.092607,-0.000398,0.042947
4,CHEMBL21427,OB(O)c1ccc(OC)cc1,0,0,0,0,0,0,0,0,...,-0.010942,-0.019184,-0.065507,0.023736,-0.205628,0.044264,-0.167439,0.029012,0.01732,-0.095512


In [15]:
# Positional row indices of the training and validation subsets, read from `is_valid`.
train_idx = np.flatnonzero(df.is_valid == False)
valid_idx = np.flatnonzero(df.is_valid == True)
valid_idx

array([    5,    11,    13, ..., 17931, 17934, 17937])

In [16]:
def get_dls(df, dep_var, cat_vars, cat_names, bs=2, cont_names=None):
    """Build fastai tabular DataLoaders from a frame carrying an ``is_valid`` column.

    Args:
        df: Frame with the feature columns, the label column(s) and a boolean
            ``is_valid`` column marking validation rows.
        dep_var: Name(s) of the target column(s), forwarded as ``y_names``.
        cat_vars: Unused; kept so existing callers keep working.
        cat_names: Columns to treat as categorical.
        bs: Batch size for the DataLoaders. Defaults to 2, the value that was
            previously hard-coded.
        cont_names: Optional columns to treat as continuous. With the default
            ``None`` no continuous columns are declared, as before. Callers should
            not list the same column in both ``cat_names`` and ``cont_names``.

    Returns:
        The DataLoaders produced by ``TabularPandas.dataloaders``.

    Side effects:
        Displays three rows of the processed table via ``to.show(3)``.
    """
    # Positional indices of each split; rows are selected by the `is_valid` flag.
    train_idx = np.where(df.is_valid == False)[0]
    valid_idx = np.where(df.is_valid == True)[0]
    splits = (list(train_idx), list(valid_idx))

    procs = [Categorify, Normalize]
    to = TabularPandas(
        df,
        procs,
        cat_names=cat_names,
        cont_names=cont_names,
        y_names=dep_var,
        splits=splits,
        y_block=CategoryBlock(),
        reduce_memory=True,
    )
    # Visual sanity check of the processed rows.
    to.show(3)
    return to.dataloaders(bs=bs)

In [17]:
# Build the DataLoaders; get_dls also displays three processed rows as a side effect.
dls = get_dls(df, dep_var, cat_vars, cat_names)

Unnamed: 0,ECFP4_1,ECFP4_2,ECFP4_3,ECFP4_4,ECFP4_5,ECFP4_6,ECFP4_7,ECFP4_8,ECFP4_9,ECFP4_10,ECFP4_11,ECFP4_12,ECFP4_13,ECFP4_14,ECFP4_15,ECFP4_16,ECFP4_17,ECFP4_18,ECFP4_19,ECFP4_20,ECFP4_21,ECFP4_22,ECFP4_23,ECFP4_24,ECFP4_25,ECFP4_26,ECFP4_27,ECFP4_28,ECFP4_29,ECFP4_30,ECFP4_31,ECFP4_32,ECFP4_33,ECFP4_34,ECFP4_35,ECFP4_36,ECFP4_37,ECFP4_38,ECFP4_39,ECFP4_40,ECFP4_41,ECFP4_42,ECFP4_43,ECFP4_44,ECFP4_45,ECFP4_46,ECFP4_47,ECFP4_48,ECFP4_49,ECFP4_50,ECFP4_51,ECFP4_52,ECFP4_53,ECFP4_54,ECFP4_55,ECFP4_56,ECFP4_57,ECFP4_58,ECFP4_59,ECFP4_60,ECFP4_61,ECFP4_62,ECFP4_63,ECFP4_64,ECFP4_65,ECFP4_66,ECFP4_67,ECFP4_68,ECFP4_69,ECFP4_70,ECFP4_71,ECFP4_72,ECFP4_73,ECFP4_74,ECFP4_75,ECFP4_76,ECFP4_77,ECFP4_78,ECFP4_79,ECFP4_80,ECFP4_81,ECFP4_82,ECFP4_83,ECFP4_84,ECFP4_85,ECFP4_86,ECFP4_87,ECFP4_88,ECFP4_89,ECFP4_90,ECFP4_91,ECFP4_92,ECFP4_93,ECFP4_94,ECFP4_95,ECFP4_96,ECFP4_97,ECFP4_98,ECFP4_99,ECFP4_100,ECFP4_101,ECFP4_102,ECFP4_103,ECFP4_104,ECFP4_105,ECFP4_106,ECFP4_107,ECFP4_108,ECFP4_109,ECFP4_110,ECFP4_111,ECFP4_112,ECFP4_113,ECFP4_114,ECFP4_115,ECFP4_116,ECFP4_117,ECFP4_118,ECFP4_119,ECFP4_120,ECFP4_121,ECFP4_122,ECFP4_123,ECFP4_124,ECFP4_125,ECFP4_126,ECFP4_127,ECFP4_128,ECFP4_129,ECFP4_130,ECFP4_131,ECFP4_132,ECFP4_133,ECFP4_134,ECFP4_135,ECFP4_136,ECFP4_137,ECFP4_138,ECFP4_139,ECFP4_140,ECFP4_141,ECFP4_142,ECFP4_143,ECFP4_144,ECFP4_145,ECFP4_146,ECFP4_147,ECFP4_148,ECFP4_149,ECFP4_150,ECFP4_151,ECFP4_152,ECFP4_153,ECFP4_154,ECFP4_155,ECFP4_156,ECFP4_157,ECFP4_158,ECFP4_159,ECFP4_160,ECFP4_161,ECFP4_162,ECFP4_163,ECFP4_164,ECFP4_165,ECFP4_166,ECFP4_167,ECFP4_168,ECFP4_169,ECFP4_170,ECFP4_171,ECFP4_172,ECFP4_173,ECFP4_174,ECFP4_175,ECFP4_176,ECFP4_177,ECFP4_178,ECFP4_179,ECFP4_180,ECFP4_181,ECFP4_182,ECFP4_183,ECFP4_184,ECFP4_185,ECFP4_186,ECFP4_187,ECFP4_188,ECFP4_189,ECFP4_190,ECFP4_191,ECFP4_192,ECFP4_193,ECFP4_194,ECFP4_195,ECFP4_196,ECFP4_197,ECFP4_198,ECFP4_199,ECFP4_200,ECFP4_201,ECFP4_202,ECFP4_203,ECFP4_204,ECFP4_205,ECFP4_206,ECFP4_207,ECFP4_208,ECFP4_209,ECFP4_2
10,ECFP4_211,ECFP4_212,ECFP4_213,ECFP4_214,ECFP4_215,ECFP4_216,ECFP4_217,ECFP4_218,ECFP4_219,ECFP4_220,ECFP4_221,ECFP4_222,ECFP4_223,ECFP4_224,ECFP4_225,ECFP4_226,ECFP4_227,ECFP4_228,ECFP4_229,ECFP4_230,ECFP4_231,ECFP4_232,ECFP4_233,ECFP4_234,ECFP4_235,ECFP4_236,ECFP4_237,ECFP4_238,ECFP4_239,ECFP4_240,ECFP4_241,ECFP4_242,ECFP4_243,ECFP4_244,ECFP4_245,ECFP4_246,ECFP4_247,ECFP4_248,ECFP4_249,ECFP4_250,ECFP4_251,ECFP4_252,ECFP4_253,ECFP4_254,ECFP4_255,ECFP4_256,ECFP4_257,ECFP4_258,ECFP4_259,ECFP4_260,ECFP4_261,ECFP4_262,ECFP4_263,ECFP4_264,ECFP4_265,ECFP4_266,ECFP4_267,ECFP4_268,ECFP4_269,ECFP4_270,ECFP4_271,ECFP4_272,ECFP4_273,ECFP4_274,ECFP4_275,ECFP4_276,ECFP4_277,ECFP4_278,ECFP4_279,ECFP4_280,ECFP4_281,ECFP4_282,ECFP4_283,ECFP4_284,ECFP4_285,ECFP4_286,ECFP4_287,ECFP4_288,ECFP4_289,ECFP4_290,ECFP4_291,ECFP4_292,ECFP4_293,ECFP4_294,ECFP4_295,ECFP4_296,ECFP4_297,ECFP4_298,ECFP4_299,ECFP4_300,ECFP4_301,ECFP4_302,ECFP4_303,ECFP4_304,ECFP4_305,ECFP4_306,ECFP4_307,ECFP4_308,ECFP4_309,ECFP4_310,ECFP4_311,ECFP4_312,ECFP4_313,ECFP4_314,ECFP4_315,ECFP4_316,ECFP4_317,ECFP4_318,ECFP4_319,ECFP4_320,ECFP4_321,ECFP4_322,ECFP4_323,ECFP4_324,ECFP4_325,ECFP4_326,ECFP4_327,ECFP4_328,ECFP4_329,ECFP4_330,ECFP4_331,ECFP4_332,ECFP4_333,ECFP4_334,ECFP4_335,ECFP4_336,ECFP4_337,ECFP4_338,ECFP4_339,ECFP4_340,ECFP4_341,ECFP4_342,ECFP4_343,ECFP4_344,ECFP4_345,ECFP4_346,ECFP4_347,ECFP4_348,ECFP4_349,ECFP4_350,ECFP4_351,ECFP4_352,ECFP4_353,ECFP4_354,ECFP4_355,ECFP4_356,ECFP4_357,ECFP4_358,ECFP4_359,ECFP4_360,ECFP4_361,ECFP4_362,ECFP4_363,ECFP4_364,ECFP4_365,ECFP4_366,ECFP4_367,ECFP4_368,ECFP4_369,ECFP4_370,ECFP4_371,ECFP4_372,ECFP4_373,ECFP4_374,ECFP4_375,ECFP4_376,ECFP4_377,ECFP4_378,ECFP4_379,ECFP4_380,ECFP4_381,ECFP4_382,ECFP4_383,ECFP4_384,ECFP4_385,ECFP4_386,ECFP4_387,ECFP4_388,ECFP4_389,ECFP4_390,ECFP4_391,ECFP4_392,ECFP4_393,ECFP4_394,ECFP4_395,ECFP4_396,ECFP4_397,ECFP4_398,ECFP4_399,ECFP4_400,ECFP4_401,ECFP4_402,ECFP4_403,ECFP4_404,ECFP4_405,ECFP4_406,ECFP4_407,ECFP4_408,ECFP4_409,ECFP4_4
10,ECFP4_411,ECFP4_412,ECFP4_413,ECFP4_414,ECFP4_415,ECFP4_416,ECFP4_417,ECFP4_418,ECFP4_419,ECFP4_420,ECFP4_421,ECFP4_422,ECFP4_423,ECFP4_424,ECFP4_425,ECFP4_426,ECFP4_427,ECFP4_428,ECFP4_429,ECFP4_430,ECFP4_431,ECFP4_432,ECFP4_433,ECFP4_434,ECFP4_435,ECFP4_436,ECFP4_437,ECFP4_438,ECFP4_439,ECFP4_440,ECFP4_441,ECFP4_442,ECFP4_443,ECFP4_444,ECFP4_445,ECFP4_446,ECFP4_447,ECFP4_448,ECFP4_449,ECFP4_450,ECFP4_451,ECFP4_452,ECFP4_453,ECFP4_454,ECFP4_455,ECFP4_456,ECFP4_457,ECFP4_458,ECFP4_459,ECFP4_460,ECFP4_461,ECFP4_462,ECFP4_463,ECFP4_464,ECFP4_465,ECFP4_466,ECFP4_467,ECFP4_468,ECFP4_469,ECFP4_470,ECFP4_471,ECFP4_472,ECFP4_473,ECFP4_474,ECFP4_475,ECFP4_476,ECFP4_477,ECFP4_478,ECFP4_479,ECFP4_480,ECFP4_481,ECFP4_482,ECFP4_483,ECFP4_484,ECFP4_485,ECFP4_486,ECFP4_487,ECFP4_488,ECFP4_489,ECFP4_490,ECFP4_491,ECFP4_492,ECFP4_493,ECFP4_494,ECFP4_495,ECFP4_496,ECFP4_497,ECFP4_498,ECFP4_499,ECFP4_500,ECFP4_501,ECFP4_502,ECFP4_503,ECFP4_504,ECFP4_505,ECFP4_506,ECFP4_507,ECFP4_508,ECFP4_509,ECFP4_510,ECFP4_511,ECFP4_512,ECFP4_513,ECFP4_514,ECFP4_515,ECFP4_516,ECFP4_517,ECFP4_518,ECFP4_519,ECFP4_520,ECFP4_521,ECFP4_522,ECFP4_523,ECFP4_524,ECFP4_525,ECFP4_526,ECFP4_527,ECFP4_528,ECFP4_529,ECFP4_530,ECFP4_531,ECFP4_532,ECFP4_533,ECFP4_534,ECFP4_535,ECFP4_536,ECFP4_537,ECFP4_538,ECFP4_539,ECFP4_540,ECFP4_541,ECFP4_542,ECFP4_543,ECFP4_544,ECFP4_545,ECFP4_546,ECFP4_547,ECFP4_548,ECFP4_549,ECFP4_550,ECFP4_551,ECFP4_552,ECFP4_553,ECFP4_554,ECFP4_555,ECFP4_556,ECFP4_557,ECFP4_558,ECFP4_559,ECFP4_560,ECFP4_561,ECFP4_562,ECFP4_563,ECFP4_564,ECFP4_565,ECFP4_566,ECFP4_567,ECFP4_568,ECFP4_569,ECFP4_570,ECFP4_571,ECFP4_572,ECFP4_573,ECFP4_574,ECFP4_575,ECFP4_576,ECFP4_577,ECFP4_578,ECFP4_579,ECFP4_580,ECFP4_581,ECFP4_582,ECFP4_583,ECFP4_584,ECFP4_585,ECFP4_586,ECFP4_587,ECFP4_588,ECFP4_589,ECFP4_590,ECFP4_591,ECFP4_592,ECFP4_593,ECFP4_594,ECFP4_595,ECFP4_596,ECFP4_597,ECFP4_598,ECFP4_599,ECFP4_600,ECFP4_601,ECFP4_602,ECFP4_603,ECFP4_604,ECFP4_605,ECFP4_606,ECFP4_607,ECFP4_608,ECFP4_609,ECFP4_6
10,ECFP4_611,ECFP4_612,ECFP4_613,ECFP4_614,ECFP4_615,ECFP4_616,ECFP4_617,ECFP4_618,ECFP4_619,ECFP4_620,ECFP4_621,ECFP4_622,ECFP4_623,ECFP4_624,ECFP4_625,ECFP4_626,ECFP4_627,ECFP4_628,ECFP4_629,ECFP4_630,ECFP4_631,ECFP4_632,ECFP4_633,ECFP4_634,ECFP4_635,ECFP4_636,ECFP4_637,ECFP4_638,ECFP4_639,ECFP4_640,ECFP4_641,ECFP4_642,ECFP4_643,ECFP4_644,ECFP4_645,ECFP4_646,ECFP4_647,ECFP4_648,ECFP4_649,ECFP4_650,ECFP4_651,ECFP4_652,ECFP4_653,ECFP4_654,ECFP4_655,ECFP4_656,ECFP4_657,ECFP4_658,ECFP4_659,ECFP4_660,ECFP4_661,ECFP4_662,ECFP4_663,ECFP4_664,ECFP4_665,ECFP4_666,ECFP4_667,ECFP4_668,ECFP4_669,ECFP4_670,ECFP4_671,ECFP4_672,ECFP4_673,ECFP4_674,ECFP4_675,ECFP4_676,ECFP4_677,ECFP4_678,ECFP4_679,ECFP4_680,ECFP4_681,ECFP4_682,ECFP4_683,ECFP4_684,ECFP4_685,ECFP4_686,ECFP4_687,ECFP4_688,ECFP4_689,ECFP4_690,ECFP4_691,ECFP4_692,ECFP4_693,ECFP4_694,ECFP4_695,ECFP4_696,ECFP4_697,ECFP4_698,ECFP4_699,ECFP4_700,ECFP4_701,ECFP4_702,ECFP4_703,ECFP4_704,ECFP4_705,ECFP4_706,ECFP4_707,ECFP4_708,ECFP4_709,ECFP4_710,ECFP4_711,ECFP4_712,ECFP4_713,ECFP4_714,ECFP4_715,ECFP4_716,ECFP4_717,ECFP4_718,ECFP4_719,ECFP4_720,ECFP4_721,ECFP4_722,ECFP4_723,ECFP4_724,ECFP4_725,ECFP4_726,ECFP4_727,ECFP4_728,ECFP4_729,ECFP4_730,ECFP4_731,ECFP4_732,ECFP4_733,ECFP4_734,ECFP4_735,ECFP4_736,ECFP4_737,ECFP4_738,ECFP4_739,ECFP4_740,ECFP4_741,ECFP4_742,ECFP4_743,ECFP4_744,ECFP4_745,ECFP4_746,ECFP4_747,ECFP4_748,ECFP4_749,ECFP4_750,ECFP4_751,ECFP4_752,ECFP4_753,ECFP4_754,ECFP4_755,ECFP4_756,ECFP4_757,ECFP4_758,ECFP4_759,ECFP4_760,ECFP4_761,ECFP4_762,ECFP4_763,ECFP4_764,ECFP4_765,ECFP4_766,ECFP4_767,ECFP4_768,ECFP4_769,ECFP4_770,ECFP4_771,ECFP4_772,ECFP4_773,ECFP4_774,ECFP4_775,ECFP4_776,ECFP4_777,ECFP4_778,ECFP4_779,ECFP4_780,ECFP4_781,ECFP4_782,ECFP4_783,ECFP4_784,ECFP4_785,ECFP4_786,ECFP4_787,ECFP4_788,ECFP4_789,ECFP4_790,ECFP4_791,ECFP4_792,ECFP4_793,ECFP4_794,ECFP4_795,ECFP4_796,ECFP4_797,ECFP4_798,ECFP4_799,ECFP4_800,ECFP4_801,ECFP4_802,ECFP4_803,ECFP4_804,ECFP4_805,ECFP4_806,ECFP4_807,ECFP4_808,ECFP4_809,ECFP4_8
10,ECFP4_811,ECFP4_812,ECFP4_813,ECFP4_814,ECFP4_815,ECFP4_816,ECFP4_817,ECFP4_818,ECFP4_819,ECFP4_820,ECFP4_821,ECFP4_822,ECFP4_823,ECFP4_824,ECFP4_825,ECFP4_826,ECFP4_827,ECFP4_828,ECFP4_829,ECFP4_830,ECFP4_831,ECFP4_832,ECFP4_833,ECFP4_834,ECFP4_835,ECFP4_836,ECFP4_837,ECFP4_838,ECFP4_839,ECFP4_840,ECFP4_841,ECFP4_842,ECFP4_843,ECFP4_844,ECFP4_845,ECFP4_846,ECFP4_847,ECFP4_848,ECFP4_849,ECFP4_850,ECFP4_851,ECFP4_852,ECFP4_853,ECFP4_854,ECFP4_855,ECFP4_856,ECFP4_857,ECFP4_858,ECFP4_859,ECFP4_860,ECFP4_861,ECFP4_862,ECFP4_863,ECFP4_864,ECFP4_865,ECFP4_866,ECFP4_867,ECFP4_868,ECFP4_869,ECFP4_870,ECFP4_871,ECFP4_872,ECFP4_873,ECFP4_874,ECFP4_875,ECFP4_876,ECFP4_877,ECFP4_878,ECFP4_879,ECFP4_880,ECFP4_881,ECFP4_882,ECFP4_883,ECFP4_884,ECFP4_885,ECFP4_886,ECFP4_887,ECFP4_888,ECFP4_889,ECFP4_890,ECFP4_891,ECFP4_892,ECFP4_893,ECFP4_894,ECFP4_895,ECFP4_896,ECFP4_897,ECFP4_898,ECFP4_899,ECFP4_900,ECFP4_901,ECFP4_902,ECFP4_903,ECFP4_904,ECFP4_905,ECFP4_906,ECFP4_907,ECFP4_908,ECFP4_909,ECFP4_910,ECFP4_911,ECFP4_912,ECFP4_913,ECFP4_914,ECFP4_915,ECFP4_916,ECFP4_917,ECFP4_918,ECFP4_919,ECFP4_920,ECFP4_921,ECFP4_922,ECFP4_923,ECFP4_924,ECFP4_925,ECFP4_926,ECFP4_927,ECFP4_928,ECFP4_929,ECFP4_930,ECFP4_931,ECFP4_932,ECFP4_933,ECFP4_934,ECFP4_935,ECFP4_936,ECFP4_937,ECFP4_938,ECFP4_939,ECFP4_940,ECFP4_941,ECFP4_942,ECFP4_943,ECFP4_944,ECFP4_945,ECFP4_946,ECFP4_947,ECFP4_948,ECFP4_949,ECFP4_950,ECFP4_951,ECFP4_952,ECFP4_953,ECFP4_954,ECFP4_955,ECFP4_956,ECFP4_957,ECFP4_958,ECFP4_959,ECFP4_960,ECFP4_961,ECFP4_962,ECFP4_963,ECFP4_964,ECFP4_965,ECFP4_966,ECFP4_967,ECFP4_968,ECFP4_969,ECFP4_970,ECFP4_971,ECFP4_972,ECFP4_973,ECFP4_974,ECFP4_975,ECFP4_976,ECFP4_977,ECFP4_978,ECFP4_979,ECFP4_980,ECFP4_981,ECFP4_982,ECFP4_983,ECFP4_984,ECFP4_985,ECFP4_986,ECFP4_987,ECFP4_988,ECFP4_989,ECFP4_990,ECFP4_991,ECFP4_992,ECFP4_993,ECFP4_994,ECFP4_995,ECFP4_996,ECFP4_997,ECFP4_998,ECFP4_999,ECFP4_1000,ECFP4_1001,ECFP4_1002,ECFP4_1003,ECFP4_1004,ECFP4_1005,ECFP4_1006,ECFP4_1007,ECFP4_1008,ECFP4_10
09,ECFP4_1010,ECFP4_1011,ECFP4_1012,ECFP4_1013,ECFP4_1014,ECFP4_1015,ECFP4_1016,ECFP4_1017,ECFP4_1018,ECFP4_1019,ECFP4_1020,ECFP4_1021,ECFP4_1022,ECFP4_1023,ECFP4_1024,pca_0,pca_1,pca_2,pca_3,pca_4,pca_5,pca_6,pca_7,pca_8,pca_9,pca_10,pca_11,pca_12,pca_13,pca_14,pca_15,pca_16,pca_17,pca_18,pca_19,pca_20,pca_21,pca_22,pca_23,pca_24,pca_25,pca_26,pca_27,pca_28,pca_29,pca_30,pca_31,pca_32,pca_33,pca_34,pca_35,pca_36,pca_37,pca_38,pca_39,pca_40,pca_41,pca_42,pca_43,pca_44,pca_45,pca_46,pca_47,pca_48,pca_49,pca_50,pca_51,pca_52,pca_53,pca_54,pca_55,pca_56,pca_57,pca_58,pca_59,pca_60,pca_61,pca_62,pca_63,pca_64,pca_65,pca_66,pca_67,pca_68,pca_69,pca_70,pca_71,pca_72,pca_73,pca_74,pca_75,pca_76,pca_77,pca_78,pca_79,pca_80,pca_81,pca_82,pca_83,pca_84,pca_85,pca_86,pca_87,pca_88,pca_89,pca_90,pca_91,pca_92,pca_93,pca_94,pca_95,pca_96,pca_97,pca_98,pca_99,pca_100,pca_101,pca_102,pca_103,pca_104,pca_105,pca_106,pca_107,pca_108,pca_109,pca_110,pca_111,pca_112,pca_113,pca_114,pca_115,pca_116,pca_117,pca_118,pca_119,pca_120,pca_121,pca_122,pca_123,pca_124,pca_125,pca_126,pca_127,Activity
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,1,0,1,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,1,1,0,0,0,1,1,0,0,0,0,0,0,0,1,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,-7.626243,-11.846932,2.181621,2.883427,-4.164511,-3.025412,-1.176717,0.194958,0.644585,-0.373791,-0.059939,-1.151247,0.351695,-1.330585,-0.113102,0.176865,-0.283759,-0.688204,0.138614,-0.372719,0.314997,-0.052979,0.014772,0.356431,0.179756,1.070953,0.444522,-0.092453,-0.526336,0.163987,-0.365356,-0.095878,0.263648,0.048336,-0.008787,-0.217316,-0.349936,-0.037208,0.203831,0.34656,0.229243,-0.073354,0.157622,-0.014819,-0.153702,-0.263785,-0.12208,0.084603,-0.057411,0.157627,-0.007216,0.003859,-0.007265,0.009786,0.11836,-0.023304,-0.053317,0.130024,-0.033925,0.177049,-0.141376,0.24719,0.159351,0.094854,-0.067168,-0.127517,0.09015,-0.033176,0.148282,-0.073813,-0.152446,-0.117549,0.050001,-0.08325,-0.008074,0.298914,-0.080444,0.107191,0.023913,0.227304,-0.087986,0.210436,0.059144,-0.415183,0.094206,0.034507,-0.042093,-0.176972,0.122428,-0.120136,0.116182,-0.09308,0.114622,0.133001,-0.089289,0.189726,-0.139854,0.039087,0.118963,0.089514,-0.088588,0.088197,0.094364,-0.105273,-0.131378,-0.072215,-0.135175,-0.001849,-0.101133,-0.070293,0.15853,0.065273,0.037905,0.071613,-0.087035,0.085425,0.055551,-0.022177,0.098678,0.060415,-0.061614,-0.131339,0.031808,0.049131,0.018394,-0.004024,-0.189193,0.033769,1
1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,-10.642493,-14.473786,29.402847,3.771606,-0.006615,-0.60986,-3.360197,2.174378,0.160712,-0.892385,-0.739158,0.338298,0.81289,-0.865568,-1.338991,-0.212996,-0.34615,0.883195,0.197303,1.060262,-1.024971,0.545317,0.105733,0.170735,0.200382,0.559315,0.417992,-0.007711,0.309836,-0.292155,-0.325514,-0.263592,-0.324977,0.136255,0.074295,-0.045194,0.028823,0.29742,0.153312,0.075171,0.170891,0.050916,-0.185067,0.027833,-0.066338,-0.017106,-0.116444,-0.082758,0.172381,-0.134892,-0.00984,-0.204481,-0.004094,0.124597,0.070535,0.073869,0.142652,0.145394,0.034182,-0.088261,-0.18831,-0.034564,-0.125205,-0.231942,-0.001536,-0.132004,-0.005005,-0.025114,-0.205839,0.059902,-0.025298,0.05377,0.076772,-0.051585,0.135781,0.043523,-0.19034,0.018994,0.049833,-0.081415,0.058884,0.174269,-0.17381,0.12485,0.028287,-0.004814,-0.147564,-0.066429,0.054995,0.073099,0.106678,0.064808,0.065724,-0.030958,0.038676,0.034664,-0.018986,0.012207,0.028871,0.260914,-0.194524,-0.140997,-0.015034,0.078196,0.067742,0.075835,0.149257,0.010034,0.043316,-0.048497,-0.033323,0.08231,-0.009727,-0.140177,0.019644,0.135408,0.07156,-0.008652,0.006445,0.07649,-0.005898,0.047445,-0.09457,-0.036108,-0.108462,0.026409,-0.061849,-0.083877,1
2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,-9.040936,-13.375031,30.047092,0.540517,-3.778347,-0.255176,-2.284647,-0.155476,1.301045,-0.250722,-1.106377,1.606184,0.669297,-0.048965,-0.920734,0.081888,0.041506,0.338175,-0.23916,1.06839,-1.090549,0.715668,-0.188631,-0.117621,0.071343,0.343115,0.235626,-0.028628,0.677921,-0.226921,0.06071,0.030761,-0.173746,0.363386,-0.160115,0.226437,0.446362,0.075632,-0.130567,-0.075392,-0.113587,0.249709,0.150407,-0.040744,0.062327,0.116705,0.108356,0.318407,0.049282,-0.170562,0.139205,-0.102848,0.051523,0.053748,-0.153476,-0.118444,0.067252,0.144337,-0.090382,-0.106932,-0.187527,-0.119072,-0.042821,0.011001,-0.251983,0.090717,0.041378,-0.178891,0.119406,0.003645,0.094842,-0.025912,-0.109966,0.063043,-0.206965,0.076332,0.221548,0.076153,-0.049734,-0.046496,0.086656,0.072398,0.077547,-0.041765,-0.030694,-0.080868,0.228547,0.163674,-0.187785,0.036867,-0.102444,0.015504,-0.127633,-0.020928,-0.079749,-0.053163,-0.058719,-0.10433,0.164384,0.253386,0.033731,-0.125032,0.098574,-0.007486,-0.130702,0.098414,0.089139,-0.086329,0.051939,-0.20252,-0.178584,0.090626,-0.07269,-0.104784,0.056251,-0.063718,0.232519,-0.070618,0.075003,0.126252,0.045264,0.073885,-0.044814,0.0766,-0.085974,0.083727,0.023021,0.14059,1


In [18]:
# Display a sample batch from the DataLoaders as a table.
dls.show_batch()

Unnamed: 0,ECFP4_1,ECFP4_2,ECFP4_3,ECFP4_4,ECFP4_5,ECFP4_6,ECFP4_7,ECFP4_8,ECFP4_9,ECFP4_10,ECFP4_11,ECFP4_12,ECFP4_13,ECFP4_14,ECFP4_15,ECFP4_16,ECFP4_17,ECFP4_18,ECFP4_19,ECFP4_20,ECFP4_21,ECFP4_22,ECFP4_23,ECFP4_24,ECFP4_25,ECFP4_26,ECFP4_27,ECFP4_28,ECFP4_29,ECFP4_30,ECFP4_31,ECFP4_32,ECFP4_33,ECFP4_34,ECFP4_35,ECFP4_36,ECFP4_37,ECFP4_38,ECFP4_39,ECFP4_40,ECFP4_41,ECFP4_42,ECFP4_43,ECFP4_44,ECFP4_45,ECFP4_46,ECFP4_47,ECFP4_48,ECFP4_49,ECFP4_50,ECFP4_51,ECFP4_52,ECFP4_53,ECFP4_54,ECFP4_55,ECFP4_56,ECFP4_57,ECFP4_58,ECFP4_59,ECFP4_60,ECFP4_61,ECFP4_62,ECFP4_63,ECFP4_64,ECFP4_65,ECFP4_66,ECFP4_67,ECFP4_68,ECFP4_69,ECFP4_70,ECFP4_71,ECFP4_72,ECFP4_73,ECFP4_74,ECFP4_75,ECFP4_76,ECFP4_77,ECFP4_78,ECFP4_79,ECFP4_80,ECFP4_81,ECFP4_82,ECFP4_83,ECFP4_84,ECFP4_85,ECFP4_86,ECFP4_87,ECFP4_88,ECFP4_89,ECFP4_90,ECFP4_91,ECFP4_92,ECFP4_93,ECFP4_94,ECFP4_95,ECFP4_96,ECFP4_97,ECFP4_98,ECFP4_99,ECFP4_100,ECFP4_101,ECFP4_102,ECFP4_103,ECFP4_104,ECFP4_105,ECFP4_106,ECFP4_107,ECFP4_108,ECFP4_109,ECFP4_110,ECFP4_111,ECFP4_112,ECFP4_113,ECFP4_114,ECFP4_115,ECFP4_116,ECFP4_117,ECFP4_118,ECFP4_119,ECFP4_120,ECFP4_121,ECFP4_122,ECFP4_123,ECFP4_124,ECFP4_125,ECFP4_126,ECFP4_127,ECFP4_128,ECFP4_129,ECFP4_130,ECFP4_131,ECFP4_132,ECFP4_133,ECFP4_134,ECFP4_135,ECFP4_136,ECFP4_137,ECFP4_138,ECFP4_139,ECFP4_140,ECFP4_141,ECFP4_142,ECFP4_143,ECFP4_144,ECFP4_145,ECFP4_146,ECFP4_147,ECFP4_148,ECFP4_149,ECFP4_150,ECFP4_151,ECFP4_152,ECFP4_153,ECFP4_154,ECFP4_155,ECFP4_156,ECFP4_157,ECFP4_158,ECFP4_159,ECFP4_160,ECFP4_161,ECFP4_162,ECFP4_163,ECFP4_164,ECFP4_165,ECFP4_166,ECFP4_167,ECFP4_168,ECFP4_169,ECFP4_170,ECFP4_171,ECFP4_172,ECFP4_173,ECFP4_174,ECFP4_175,ECFP4_176,ECFP4_177,ECFP4_178,ECFP4_179,ECFP4_180,ECFP4_181,ECFP4_182,ECFP4_183,ECFP4_184,ECFP4_185,ECFP4_186,ECFP4_187,ECFP4_188,ECFP4_189,ECFP4_190,ECFP4_191,ECFP4_192,ECFP4_193,ECFP4_194,ECFP4_195,ECFP4_196,ECFP4_197,ECFP4_198,ECFP4_199,ECFP4_200,ECFP4_201,ECFP4_202,ECFP4_203,ECFP4_204,ECFP4_205,ECFP4_206,ECFP4_207,ECFP4_208,ECFP4_209,ECFP4_2
10,ECFP4_211,ECFP4_212,ECFP4_213,ECFP4_214,ECFP4_215,ECFP4_216,ECFP4_217,ECFP4_218,ECFP4_219,ECFP4_220,ECFP4_221,ECFP4_222,ECFP4_223,ECFP4_224,ECFP4_225,ECFP4_226,ECFP4_227,ECFP4_228,ECFP4_229,ECFP4_230,ECFP4_231,ECFP4_232,ECFP4_233,ECFP4_234,ECFP4_235,ECFP4_236,ECFP4_237,ECFP4_238,ECFP4_239,ECFP4_240,ECFP4_241,ECFP4_242,ECFP4_243,ECFP4_244,ECFP4_245,ECFP4_246,ECFP4_247,ECFP4_248,ECFP4_249,ECFP4_250,ECFP4_251,ECFP4_252,ECFP4_253,ECFP4_254,ECFP4_255,ECFP4_256,ECFP4_257,ECFP4_258,ECFP4_259,ECFP4_260,ECFP4_261,ECFP4_262,ECFP4_263,ECFP4_264,ECFP4_265,ECFP4_266,ECFP4_267,ECFP4_268,ECFP4_269,ECFP4_270,ECFP4_271,ECFP4_272,ECFP4_273,ECFP4_274,ECFP4_275,ECFP4_276,ECFP4_277,ECFP4_278,ECFP4_279,ECFP4_280,ECFP4_281,ECFP4_282,ECFP4_283,ECFP4_284,ECFP4_285,ECFP4_286,ECFP4_287,ECFP4_288,ECFP4_289,ECFP4_290,ECFP4_291,ECFP4_292,ECFP4_293,ECFP4_294,ECFP4_295,ECFP4_296,ECFP4_297,ECFP4_298,ECFP4_299,ECFP4_300,ECFP4_301,ECFP4_302,ECFP4_303,ECFP4_304,ECFP4_305,ECFP4_306,ECFP4_307,ECFP4_308,ECFP4_309,ECFP4_310,ECFP4_311,ECFP4_312,ECFP4_313,ECFP4_314,ECFP4_315,ECFP4_316,ECFP4_317,ECFP4_318,ECFP4_319,ECFP4_320,ECFP4_321,ECFP4_322,ECFP4_323,ECFP4_324,ECFP4_325,ECFP4_326,ECFP4_327,ECFP4_328,ECFP4_329,ECFP4_330,ECFP4_331,ECFP4_332,ECFP4_333,ECFP4_334,ECFP4_335,ECFP4_336,ECFP4_337,ECFP4_338,ECFP4_339,ECFP4_340,ECFP4_341,ECFP4_342,ECFP4_343,ECFP4_344,ECFP4_345,ECFP4_346,ECFP4_347,ECFP4_348,ECFP4_349,ECFP4_350,ECFP4_351,ECFP4_352,ECFP4_353,ECFP4_354,ECFP4_355,ECFP4_356,ECFP4_357,ECFP4_358,ECFP4_359,ECFP4_360,ECFP4_361,ECFP4_362,ECFP4_363,ECFP4_364,ECFP4_365,ECFP4_366,ECFP4_367,ECFP4_368,ECFP4_369,ECFP4_370,ECFP4_371,ECFP4_372,ECFP4_373,ECFP4_374,ECFP4_375,ECFP4_376,ECFP4_377,ECFP4_378,ECFP4_379,ECFP4_380,ECFP4_381,ECFP4_382,ECFP4_383,ECFP4_384,ECFP4_385,ECFP4_386,ECFP4_387,ECFP4_388,ECFP4_389,ECFP4_390,ECFP4_391,ECFP4_392,ECFP4_393,ECFP4_394,ECFP4_395,ECFP4_396,ECFP4_397,ECFP4_398,ECFP4_399,ECFP4_400,ECFP4_401,ECFP4_402,ECFP4_403,ECFP4_404,ECFP4_405,ECFP4_406,ECFP4_407,ECFP4_408,ECFP4_409,ECFP4_4
10,ECFP4_411,ECFP4_412,ECFP4_413,ECFP4_414,ECFP4_415,ECFP4_416,ECFP4_417,ECFP4_418,ECFP4_419,ECFP4_420,ECFP4_421,ECFP4_422,ECFP4_423,ECFP4_424,ECFP4_425,ECFP4_426,ECFP4_427,ECFP4_428,ECFP4_429,ECFP4_430,ECFP4_431,ECFP4_432,ECFP4_433,ECFP4_434,ECFP4_435,ECFP4_436,ECFP4_437,ECFP4_438,ECFP4_439,ECFP4_440,ECFP4_441,ECFP4_442,ECFP4_443,ECFP4_444,ECFP4_445,ECFP4_446,ECFP4_447,ECFP4_448,ECFP4_449,ECFP4_450,ECFP4_451,ECFP4_452,ECFP4_453,ECFP4_454,ECFP4_455,ECFP4_456,ECFP4_457,ECFP4_458,ECFP4_459,ECFP4_460,ECFP4_461,ECFP4_462,ECFP4_463,ECFP4_464,ECFP4_465,ECFP4_466,ECFP4_467,ECFP4_468,ECFP4_469,ECFP4_470,ECFP4_471,ECFP4_472,ECFP4_473,ECFP4_474,ECFP4_475,ECFP4_476,ECFP4_477,ECFP4_478,ECFP4_479,ECFP4_480,ECFP4_481,ECFP4_482,ECFP4_483,ECFP4_484,ECFP4_485,ECFP4_486,ECFP4_487,ECFP4_488,ECFP4_489,ECFP4_490,ECFP4_491,ECFP4_492,ECFP4_493,ECFP4_494,ECFP4_495,ECFP4_496,ECFP4_497,ECFP4_498,ECFP4_499,ECFP4_500,ECFP4_501,ECFP4_502,ECFP4_503,ECFP4_504,ECFP4_505,ECFP4_506,ECFP4_507,ECFP4_508,ECFP4_509,ECFP4_510,ECFP4_511,ECFP4_512,ECFP4_513,ECFP4_514,ECFP4_515,ECFP4_516,ECFP4_517,ECFP4_518,ECFP4_519,ECFP4_520,ECFP4_521,ECFP4_522,ECFP4_523,ECFP4_524,ECFP4_525,ECFP4_526,ECFP4_527,ECFP4_528,ECFP4_529,ECFP4_530,ECFP4_531,ECFP4_532,ECFP4_533,ECFP4_534,ECFP4_535,ECFP4_536,ECFP4_537,ECFP4_538,ECFP4_539,ECFP4_540,ECFP4_541,ECFP4_542,ECFP4_543,ECFP4_544,ECFP4_545,ECFP4_546,ECFP4_547,ECFP4_548,ECFP4_549,ECFP4_550,ECFP4_551,ECFP4_552,ECFP4_553,ECFP4_554,ECFP4_555,ECFP4_556,ECFP4_557,ECFP4_558,ECFP4_559,ECFP4_560,ECFP4_561,ECFP4_562,ECFP4_563,ECFP4_564,ECFP4_565,ECFP4_566,ECFP4_567,ECFP4_568,ECFP4_569,ECFP4_570,ECFP4_571,ECFP4_572,ECFP4_573,ECFP4_574,ECFP4_575,ECFP4_576,ECFP4_577,ECFP4_578,ECFP4_579,ECFP4_580,ECFP4_581,ECFP4_582,ECFP4_583,ECFP4_584,ECFP4_585,ECFP4_586,ECFP4_587,ECFP4_588,ECFP4_589,ECFP4_590,ECFP4_591,ECFP4_592,ECFP4_593,ECFP4_594,ECFP4_595,ECFP4_596,ECFP4_597,ECFP4_598,ECFP4_599,ECFP4_600,ECFP4_601,ECFP4_602,ECFP4_603,ECFP4_604,ECFP4_605,ECFP4_606,ECFP4_607,ECFP4_608,ECFP4_609,ECFP4_6
10,ECFP4_611,ECFP4_612,ECFP4_613,ECFP4_614,ECFP4_615,ECFP4_616,ECFP4_617,ECFP4_618,ECFP4_619,ECFP4_620,ECFP4_621,ECFP4_622,ECFP4_623,ECFP4_624,ECFP4_625,ECFP4_626,ECFP4_627,ECFP4_628,ECFP4_629,ECFP4_630,ECFP4_631,ECFP4_632,ECFP4_633,ECFP4_634,ECFP4_635,ECFP4_636,ECFP4_637,ECFP4_638,ECFP4_639,ECFP4_640,ECFP4_641,ECFP4_642,ECFP4_643,ECFP4_644,ECFP4_645,ECFP4_646,ECFP4_647,ECFP4_648,ECFP4_649,ECFP4_650,ECFP4_651,ECFP4_652,ECFP4_653,ECFP4_654,ECFP4_655,ECFP4_656,ECFP4_657,ECFP4_658,ECFP4_659,ECFP4_660,ECFP4_661,ECFP4_662,ECFP4_663,ECFP4_664,ECFP4_665,ECFP4_666,ECFP4_667,ECFP4_668,ECFP4_669,ECFP4_670,ECFP4_671,ECFP4_672,ECFP4_673,ECFP4_674,ECFP4_675,ECFP4_676,ECFP4_677,ECFP4_678,ECFP4_679,ECFP4_680,ECFP4_681,ECFP4_682,ECFP4_683,ECFP4_684,ECFP4_685,ECFP4_686,ECFP4_687,ECFP4_688,ECFP4_689,ECFP4_690,ECFP4_691,ECFP4_692,ECFP4_693,ECFP4_694,ECFP4_695,ECFP4_696,ECFP4_697,ECFP4_698,ECFP4_699,ECFP4_700,ECFP4_701,ECFP4_702,ECFP4_703,ECFP4_704,ECFP4_705,ECFP4_706,ECFP4_707,ECFP4_708,ECFP4_709,ECFP4_710,ECFP4_711,ECFP4_712,ECFP4_713,ECFP4_714,ECFP4_715,ECFP4_716,ECFP4_717,ECFP4_718,ECFP4_719,ECFP4_720,ECFP4_721,ECFP4_722,ECFP4_723,ECFP4_724,ECFP4_725,ECFP4_726,ECFP4_727,ECFP4_728,ECFP4_729,ECFP4_730,ECFP4_731,ECFP4_732,ECFP4_733,ECFP4_734,ECFP4_735,ECFP4_736,ECFP4_737,ECFP4_738,ECFP4_739,ECFP4_740,ECFP4_741,ECFP4_742,ECFP4_743,ECFP4_744,ECFP4_745,ECFP4_746,ECFP4_747,ECFP4_748,ECFP4_749,ECFP4_750,ECFP4_751,ECFP4_752,ECFP4_753,ECFP4_754,ECFP4_755,ECFP4_756,ECFP4_757,ECFP4_758,ECFP4_759,ECFP4_760,ECFP4_761,ECFP4_762,ECFP4_763,ECFP4_764,ECFP4_765,ECFP4_766,ECFP4_767,ECFP4_768,ECFP4_769,ECFP4_770,ECFP4_771,ECFP4_772,ECFP4_773,ECFP4_774,ECFP4_775,ECFP4_776,ECFP4_777,ECFP4_778,ECFP4_779,ECFP4_780,ECFP4_781,ECFP4_782,ECFP4_783,ECFP4_784,ECFP4_785,ECFP4_786,ECFP4_787,ECFP4_788,ECFP4_789,ECFP4_790,ECFP4_791,ECFP4_792,ECFP4_793,ECFP4_794,ECFP4_795,ECFP4_796,ECFP4_797,ECFP4_798,ECFP4_799,ECFP4_800,ECFP4_801,ECFP4_802,ECFP4_803,ECFP4_804,ECFP4_805,ECFP4_806,ECFP4_807,ECFP4_808,ECFP4_809,ECFP4_8
10,ECFP4_811,ECFP4_812,ECFP4_813,ECFP4_814,ECFP4_815,ECFP4_816,ECFP4_817,ECFP4_818,ECFP4_819,ECFP4_820,ECFP4_821,ECFP4_822,ECFP4_823,ECFP4_824,ECFP4_825,ECFP4_826,ECFP4_827,ECFP4_828,ECFP4_829,ECFP4_830,ECFP4_831,ECFP4_832,ECFP4_833,ECFP4_834,ECFP4_835,ECFP4_836,ECFP4_837,ECFP4_838,ECFP4_839,ECFP4_840,ECFP4_841,ECFP4_842,ECFP4_843,ECFP4_844,ECFP4_845,ECFP4_846,ECFP4_847,ECFP4_848,ECFP4_849,ECFP4_850,ECFP4_851,ECFP4_852,ECFP4_853,ECFP4_854,ECFP4_855,ECFP4_856,ECFP4_857,ECFP4_858,ECFP4_859,ECFP4_860,ECFP4_861,ECFP4_862,ECFP4_863,ECFP4_864,ECFP4_865,ECFP4_866,ECFP4_867,ECFP4_868,ECFP4_869,ECFP4_870,ECFP4_871,ECFP4_872,ECFP4_873,ECFP4_874,ECFP4_875,ECFP4_876,ECFP4_877,ECFP4_878,ECFP4_879,ECFP4_880,ECFP4_881,ECFP4_882,ECFP4_883,ECFP4_884,ECFP4_885,ECFP4_886,ECFP4_887,ECFP4_888,ECFP4_889,ECFP4_890,ECFP4_891,ECFP4_892,ECFP4_893,ECFP4_894,ECFP4_895,ECFP4_896,ECFP4_897,ECFP4_898,ECFP4_899,ECFP4_900,ECFP4_901,ECFP4_902,ECFP4_903,ECFP4_904,ECFP4_905,ECFP4_906,ECFP4_907,ECFP4_908,ECFP4_909,ECFP4_910,ECFP4_911,ECFP4_912,ECFP4_913,ECFP4_914,ECFP4_915,ECFP4_916,ECFP4_917,ECFP4_918,ECFP4_919,ECFP4_920,ECFP4_921,ECFP4_922,ECFP4_923,ECFP4_924,ECFP4_925,ECFP4_926,ECFP4_927,ECFP4_928,ECFP4_929,ECFP4_930,ECFP4_931,ECFP4_932,ECFP4_933,ECFP4_934,ECFP4_935,ECFP4_936,ECFP4_937,ECFP4_938,ECFP4_939,ECFP4_940,ECFP4_941,ECFP4_942,ECFP4_943,ECFP4_944,ECFP4_945,ECFP4_946,ECFP4_947,ECFP4_948,ECFP4_949,ECFP4_950,ECFP4_951,ECFP4_952,ECFP4_953,ECFP4_954,ECFP4_955,ECFP4_956,ECFP4_957,ECFP4_958,ECFP4_959,ECFP4_960,ECFP4_961,ECFP4_962,ECFP4_963,ECFP4_964,ECFP4_965,ECFP4_966,ECFP4_967,ECFP4_968,ECFP4_969,ECFP4_970,ECFP4_971,ECFP4_972,ECFP4_973,ECFP4_974,ECFP4_975,ECFP4_976,ECFP4_977,ECFP4_978,ECFP4_979,ECFP4_980,ECFP4_981,ECFP4_982,ECFP4_983,ECFP4_984,ECFP4_985,ECFP4_986,ECFP4_987,ECFP4_988,ECFP4_989,ECFP4_990,ECFP4_991,ECFP4_992,ECFP4_993,ECFP4_994,ECFP4_995,ECFP4_996,ECFP4_997,ECFP4_998,ECFP4_999,ECFP4_1000,ECFP4_1001,ECFP4_1002,ECFP4_1003,ECFP4_1004,ECFP4_1005,ECFP4_1006,ECFP4_1007,ECFP4_1008,ECFP4_10
09,ECFP4_1010,ECFP4_1011,ECFP4_1012,ECFP4_1013,ECFP4_1014,ECFP4_1015,ECFP4_1016,ECFP4_1017,ECFP4_1018,ECFP4_1019,ECFP4_1020,ECFP4_1021,ECFP4_1022,ECFP4_1023,ECFP4_1024,pca_0,pca_1,pca_2,pca_3,pca_4,pca_5,pca_6,pca_7,pca_8,pca_9,pca_10,pca_11,pca_12,pca_13,pca_14,pca_15,pca_16,pca_17,pca_18,pca_19,pca_20,pca_21,pca_22,pca_23,pca_24,pca_25,pca_26,pca_27,pca_28,pca_29,pca_30,pca_31,pca_32,pca_33,pca_34,pca_35,pca_36,pca_37,pca_38,pca_39,pca_40,pca_41,pca_42,pca_43,pca_44,pca_45,pca_46,pca_47,pca_48,pca_49,pca_50,pca_51,pca_52,pca_53,pca_54,pca_55,pca_56,pca_57,pca_58,pca_59,pca_60,pca_61,pca_62,pca_63,pca_64,pca_65,pca_66,pca_67,pca_68,pca_69,pca_70,pca_71,pca_72,pca_73,pca_74,pca_75,pca_76,pca_77,pca_78,pca_79,pca_80,pca_81,pca_82,pca_83,pca_84,pca_85,pca_86,pca_87,pca_88,pca_89,pca_90,pca_91,pca_92,pca_93,pca_94,pca_95,pca_96,pca_97,pca_98,pca_99,pca_100,pca_101,pca_102,pca_103,pca_104,pca_105,pca_106,pca_107,pca_108,pca_109,pca_110,pca_111,pca_112,pca_113,pca_114,pca_115,pca_116,pca_117,pca_118,pca_119,pca_120,pca_121,pca_122,pca_123,pca_124,pca_125,pca_126,pca_127,Activity
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,
0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,-23.414692,17.367395,-0.56707,-2.258919,2.941819,-1.069853,-0.46085,0.009324,1.385928,-0.838153,-0.690136,0.73501,-0.335573,-0.441801,0.708819,-0.070971,0.440361,0.315317,0.161827,-0.372513,0.310928,0.298683,-0.167921,-0.618924,-0.465926,-0.328647,-0.639408,0.287938,0.260239,-0.406381,-0.177062,-0.00789,-0.159858,0.008463,0.032187,0.107971,-0.123364,0.261635,-0.155557,0.413912,-0.060697,-0.020867,-0.108947,-0.060487,-0.099331,-0.145221,-0.172442,-0.127735,-0.26639,0.346915,0.035868,-0.131664,0.237931,-0.193124,-0.086544,0.137069,-0.118297,-0.009448,0.112613,-0.040571,-0.133156,-0.214963,-0.195147,0.20211,-0.161206,0.003007,0.444735,0.232208,-0.408421,-0.082563,0.070576,-0.055187,-0.052134,0.095305,-0.096178,-0.100429,0.162558,-0.011645,-0.086803,-0.038043,0.003376,-0.07196,0.336396,0.005932,0.158437,0.071403,0.084629,-0.087787,0.021154,0.16718,-0.09187,0.207595,-0.040144,-0.053504,-0.057594,-0.122718,0.000962,0.200552,-0.044998,0.035926,-0.014885,0.068906,0.027022,0.021801,-0.148385,0.00484,0.18128,0.130153,-0.258649,0.199445,-0.00226,0.113933,-0.007046,0.255071,0.088929,0.056722,-0.068876,-0.166346,0.027573,-0.061661,0.1137,-0.009143,0.098965,-0.176308,-0.026539,-0.064741,0.283923,0.031125,0
1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.580123,-8.157248,-5.330592,-1.090514,0.402345,3.446673,0.834178,-0.249051,-0.371038,1.291344,-0.082128,0.098678,-0.560427,-0.804397,0.455517,-0.066798,-0.942268,0.091028,-0.451757,0.640092,0.419408,0.077473,0.054529,-0.042357,-0.107825,0.202582,0.225008,-0.074648,0.070041,-0.01152,0.227688,0.229352,0.00246,0.111817,0.100184,0.034532,0.294381,-0.071308,0.311113,-0.224276,-0.181229,-0.042759,-0.008869,-0.168246,0.127332,-0.289468,0.080501,-0.018348,-0.142706,-0.08249,-0.303341,0.155064,0.106941,0.220404,-0.048545,0.048206,0.110674,-0.164371,-0.038507,-0.149049,-0.012023,-0.097599,-0.069822,0.1237,0.025696,-0.123554,0.197152,-0.045825,0.086322,-0.051978,-0.011258,-0.085686,-0.033766,0.127918,-0.08204,-0.185318,0.016197,0.067314,-0.117194,-0.14208,-0.100158,-0.022822,0.115577,-0.020305,0.063366,-0.051085,-0.113358,-0.103866,0.047256,-0.117943,0.027892,-0.066433,0.049052,0.024147,0.076209,0.06715,0.028419,-0.073025,0.089591,-0.005654,0.083331,-0.014071,0.115386,0.036998,0.063574,0.06088,-0.117809,0.098031,-0.055998,0.047993,0.056828,0.08757,-0.019525,0.045241,0.1039,-0.057234,-0.072135,0.065073,0.056261,-0.084389,-0.051685,0.064481,-0.145076,0.049177,-0.207601,0.039722,0.070079,-1e-05,0


# Loss function with weighted classes

In [19]:
def get_loss_func(df):
    """Build a class-weighted cross-entropy loss for the binary 'Activity' target.

    Each class c gets the weight ``N / (2 * n_c)``, where ``N`` is the number of
    rows with a non-null target and ``n_c`` the number of rows in class c, so
    the rarer class contributes proportionally more to the loss.

    Args:
        df: DataFrame containing an 'Activity' column with exactly two classes.

    Returns:
        A ``CrossEntropyLossFlat`` whose ``weight`` tensor is ``[w_0, w_1]``
        (classes in sorted label order), placed on the GPU when one is
        available and on the CPU otherwise.

    Raises:
        ValueError: if 'Activity' does not contain exactly two distinct classes.
    """
    TARGET = 'Activity'
    # Count the target column itself: counting an arbitrary other column would
    # silently undercount a class whenever that column holds missing values.
    class_counts = df[TARGET].value_counts().sort_index()
    if len(class_counts) != 2:
        raise ValueError(
            f"Expected exactly 2 classes in '{TARGET}', found {len(class_counts)}"
        )
    n_0, n_1 = class_counts.iloc[0], class_counts.iloc[1]
    total = n_0 + n_1
    w_0 = total / (2.0 * n_0)
    w_1 = total / (2.0 * n_1)
    print(w_0)
    print(w_1)
    # Do not assume a GPU is present; fall back to the CPU instead of crashing.
    device = 'cuda' if torch.cuda.is_available() else 'cpu'
    class_weights = torch.tensor([w_0, w_1], dtype=torch.float32, device=device)
    return CrossEntropyLossFlat(weight=class_weights)

In [20]:
# Build the class-weighted loss from `df`; the two values printed below are the
# weights for class 0 and class 1, in that order.
loss_func = get_loss_func(df)

0.55
5.5


# Train tabular DNN model

In [21]:
def train_model(dls, dataset, loss_func=None, epochs=11, wd=None, layers=[200,100]):
    """Train a fastai tabular learner with the one-cycle policy and return it.

    Args:
        dls: DataLoaders to train and validate on.
        dataset: Name of the dataset; only used in the progress messages.
        loss_func: Loss function handed to the learner. When None, it is left
            to fastai to choose one.
        epochs: Number of epochs passed to ``fit_one_cycle``.
        wd: Weight decay handed to the learner (None keeps the library default).
        layers: Sizes of the hidden linear layers of the tabular model.

    Returns:
        The trained learner (mixed precision enabled via ``to_fp16``).
    """
    print(f'Training model on dataset: {dataset}')
    print(f'Trained epochs: epochs={epochs}')

    metrics = [accuracy,
               F1Score(),
               Precision(),
               Recall(),
               RocAucBinary(),
               MatthewsCorrCoef()]

    # Forward the caller's `layers` and `loss_func`; a copy of `layers` is
    # passed so the shared default list can never be mutated downstream.
    learn = tabular_learner(dls,
                            layers=list(layers),
                            loss_func=loss_func,
                            wd=wd,
                            metrics=metrics).to_fp16()

    # fit_one_cycle trains in place and returns nothing, so no call may be
    # chained onto its result.
    learn.fit_one_cycle(epochs)

    return learn

In [22]:
# Smoke-test run: a single epoch, using the class-weighted loss built above so
# the class imbalance is actually accounted for during training.
train_model(dls, dataset, loss_func=loss_func, epochs=1)

Training model on dataset: CHEMBL205
Trained epochs: epochs=1


epoch,train_loss,valid_loss,accuracy,f1_score,precision_score,recall_score,roc_auc_score,matthews_corrcoef,time


RuntimeError: CUDA out of memory. Tried to allocate 20.00 MiB (GPU 0; 7.93 GiB total capacity; 6.14 GiB already allocated; 21.69 MiB free; 6.60 GiB reserved in total by PyTorch)

# Test parameters

In [None]:
from sklearn.model_selection import ParameterGrid

In [None]:
# Hidden-layer layouts to sweep over: every candidate is [width, width // 2].
param_grid = ParameterGrid({
    'layers': [[width, width // 2] for width in (200, 300, 400, 500, 600, 700, 1000)],
})

In [None]:
def train_with_parameters(dataset_idx=0, grid=None):
    """Train one tabular model per parameter setting on a single dataset.

    Reads ``<dataset>_ecfp_512.csv`` from the notebook-level ``path``, makes a
    stratified 80/20 train/validation split on 'Activity', treats every column
    except CID, SMILES and Activity as a categorical feature, and calls
    ``train_model`` once for each setting in the grid.

    Args:
        dataset_idx: Index into the internal dataset list (0 selects
            'CHEMBL205_cl', which is what the function always used before).
        grid: Iterable of dicts with a 'layers' key. When None, the
            notebook-level ``param_grid`` is used.

    Returns:
        None. Metrics are reported through the training output only.
    """
    import gc

    datasets = ['CHEMBL205_cl', 'CHEMBL301_cl', 'CHEMBL218_cl',
                'CHEMBL240_cl', 'CHEMBL219_cl',
                'CHEMBL244_cl', 'CHEMBL1978_cl']
    dataset = datasets[dataset_idx]
    settings = param_grid if grid is None else grid

    df = pd.read_csv(path/f'{dataset}_ecfp_512.csv')

    # Stratify so both splits keep the same active/inactive ratio.
    train_idx, valid_idx = train_test_split(df.index, test_size=0.2, random_state=42, stratify=df['Activity'])
    splits = (list(train_idx), list(valid_idx))
    procs = [Categorify]

    dep_var = ['Activity']
    # Every remaining column is fed to the model as a categorical variable.
    cat_names = list(df.drop(["CID", "SMILES", "Activity"], axis=1).columns)

    to = TabularPandas(df,
                       procs,
                       cat_names=cat_names,
                       y_names=dep_var,
                       splits=splits,
                       y_block=CategoryBlock())
    dls = to.dataloaders()

    for setting in settings:
        print(f"Training with layers: {setting['layers']}")
        learn = train_model(dls, dataset, layers=setting['layers'])

        # The learner is not used after training; drop it and hand cached GPU
        # memory back so successive (larger) models do not pile up on the device.
        del learn
        gc.collect()
        if torch.cuda.is_available():
            torch.cuda.empty_cache()
        

In [None]:
# Run the layer-size sweep: trains one model per entry in `param_grid`.
train_with_parameters()