In [1]:
import pandas as pd
import numpy as np
import json
from math import log, floor
from sklearn.model_selection import train_test_split, KFold
from sklearn.linear_model import LogisticRegression, RidgeClassifier, SGDClassifier, LinearRegression
from sklearn.naive_bayes import MultinomialNB
from sklearn.metrics import roc_auc_score
from sklearn.preprocessing import MinMaxScaler, OneHotEncoder, LabelEncoder
from sklearn.neural_network import MLPClassifier
from sklearn.ensemble import RandomForestClassifier, ExtraTreesClassifier, AdaBoostClassifier, GradientBoostingClassifier
from gensim.models.doc2vec import Doc2Vec, TaggedDocument

import warnings
warnings.filterwarnings("ignore")

In [2]:
# Load the preprocessed table and the JSON config that maps a feature-family
# name to the list of DataFrame columns belonging to it.
df = pd.read_csv('./Data/preprocessed_data.csv')
with open('./Data/feature_config.json') as json_data:
  features = json.load(json_data)

# Columns from these families are rescaled by dividing each column by its own
# maximum. The scaled copies are re-attached at the end of the frame, so they
# end up after all untouched columns.
len_columns = [
  column
  for family in ('length', 'core_count', 'unique', 'blosum_sum', 'blosum')
  for column in features[family]
]
len_fea = df[len_columns]
len_fea = len_fea / len_fea.max()
df = df.drop(columns=len_columns).join(len_fea)

# One-hot encode the categorical families, then keep only the generated
# indicator columns by dropping every original column that was not encoded.
origin_cols = df.columns
onehot_columns = [
  column
  for family in ('hla', 'core', 'PFR', 'cluster')
  for column in features[family]
]
one_hot = pd.get_dummies(data=df, columns=onehot_columns).drop(
  columns=set(origin_cols).difference(onehot_columns)
)


In [3]:
def hla_preprocess(df, classes_path='./Data/hla_encoder_classes.npy'):
  """Replace the 'hla' column of ``df`` with integer codes from a saved encoding.

  The LabelEncoder is not fitted here. Its ``classes_`` array is loaded from
  ``classes_path`` so that the codes match whatever encoding produced that
  file. The file can be regenerated with::

      hla_encoder.fit(df['hla'])
      np.save('Data/hla_encoder_classes.npy', hla_encoder.classes_)

  Args:
    df: DataFrame with an 'hla' column. It is modified in place.
    classes_path: Path of the ``.npy`` file holding the encoder classes.
      Defaults to the location this notebook has always used.

  Returns:
    The same ``df`` object, with 'hla' overwritten by the encoded values.

  Raises:
    ValueError: from ``LabelEncoder.transform`` if ``df['hla']`` contains a
      label that is not present in the loaded classes.
  """
  hla_encoder = LabelEncoder()
  # NOTE(review): if the saved array has object dtype, recent NumPy versions
  # refuse to load it without allow_pickle=True -- confirm the file's dtype
  # before enabling pickle loading.
  hla_encoder.classes_ = np.load(classes_path)
  df['hla'] = hla_encoder.transform(df['hla'])
  return df

# Load the vector features and encode their 'hla' column so it can be used as
# a merge key against df.
v = pd.read_csv('./Data/vectors_data.csv')
v = hla_preprocess(v)

# one_hot was built from df before this merge and is joined back to df by row
# index in the next cell, so the merge must return exactly one row per df row.
# validate='many_to_one' makes pandas raise MergeError if v holds a duplicated
# (peptide, hla) key, instead of silently adding rows and shifting every row
# after the first duplicate out of alignment with one_hot.
df = pd.merge(df, v, on=['peptide', 'hla'], how='left', validate='many_to_one')

# Numeric columns joined onto the one-hot block: blosum, unique and core
# tf-idf families, every vector column from v, and the 'aff' target.
columns = (
  features['blosum']
  + features['unique']
  + features['core_tfidf']
  + [c for c in list(v.columns) if c not in ['peptide', 'hla']]
  + ['aff']
)
cols_to_drop = ['aff', 'peptide', 'core', 'LPFR', 'RPFR', 'true_index', 'n_label']

In [4]:
# Assemble the modelling table: the one-hot block plus the selected numeric
# columns (aligned on the row index), with exact duplicate rows removed.
data = one_hot.join(df[columns]).drop_duplicates()

# Binary target: 1 when 'aff' is at or above 1 - log(500)/log(50000)
# (about 0.4256), otherwise 0. The cutoff is computed once and compared
# vectorised rather than re-evaluating two logarithms in a Python lambda for
# every row. A NaN 'aff' compares False and is labelled 0, as before.
# NOTE(review): this looks like a 500 nM cutoff on a log-transformed affinity
# scale -- confirm against how 'aff' was produced.
aff_threshold = 1 - log(500) / log(50000)
y = (data['aff'] >= aff_threshold).astype('int64')

# Remove the target from the features and fill any remaining gaps (for
# example rows with no match in the vector table) with 0.
data = data.drop(columns='aff').fillna(0)

# Stratified 80/20 split with a fixed seed for reproducibility.
xtrain, xvalid, ytrain, yvalid = train_test_split(
  data, y,
  stratify=y,
  random_state=42,
  test_size=0.2,
  shuffle=True,
)
result = {}

# Scale the features to [0, 1] for Naive Bayes. The scaler is fitted on the
# training split only, so validation values outside the training range can
# still fall outside [0, 1].
scl = MinMaxScaler()
xtrain_svd_scl = scl.fit_transform(xtrain)
xvalid_svd_scl = scl.transform(xvalid)

In [5]:
# Raise the global column display limit so wide frames are rendered in full
# (the setting persists for later cells), then preview the first two rows.
pd.set_option('display.max_columns', 1200)
data.head(n=2)

Unnamed: 0,hla_0,hla_2,hla_3,hla_5,hla_6,hla_7,hla_8,hla_9,hla_12,hla_13,hla_14,hla_17,hla_18,hla_19,hla_20,hla_21,hla_22,hla_23,hla_25,hla_26,hla_28,hla_29,hla_30,hla_31,hla_32,hla_33,hla_34,hla_36,hla_37,hla_38,hla_40,hla_41,hla_42,hla_43,hla_44,hla_45,hla_46,hla_47,hla_48,hla_49,hla_50,hla_51,hla_52,hla_53,hla_54,hla_55,hla_56,hla_59,hla_60,hla_62,hla_63,hla_64,hla_65,hla_67,hla_68,hla_71,hla_72,hla_73,hla_74,hla_75,hla_76,hla_77,hla_79,allele_type_0,allele_type_1,allele_type_2,allele_type_3,core_P1_1,core_P1_2,core_P1_3,core_P1_4,core_P1_5,core_P1_6,core_P1_7,core_P1_8,core_P1_9,core_P1_10,core_P1_11,core_P1_12,core_P1_13,core_P1_14,core_P1_15,core_P1_16,core_P1_17,core_P1_18,core_P1_19,core_P1_20,core_P2_1,core_P2_2,core_P2_3,core_P2_4,core_P2_5,core_P2_6,core_P2_7,core_P2_8,core_P2_9,core_P2_10,core_P2_11,core_P2_12,core_P2_13,core_P2_14,core_P2_15,core_P2_16,core_P2_17,core_P2_18,core_P2_19,core_P2_20,core_P3_1,core_P3_2,core_P3_3,core_P3_4,core_P3_5,core_P3_6,core_P3_7,core_P3_8,core_P3_9,core_P3_10,core_P3_11,core_P3_12,core_P3_13,core_P3_14,core_P3_15,core_P3_16,core_P3_17,core_P3_18,core_P3_19,core_P3_20,core_P4_1,core_P4_2,core_P4_3,core_P4_4,core_P4_5,core_P4_6,core_P4_7,core_P4_8,core_P4_9,core_P4_10,core_P4_11,core_P4_12,core_P4_13,core_P4_14,core_P4_15,core_P4_16,core_P4_17,core_P4_18,core_P4_19,core_P4_20,core_P5_1,core_P5_2,core_P5_3,core_P5_4,core_P5_5,core_P5_6,core_P5_7,core_P5_8,core_P5_9,core_P5_10,core_P5_11,core_P5_12,core_P5_13,core_P5_14,core_P5_15,core_P5_16,core_P5_17,core_P5_18,core_P5_19,core_P5_20,core_P6_1,core_P6_2,core_P6_3,core_P6_4,core_P6_5,core_P6_6,core_P6_7,core_P6_8,core_P6_9,core_P6_10,core_P6_11,core_P6_12,core_P6_13,core_P6_14,core_P6_15,core_P6_16,core_P6_17,core_P6_18,core_P6_19,core_P6_20,core_P7_1,core_P7_2,core_P7_3,core_P7_4,core_P7_5,core_P7_6,core_P7_7,core_P7_8,core_P7_9,core_P7_10,core_P7_11,core_P7_12,core_P7_13,core_P7_14,core_P7_15,core_P7_16,core_P7_17,core_P7_18,core_P7_19,core_P7_20,core_P8_1,core_P8_2,cor
e_P8_3,core_P8_4,core_P8_5,core_P8_6,core_P8_7,core_P8_8,core_P8_9,core_P8_10,core_P8_11,core_P8_12,core_P8_13,core_P8_14,core_P8_15,core_P8_16,core_P8_17,core_P8_18,core_P8_19,core_P8_20,core_P9_1,core_P9_2,core_P9_3,core_P9_4,core_P9_5,core_P9_6,core_P9_7,core_P9_8,core_P9_9,core_P9_10,core_P9_11,core_P9_12,core_P9_13,core_P9_14,core_P9_15,core_P9_16,core_P9_17,core_P9_18,core_P9_19,core_P9_20,LPFR_P1_0,LPFR_P1_1,LPFR_P1_2,LPFR_P1_3,LPFR_P1_4,LPFR_P1_5,LPFR_P1_6,LPFR_P1_7,LPFR_P1_8,LPFR_P1_9,LPFR_P1_10,LPFR_P1_11,LPFR_P1_12,LPFR_P1_13,LPFR_P1_14,LPFR_P1_15,LPFR_P1_16,LPFR_P1_17,LPFR_P1_18,LPFR_P1_19,LPFR_P1_20,LPFR_P2_0,LPFR_P2_1,LPFR_P2_2,LPFR_P2_3,LPFR_P2_4,LPFR_P2_5,LPFR_P2_6,LPFR_P2_7,LPFR_P2_8,LPFR_P2_9,LPFR_P2_10,LPFR_P2_11,LPFR_P2_12,LPFR_P2_13,LPFR_P2_14,LPFR_P2_15,LPFR_P2_16,LPFR_P2_17,LPFR_P2_18,LPFR_P2_19,LPFR_P2_20,LPFR_P3_0,LPFR_P3_1,LPFR_P3_2,LPFR_P3_3,LPFR_P3_4,LPFR_P3_5,LPFR_P3_6,LPFR_P3_7,LPFR_P3_8,LPFR_P3_9,LPFR_P3_10,LPFR_P3_11,LPFR_P3_12,LPFR_P3_13,LPFR_P3_14,LPFR_P3_15,LPFR_P3_16,LPFR_P3_17,LPFR_P3_18,LPFR_P3_19,LPFR_P3_20,RPFR_P1_0,RPFR_P1_1,RPFR_P1_2,RPFR_P1_3,RPFR_P1_4,RPFR_P1_5,RPFR_P1_6,RPFR_P1_7,RPFR_P1_8,RPFR_P1_9,RPFR_P1_10,RPFR_P1_11,RPFR_P1_12,RPFR_P1_13,RPFR_P1_14,RPFR_P1_15,RPFR_P1_16,RPFR_P1_17,RPFR_P1_18,RPFR_P1_19,RPFR_P1_20,RPFR_P2_0,RPFR_P2_1,RPFR_P2_2,RPFR_P2_3,RPFR_P2_4,RPFR_P2_5,RPFR_P2_6,RPFR_P2_7,RPFR_P2_8,RPFR_P2_9,RPFR_P2_10,RPFR_P2_11,RPFR_P2_12,RPFR_P2_13,RPFR_P2_14,RPFR_P2_15,RPFR_P2_16,RPFR_P2_17,RPFR_P2_18,RPFR_P2_19,RPFR_P2_20,RPFR_P3_0,RPFR_P3_1,RPFR_P3_2,RPFR_P3_3,RPFR_P3_4,RPFR_P3_5,RPFR_P3_6,RPFR_P3_7,RPFR_P3_8,RPFR_P3_9,RPFR_P3_10,RPFR_P3_11,RPFR_P3_12,RPFR_P3_13,RPFR_P3_14,RPFR_P3_15,RPFR_P3_16,RPFR_P3_17,RPFR_P3_18,RPFR_P3_19,RPFR_P3_20,cluster_0,cluster_1,cluster_2,cluster_3,cluster_4,cluster_5,cluster_6,cluster_7,cluster_8,cluster_9,cluster_10,cluster_11,cluster_12,cluster_13,cluster_14,cluster_15,cluster_16,cluster_17,cluster_18,cluster_19,cluster_20,cluster_21,cluster_22,cluster_23,cluster_24,cluster_25
,cluster_26,cluster_27,cluster_28,cluster_29,cluster_30,cluster_31,cluster_32,cluster_33,cluster_34,cluster_35,cluster_36,cluster_37,cluster_38,cluster_39,cluster_40,cluster_41,cluster_42,cluster_43,cluster_44,cluster_45,cluster_46,cluster_47,cluster_48,cluster_49,cluster_50,cluster_51,cluster_52,cluster_53,cluster_54,cluster_55,cluster_56,cluster_57,cluster_58,cluster_59,cluster_60,cluster_61,cluster_62,cluster_63,cluster_64,cluster_65,cluster_66,cluster_67,cluster_68,cluster_69,cluster_70,cluster_71,cluster_72,cluster_73,cluster_74,cluster_75,cluster_76,cluster_77,cluster_78,cluster_79,cluster_80,cluster_81,cluster_82,cluster_83,cluster_84,cluster_85,cluster_86,cluster_87,cluster_88,cluster_89,cluster_90,cluster_91,cluster_92,cluster_93,cluster_94,cluster_95,cluster_96,cluster_97,cluster_98,cluster_99,cluster_100,cluster_101,cluster_102,cluster_103,cluster_104,cluster_105,cluster_106,cluster_107,cluster_108,cluster_109,cluster_110,cluster_111,cluster_112,cluster_113,cluster_114,cluster_115,cluster_116,cluster_117,cluster_118,cluster_119,cluster_120,cluster_121,cluster_122,cluster_123,cluster_124,cluster_125,cluster_126,cluster_127,cluster_128,cluster_129,cluster_130,cluster_131,cluster_132,cluster_133,cluster_134,cluster_135,cluster_136,cluster_137,cluster_138,cluster_139,cluster_140,cluster_141,cluster_142,cluster_143,cluster_144,cluster_145,cluster_146,cluster_147,cluster_148,cluster_149,cluster_150,cluster_151,cluster_152,cluster_153,cluster_154,cluster_155,cluster_156,cluster_157,cluster_158,cluster_159,cluster_160,cluster_161,cluster_162,cluster_163,cluster_164,cluster_165,cluster_166,cluster_167,cluster_168,cluster_169,cluster_170,cluster_171,cluster_172,cluster_173,cluster_174,cluster_175,cluster_176,cluster_177,cluster_178,cluster_179,cluster_180,cluster_181,cluster_182,cluster_183,cluster_184,cluster_185,cluster_186,cluster_187,cluster_188,cluster_189,cluster_190,cluster_191,cluster_192,cluster_193,cluster_194,cluster_195,cluster_196,cluster_197,cluster_1
98,cluster_199,cluster_200,cluster_201,cluster_202,cluster_203,cluster_204,cluster_205,cluster_206,cluster_207,cluster_208,cluster_209,cluster_210,cluster_211,cluster_212,cluster_213,cluster_214,cluster_215,cluster_216,cluster_217,cluster_218,cluster_219,cluster_220,cluster_221,cluster_222,cluster_223,cluster_224,cluster_225,cluster_226,cluster_227,cluster_228,cluster_229,cluster_230,cluster_231,cluster_232,cluster_233,cluster_234,cluster_235,cluster_236,cluster_237,cluster_238,cluster_239,cluster_240,cluster_241,cluster_242,cluster_243,cluster_244,cluster_245,cluster_246,cluster_247,cluster_248,cluster_249,cluster_250,cluster_251,cluster_252,cluster_253,cluster_254,cluster_255,cluster_256,cluster_257,cluster_258,cluster_259,cluster_260,cluster_261,cluster_262,cluster_263,cluster_264,cluster_265,cluster_266,cluster_267,cluster_268,cluster_269,cluster_270,cluster_271,cluster_272,cluster_273,cluster_274,cluster_275,cluster_276,cluster_277,cluster_278,p1,p2,p3,p4,p5,p6,p7,p8,p9,peptide_nunique,unique_rate,core_atfidf,core_ctfidf,core_dtfidf,core_etfidf,core_ftfidf,core_gtfidf,core_htfidf,core_itfidf,core_ktfidf,core_ltfidf,core_mtfidf,core_ntfidf,core_ptfidf,core_qtfidf,core_rtfidf,core_stfidf,core_ttfidf,core_vtfidf,core_wtfidf,core_ytfidf,peptide_0,peptide_1,peptide_2,peptide_3,peptide_4,peptide_5,peptide_6,peptide_7,peptide_8,peptide_9,peptide_10,peptide_11,peptide_12,peptide_13,peptide_14,peptide_15,peptide_16,peptide_17,peptide_18,peptide_19,peptide_20,peptide_21,peptide_22,peptide_23,peptide_24,peptide_25,peptide_26,peptide_27,peptide_28,peptide_29,peptide_30,peptide_31,peptide_32,peptide_33,peptide_34,peptide_35,peptide_36,peptide_37,peptide_38,peptide_39,peptide_40,peptide_41,peptide_42,peptide_43,peptide_44,peptide_45,peptide_46,peptide_47,peptide_48,peptide_49,peptide_50,peptide_51,peptide_52,peptide_53,peptide_54,peptide_55,peptide_56,peptide_57,peptide_58,peptide_59,peptide_60,peptide_61,peptide_62,peptide_63,peptide_64,peptide_65,peptide_66,peptide_67,pept
ide_68,peptide_69,peptide_70,peptide_71,peptide_72,peptide_73,peptide_74,peptide_75,peptide_76,peptide_77,peptide_78,peptide_79,exon1_0,exon1_1,exon1_2,exon1_3,exon1_4,exon1_5,exon1_6,exon1_7,exon1_8,exon1_9,exon1_10,exon1_11,exon1_12,exon1_13,exon1_14,exon1_15,exon1_16,exon1_17,exon1_18,exon1_19,exon1_20,exon1_21,exon1_22,exon1_23,exon1_24,exon1_25,exon1_26,exon1_27,exon1_28,exon1_29,exon2_0,exon2_1,exon2_2,exon2_3,exon2_4,exon2_5,exon2_6,exon2_7,exon2_8,exon2_9,exon2_10,exon2_11,exon2_12,exon2_13,exon2_14,exon2_15,exon2_16,exon2_17,exon2_18,exon2_19,exon2_20,exon2_21,exon2_22,exon2_23,exon2_24,exon2_25,exon2_26,exon2_27,exon2_28,exon2_29,exon3_0,exon3_1,exon3_2,exon3_3,exon3_4,exon3_5,exon3_6,exon3_7,exon3_8,exon3_9,exon3_10,exon3_11,exon3_12,exon3_13,exon3_14,exon3_15,exon3_16,exon3_17,exon3_18,exon3_19,exon3_20,exon3_21,exon3_22,exon3_23,exon3_24,exon3_25,exon3_26,exon3_27,exon3_28,exon3_29,exon4_0,exon4_1,exon4_2,exon4_3,exon4_4,exon4_5,exon4_6,exon4_7,exon4_8,exon4_9,exon4_10,exon4_11,exon4_12,exon4_13,exon4_14,exon4_15,exon4_16,exon4_17,exon4_18,exon4_19,exon4_20,exon4_21,exon4_22,exon4_23,exon4_24,exon4_25,exon4_26,exon4_27,exon4_28,exon4_29,exon5_0,exon5_1,exon5_2,exon5_3,exon5_4,exon5_5,exon5_6,exon5_7,exon5_8,exon5_9,exon5_10,exon5_11,exon5_12,exon5_13,exon5_14,exon5_15,exon5_16,exon5_17,exon5_18,exon5_19,exon5_20,exon5_21,exon5_22,exon5_23,exon5_24,exon5_25,exon5_26,exon5_27,exon5_28,exon5_29,exon6_0,exon6_1,exon6_2,exon6_3,exon6_4,exon6_5,exon6_6,exon6_7,exon6_8,exon6_9,exon6_10,exon6_11,exon6_12,exon6_13,exon6_14,exon6_15,exon6_16,exon6_17,exon6_18,exon6_19,exon6_20,exon6_21,exon6_22,exon6_23,exon6_24,exon6_25,exon6_26,exon6_27,exon6_28,exon6_29,exon_0,exon_1,exon_2,exon_3,exon_4,exon_5,exon_6,exon_7,exon_8,exon_9,exon_10,exon_11,exon_12,exon_13,exon_14,exon_15,exon_16,exon_17,exon_18,exon_19,exon_20,exon_21,exon_22,exon_23,exon_24,exon_25,exon_26,exon_27,exon_28,exon_29
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.765957,0.765957,0.679245,0.679245,0.679245,0.679245,0.679245,0.679245,0.679245,0.055556,0.090909,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.765957,0.765957,0.679245,0.679245,0.679245,0.679245,0.679245,0.679245,0.679245,0.055556,0.090909,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [6]:
# (rows, columns) of the feature matrix after de-duplication and removal of 'aff'.
data.shape

(974576, 973)

In [7]:
# Load ./feature_selected.csv into `zxc`. Unlike the other inputs, this file is
# read from the notebook's working directory rather than ./Data.
# NOTE(review): `zxc` is only previewed in the next cell here; a descriptive
# name would make its purpose clearer.
zxc = pd.read_csv('./feature_selected.csv')

In [8]:
# Preview the first five rows of the table loaded from feature_selected.csv.
zxc.head()

Unnamed: 0,hla_0,hla_2,hla_3,hla_4,hla_5,hla_6,hla_7,hla_8,hla_9,hla_12,hla_13,hla_14,hla_17,hla_18,hla_19,hla_21,hla_22,hla_23,hla_25,hla_28,hla_29,hla_30,hla_31,hla_32,hla_33,hla_34,hla_36,hla_37,hla_38,hla_39,hla_40,hla_41,hla_42,hla_43,hla_44,hla_45,hla_46,hla_47,hla_48,hla_49,hla_50,hla_51,hla_52,hla_53,hla_54,hla_55,hla_56,hla_57,hla_59,hla_60,hla_62,hla_63,hla_64,hla_65,hla_67,hla_68,hla_71,hla_72,hla_73,hla_74,hla_75,hla_76,hla_77,hla_79,allele_type_0,allele_type_1,allele_type_2,allele_type_3,core_P1_1,core_P1_2,core_P1_3,core_P1_4,core_P1_5,core_P1_6,core_P1_7,core_P1_8,core_P1_9,core_P1_10,core_P1_11,core_P1_12,core_P1_13,core_P1_14,core_P1_15,core_P1_16,core_P1_17,core_P1_18,core_P1_19,core_P1_20,core_P2_1,core_P2_2,core_P2_3,core_P2_4,core_P2_5,core_P2_6,core_P2_7,core_P2_8,core_P2_9,core_P2_10,core_P2_11,core_P2_12,core_P2_13,core_P2_14,core_P2_15,core_P2_16,core_P2_17,core_P2_18,core_P2_19,core_P2_20,core_P3_1,core_P3_2,core_P3_3,core_P3_4,core_P3_5,core_P3_6,core_P3_7,core_P3_8,core_P3_9,core_P3_10,core_P3_11,core_P3_12,core_P3_13,core_P3_14,core_P3_15,core_P3_16,core_P3_17,core_P3_18,core_P3_19,core_P3_20,core_P4_1,core_P4_2,core_P4_3,core_P4_4,core_P4_5,core_P4_6,core_P4_7,core_P4_8,core_P4_9,core_P4_10,core_P4_11,core_P4_12,core_P4_13,core_P4_14,core_P4_15,core_P4_16,core_P4_17,core_P4_18,core_P4_19,core_P4_20,core_P5_1,core_P5_2,core_P5_3,core_P5_4,core_P5_5,core_P5_6,core_P5_7,core_P5_8,core_P5_9,core_P5_10,core_P5_11,core_P5_12,core_P5_13,core_P5_14,core_P5_15,core_P5_16,core_P5_17,core_P5_18,core_P5_19,core_P5_20,core_P6_1,core_P6_2,core_P6_3,core_P6_4,core_P6_5,core_P6_6,core_P6_7,core_P6_8,core_P6_9,core_P6_10,core_P6_11,core_P6_12,core_P6_13,core_P6_14,core_P6_15,core_P6_16,core_P6_17,core_P6_18,core_P6_19,core_P6_20,core_P7_1,core_P7_2,core_P7_3,core_P7_4,core_P7_5,core_P7_6,core_P7_7,core_P7_8,core_P7_9,core_P7_10,core_P7_11,core_P7_12,core_P7_13,core_P7_14,core_P7_15,core_P7_16,core_P7_17,core_P7_18,core_P7_19,core_P7_20,core_P8_1,core_P8
_2,core_P8_3,core_P8_4,core_P8_5,core_P8_6,core_P8_7,core_P8_8,core_P8_9,core_P8_10,core_P8_11,core_P8_12,core_P8_13,core_P8_14,core_P8_15,core_P8_16,core_P8_17,core_P8_18,core_P8_19,core_P8_20,core_P9_1,core_P9_2,core_P9_3,core_P9_4,core_P9_5,core_P9_6,core_P9_7,core_P9_8,core_P9_9,core_P9_10,core_P9_11,core_P9_12,core_P9_13,core_P9_14,core_P9_15,core_P9_16,core_P9_17,core_P9_18,core_P9_19,core_P9_20,LPFR_P1_0,LPFR_P1_1,LPFR_P1_2,LPFR_P1_3,LPFR_P1_4,LPFR_P1_5,LPFR_P1_6,LPFR_P1_7,LPFR_P1_8,LPFR_P1_9,LPFR_P1_10,LPFR_P1_11,LPFR_P1_12,LPFR_P1_13,LPFR_P1_14,LPFR_P1_15,LPFR_P1_16,LPFR_P1_17,LPFR_P1_18,LPFR_P1_19,LPFR_P1_20,LPFR_P2_0,LPFR_P2_1,LPFR_P2_2,LPFR_P2_3,LPFR_P2_4,LPFR_P2_5,LPFR_P2_6,LPFR_P2_7,LPFR_P2_8,LPFR_P2_9,LPFR_P2_10,LPFR_P2_11,LPFR_P2_12,LPFR_P2_13,LPFR_P2_14,LPFR_P2_15,LPFR_P2_16,LPFR_P2_17,LPFR_P2_18,LPFR_P2_19,LPFR_P2_20,LPFR_P3_0,LPFR_P3_1,LPFR_P3_2,LPFR_P3_3,LPFR_P3_4,LPFR_P3_5,LPFR_P3_6,LPFR_P3_7,LPFR_P3_8,LPFR_P3_9,LPFR_P3_10,LPFR_P3_11,LPFR_P3_12,LPFR_P3_13,LPFR_P3_14,LPFR_P3_15,LPFR_P3_16,LPFR_P3_17,LPFR_P3_18,LPFR_P3_19,LPFR_P3_20,RPFR_P1_0,RPFR_P1_1,RPFR_P1_2,RPFR_P1_3,RPFR_P1_4,RPFR_P1_5,RPFR_P1_6,RPFR_P1_7,RPFR_P1_8,RPFR_P1_9,RPFR_P1_10,RPFR_P1_11,RPFR_P1_12,RPFR_P1_13,RPFR_P1_14,RPFR_P1_15,RPFR_P1_16,RPFR_P1_17,RPFR_P1_18,RPFR_P1_19,RPFR_P1_20,RPFR_P2_0,RPFR_P2_1,RPFR_P2_2,RPFR_P2_3,RPFR_P2_4,RPFR_P2_5,RPFR_P2_6,RPFR_P2_7,RPFR_P2_8,RPFR_P2_9,RPFR_P2_10,RPFR_P2_11,RPFR_P2_12,RPFR_P2_13,RPFR_P2_14,RPFR_P2_15,RPFR_P2_16,RPFR_P2_17,RPFR_P2_18,RPFR_P2_19,RPFR_P2_20,RPFR_P3_0,RPFR_P3_1,RPFR_P3_2,RPFR_P3_3,RPFR_P3_4,RPFR_P3_5,RPFR_P3_6,RPFR_P3_7,RPFR_P3_8,RPFR_P3_9,RPFR_P3_10,RPFR_P3_11,RPFR_P3_12,RPFR_P3_13,RPFR_P3_14,RPFR_P3_15,RPFR_P3_16,RPFR_P3_17,RPFR_P3_18,RPFR_P3_19,RPFR_P3_20,cluster_0,cluster_1,cluster_2,cluster_3,cluster_4,cluster_5,cluster_6,cluster_7,cluster_8,cluster_9,cluster_10,cluster_11,cluster_12,cluster_13,cluster_14,cluster_15,cluster_16,cluster_17,cluster_18,cluster_19,cluster_20,cluster_21,cluster_22,cluster_23,cluster_24,clus
ter_25,cluster_26,cluster_27,cluster_28,cluster_29,cluster_30,cluster_31,cluster_32,cluster_33,cluster_34,cluster_35,cluster_36,cluster_37,cluster_38,cluster_39,cluster_40,cluster_41,cluster_42,cluster_43,cluster_44,cluster_45,cluster_46,cluster_47,cluster_48,cluster_49,cluster_50,cluster_51,cluster_52,cluster_53,cluster_54,cluster_55,cluster_56,cluster_57,cluster_58,cluster_59,cluster_60,cluster_61,cluster_62,cluster_63,cluster_64,cluster_65,cluster_66,cluster_67,cluster_68,cluster_69,cluster_70,cluster_71,cluster_72,cluster_73,cluster_74,cluster_75,cluster_76,cluster_77,cluster_78,cluster_79,cluster_80,cluster_81,cluster_82,cluster_83,cluster_84,cluster_85,cluster_86,cluster_87,cluster_88,cluster_89,cluster_90,cluster_91,cluster_92,cluster_93,cluster_94,cluster_95,cluster_96,cluster_97,cluster_98,cluster_99,cluster_100,cluster_101,cluster_102,cluster_103,cluster_104,cluster_105,cluster_106,cluster_107,cluster_108,cluster_109,cluster_110,cluster_111,cluster_112,cluster_113,cluster_114,cluster_115,cluster_116,cluster_117,cluster_118,cluster_119,cluster_120,cluster_121,cluster_122,cluster_123,cluster_124,cluster_125,cluster_126,cluster_127,cluster_128,cluster_129,cluster_130,cluster_131,cluster_132,cluster_133,cluster_134,cluster_135,cluster_136,cluster_137,cluster_138,cluster_139,cluster_140,cluster_141,cluster_142,cluster_143,cluster_144,cluster_145,cluster_146,cluster_147,cluster_148,cluster_149,cluster_150,cluster_151,cluster_152,cluster_153,cluster_154,cluster_155,cluster_156,cluster_157,cluster_158,cluster_159,cluster_160,cluster_161,cluster_162,cluster_163,cluster_164,cluster_165,cluster_166,cluster_167,cluster_168,cluster_169,cluster_170,cluster_171,cluster_172,cluster_173,cluster_174,cluster_175,cluster_176,cluster_177,cluster_178,cluster_179,cluster_180,cluster_181,cluster_182,cluster_183,cluster_184,cluster_185,cluster_186,cluster_187,cluster_188,cluster_189,cluster_190,cluster_191,cluster_192,cluster_193,cluster_194,cluster_195,cluster_196,cluster_197,clu
ster_198,cluster_199,cluster_200,cluster_201,cluster_202,cluster_203,cluster_204,cluster_205,cluster_206,cluster_207,cluster_208,cluster_209,cluster_210,cluster_211,cluster_212,cluster_213,cluster_214,cluster_215,cluster_216,cluster_217,cluster_218,cluster_219,cluster_220,cluster_221,cluster_222,cluster_223,cluster_224,cluster_225,cluster_226,cluster_227,cluster_228,cluster_229,cluster_230,cluster_231,cluster_232,cluster_233,cluster_234,cluster_235,cluster_236,cluster_237,cluster_238,cluster_239,cluster_240,cluster_241,cluster_242,cluster_243,cluster_244,cluster_245,cluster_246,cluster_247,cluster_248,cluster_249,cluster_250,cluster_251,cluster_252,cluster_253,cluster_254,cluster_255,cluster_256,cluster_257,cluster_258,cluster_259,cluster_260,cluster_261,cluster_262,cluster_263,cluster_264,cluster_265,cluster_266,cluster_267,cluster_268,cluster_269,cluster_270,cluster_271,cluster_272,cluster_273,cluster_274,cluster_275,cluster_276,cluster_277,cluster_278,aff,p1,p2,p3,p4,p5,p6,p7,p8,p9,peptide_nunique,unique_rate,core_atfidf,core_ctfidf,core_dtfidf,core_etfidf,core_ftfidf,core_gtfidf,core_htfidf,core_itfidf,core_ktfidf,core_ltfidf,core_mtfidf,core_ntfidf,core_ptfidf,core_qtfidf,core_rtfidf,core_stfidf,core_ttfidf,core_vtfidf,core_wtfidf,core_ytfidf,length,blosum_sum
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.324088,36,36,36,36,36,36,36,36,36,1,0.090909,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,11,324
1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.324088,36,36,36,36,36,36,36,36,36,1,0.090909,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,11,324
2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.324088,36,36,36,36,36,36,36,36,36,1,0.090909,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,11,324
3,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.129502,20,20,20,20,20,-1,8,8,1,6,0.4,0.8696,0.0,0.0,0.0,0.0,0.2037,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.407,0.1901,0.0,0.0,15,116
4,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0.129502,14,14,14,14,-4,6,6,0,-9,6,0.4,0.78,0.0,0.0,0.0,0.0,0.2283,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.4563,0.213,0.0,0.2932,15,55
