In [1]:
from __future__ import division

import os.path
import pickle
import sys, os
import time
from os.path import join, dirname, abspath
from pathlib import Path
from zipfile import ZipFile

import numpy as np
import pandas as pd
from sklearn import svm
from sklearn.metrics import classification_report
from sklearn.model_selection import GridSearchCV
from sklearn.model_selection import StratifiedKFold

import classification as cl
import feature_selection as fs

In [2]:
def load_data(beta_file='../GSE59685_betas2.csv.zip', info_file='info.csv.zip',
              beta_member='GSE59685_betas2.csv'):
    """Load the beta-value matrix and the sample annotation table.

    Parameters
    ----------
    beta_file : str
        Path to the zip archive holding the beta-value CSV.
    info_file : str
        Path to the zipped CSV with one annotation row per sample.
    beta_member : str
        Name of the CSV member inside ``beta_file``.

    Returns
    -------
    (betaqn, info) : tuple of pandas.DataFrame
        ``betaqn`` is the beta CSV transposed, so the CSV's column labels
        become the row index. ``info`` is the annotation table indexed by its
        second CSV column, with two derived columns added:

        * ``braak_bin`` -- 1 for ``braak_stage`` '5'/'6', 0 for '0'..'4';
          rows with any other value are left unset (NaN).
        * ``tissue`` -- short code derived from ``source_tissue``
          (EC, WB, FC, STG, CER).
    """
    beta_path = os.path.realpath(beta_file)
    with ZipFile(beta_path) as archive:
        # Inflate the recorded uncompressed size so the reader does not stop at
        # the size stored in the archive header.
        # NOTE(review): presumably a workaround for a wrong size field in this
        # particular archive -- confirm before removing.
        archive.getinfo(beta_member).file_size += (2 ** 64) - 1
        with archive.open(beta_member) as beta_handle:
            # File rows 1 and 2 (the two lines right after the header) are skipped.
            betaqn = pd.read_csv(beta_handle, skiprows=(1, 2), index_col=0, sep=',')
    betaqn = betaqn.T

    info = pd.read_csv(info_file, index_col=1, compression='zip', sep=',')
    # `axis` must be passed by keyword: the positional form is rejected by pandas 2.x.
    info = info.drop('Unnamed: 0', axis=1)

    # Binarise the Braak stage; stages are compared as strings.
    info.loc[info.braak_stage.isin(['5', '6']), 'braak_bin'] = 1
    info.loc[info.braak_stage.isin(['0', '1', '2', '3', '4']), 'braak_bin'] = 0

    tissue_codes = {
        'entorhinal cortex': 'EC',
        'whole blood': 'WB',
        'frontal cortex': 'FC',
        'superior temporal gyrus': 'STG',
        'cerebellum': 'CER',
    }
    for source_name, code in tissue_codes.items():
        info.loc[info.source_tissue == source_name, 'tissue'] = code
    return (betaqn, info)

In [3]:
# Load the beta-value matrix and the sample annotations once; the cells below read both.
betaqn, info = load_data()

In [6]:
# Tissue to analyse, given as one of the short codes load_data() stores in
# info.tissue ('EC', 'WB', 'FC', 'STG' or 'CER').
tissue = 'EC'

In [12]:
# Directory that holds the cached feature rankings and receives the result pickles.
save_file = os.path.realpath('../data_str_pr_general/')
# The evaluation loop runs the full hyper-parameter grid for the first
# `iters_big` held-out samples when more than `big_small` features are used, and
# for the first `iters_small` samples when fewer are used; later iterations
# reuse the values found during that warm-up.
iters_big = 10
iters_small = 30
big_small = 200
feat_sel = 't_test'

# Beta values of the selected tissue, without samples whose stage is 'Exclude'.
# (The name `ec` is historical: it holds whichever tissue `tissue` selects.)
ec = betaqn.loc[info[(info.tissue == tissue) & (info.braak_stage != 'Exclude')].index]
svm_accuracy = {}
samples = ec.shape[0]

# Feature-set sizes to evaluate.
features_num = [20]

features_file = save_file + "/features_%s_%s.p" % (tissue, feat_sel)
my_file = Path(features_file)
if my_file.is_file():
    # Close the handle deterministically instead of leaking it.
    # NOTE: pickle executes code on load; only open files produced by this project.
    with open(features_file, "rb") as features_handle:
        features_per_i = pickle.load(features_handle)
else:
    # `features_per_i` stays undefined here, so the evaluation loop will fail
    # unless the name already exists in the kernel.
    print('no features file')



In [36]:
# Leave-one-out evaluation of the RBF SVM for every feature-set size in
# `features_num`. For each held-out sample i the first `num` entries of
# features_per_i[i] are used as columns, the model is tuned on the remaining
# samples and the held-out sample is predicted.
# NOTE: SVM_rbf is defined in a cell further down this notebook; that cell has
# to be executed before this one.
for num in features_num:
    print(num)
    features_sel = dict.fromkeys(list(ec), 0)
    y_true = np.zeros(samples)
    y_pred_rbf = np.zeros(samples)
    c_val_rbf = np.zeros(samples)
    gamma_val_rbf = np.zeros(samples)

    # Number of leading iterations that search the full default grid. Using a
    # plain if/else means num == big_small is handled too (as a "small" run);
    # previously that case matched no branch and left every prediction at 0.
    is_big = num > big_small
    warmup_iters = iters_big if is_big else iters_small

    for i in range(samples):
        print('iteracion %d para %d features' % (i, num))
        held_out = ec.index[i]
        selected = features_per_i[i][0:num]

        start_time = time.time()
        # Select rows and columns in one step so the full-width training
        # matrix is never materialised.
        train = ec.loc[ec.index != held_out, selected]
        print("--- %s seconds for feature selection ---" % (time.time() - start_time))
        print('features selected')
        test = ec.loc[ec.index == held_out, selected]

        y_train = info['braak_bin'].loc[train.index]
        # Take the scalar explicitly; assigning a length-1 Series to an array
        # element relies on a conversion NumPy has deprecated.
        y_true[i] = info['braak_bin'].loc[test.index].iloc[0]

        if i < warmup_iters:
            print('entro primeros')
            fit_result = SVM_rbf(train, y_train, test)
        else:
            # After the warm-up, restrict the grid to the values that won so far.
            print('entro big iters' if is_big else 'entro small iters')
            fit_result = SVM_rbf(train, y_train, test,
                                 C_range=np.unique(c_val_rbf[0:warmup_iters]),
                                 gamma_range=np.unique(gamma_val_rbf[0:warmup_iters]))
        (y_pred_rbf[i], c_val_rbf[i], gamma_val_rbf[i]) = fit_result

    parameters = pd.DataFrame(
        {'C_rbf': c_val_rbf,
         'gamma_rbf': gamma_val_rbf,
         })
    with open(save_file + "/params_%s_%s_%d.p" % (tissue, feat_sel, num), "wb") as params_handle:
        pickle.dump(parameters, params_handle)

    predictions = pd.DataFrame(
        {'y_true': y_true,
         'y_rbf': y_pred_rbf,
         })
    with open(save_file + "/pred_%s_%s_%d.p" % (tissue, feat_sel, num), "wb") as pred_handle:
        pickle.dump(predictions, pred_handle)

20
iteracion 0 para 20 features
--- 0.009142875671386719 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:    6.4s finished


iteracion 1 para 20 features
--- 0.017201900482177734 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:    4.4s finished


iteracion 2 para 20 features
--- 0.003421783447265625 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:    6.1s finished


iteracion 3 para 20 features
--- 0.03354382514953613 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:    7.4s finished


iteracion 4 para 20 features
--- 0.014032125473022461 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:    5.4s finished


iteracion 5 para 20 features
--- 0.0310819149017334 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:    5.4s finished


iteracion 6 para 20 features
--- 0.0045430660247802734 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:   17.7s finished


iteracion 7 para 20 features
--- 0.0018851757049560547 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:    6.4s finished


iteracion 8 para 20 features
--- 0.0023369789123535156 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:    4.9s finished


iteracion 9 para 20 features
--- 0.0007150173187255859 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:    4.3s finished


iteracion 10 para 20 features
--- 0.0015552043914794922 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:    5.6s finished


iteracion 11 para 20 features
--- 0.0011191368103027344 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:    5.3s finished


iteracion 12 para 20 features
--- 0.00347900390625 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:    5.8s finished


iteracion 13 para 20 features
--- 0.004379987716674805 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:    5.9s finished


iteracion 14 para 20 features
--- 0.060801029205322266 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:    6.2s finished


iteracion 15 para 20 features
--- 0.00080108642578125 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:    6.4s finished


iteracion 16 para 20 features
--- 0.22652292251586914 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:   13.2s finished


iteracion 17 para 20 features
--- 0.0011820793151855469 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:    6.9s finished


iteracion 18 para 20 features
--- 0.0025968551635742188 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:    6.2s finished


iteracion 19 para 20 features
--- 0.0014498233795166016 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:    6.2s finished


iteracion 20 para 20 features
--- 0.0017158985137939453 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:    5.9s finished


iteracion 21 para 20 features
--- 0.011139154434204102 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:    7.9s finished


iteracion 22 para 20 features
--- 0.008589982986450195 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:    3.9s finished


iteracion 23 para 20 features
--- 0.012923955917358398 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:    5.4s finished


iteracion 24 para 20 features
--- 0.0016970634460449219 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:    7.9s finished


iteracion 25 para 20 features
--- 0.0031669139862060547 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:    6.0s finished


iteracion 26 para 20 features
--- 0.015290021896362305 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:    6.5s finished


iteracion 27 para 20 features
--- 0.011461019515991211 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:   17.5s finished


iteracion 28 para 20 features
--- 0.0015609264373779297 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:   10.0s finished


iteracion 29 para 20 features
--- 0.0018091201782226562 seconds for feature selection ---
features selected
entro primeros
SVM-rbf
Fitting 5 folds for each of 169 candidates, totalling 845 fits


[Parallel(n_jobs=1)]: Done 845 out of 845 | elapsed:    5.5s finished


iteracion 30 para 20 features
--- 0.0007379055023193359 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.8s finished


iteracion 31 para 20 features
--- 0.009780168533325195 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.5s finished


iteracion 32 para 20 features
--- 0.003515005111694336 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.5s finished


iteracion 33 para 20 features
--- 0.0298309326171875 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.4s finished


iteracion 34 para 20 features
--- 0.042088985443115234 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.2s finished


iteracion 35 para 20 features
--- 0.0014019012451171875 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.0s finished


iteracion 36 para 20 features
--- 0.030321121215820312 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.6s finished


iteracion 37 para 20 features
--- 0.006626129150390625 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.5s finished


iteracion 38 para 20 features
--- 0.0012309551239013672 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    3.1s finished


iteracion 39 para 20 features
--- 0.015469074249267578 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.8s finished


iteracion 40 para 20 features
--- 0.03830099105834961 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    4.5s finished


iteracion 41 para 20 features
--- 0.011389970779418945 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    3.3s finished


iteracion 42 para 20 features
--- 0.031147003173828125 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.3s finished


iteracion 43 para 20 features
--- 0.2305281162261963 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.7s finished


iteracion 44 para 20 features
--- 0.0009670257568359375 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.8s finished


iteracion 45 para 20 features
--- 0.1003570556640625 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.5s finished


iteracion 46 para 20 features
--- 0.0017368793487548828 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.7s finished


iteracion 47 para 20 features
--- 0.016302108764648438 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.6s finished


iteracion 48 para 20 features
--- 0.023194074630737305 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.3s finished


iteracion 49 para 20 features
--- 0.00992894172668457 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.7s finished


iteracion 50 para 20 features
--- 0.015205860137939453 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    5.7s finished


iteracion 51 para 20 features
--- 0.040879011154174805 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    3.3s finished


iteracion 52 para 20 features
--- 0.05603599548339844 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    3.2s finished


iteracion 53 para 20 features
--- 0.03864693641662598 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    3.7s finished


iteracion 54 para 20 features
--- 0.03295612335205078 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.8s finished


iteracion 55 para 20 features
--- 0.010573148727416992 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    3.1s finished


iteracion 56 para 20 features
--- 0.04450678825378418 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.5s finished


iteracion 57 para 20 features
--- 0.0407559871673584 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.8s finished


iteracion 58 para 20 features
--- 0.002814054489135742 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.7s finished


iteracion 59 para 20 features
--- 0.04121994972229004 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.8s finished


iteracion 60 para 20 features
--- 0.1574239730834961 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.5s finished


iteracion 61 para 20 features
--- 0.002679109573364258 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.9s finished


iteracion 62 para 20 features
--- 0.020257949829101562 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.4s finished


iteracion 63 para 20 features
--- 0.08763313293457031 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.9s finished


iteracion 64 para 20 features
--- 0.002440929412841797 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.8s finished


iteracion 65 para 20 features
--- 0.2342820167541504 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.5s finished


iteracion 66 para 20 features
--- 0.0024709701538085938 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.6s finished


iteracion 67 para 20 features
--- 0.016665935516357422 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.9s finished


iteracion 68 para 20 features
--- 0.08408403396606445 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.4s finished


iteracion 69 para 20 features
--- 0.019877910614013672 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.0s finished


iteracion 70 para 20 features
--- 0.028953075408935547 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.8s finished


iteracion 71 para 20 features
--- 0.036370038986206055 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.1s finished


iteracion 72 para 20 features
--- 0.002936124801635742 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:   14.8s finished


iteracion 73 para 20 features
--- 0.0016360282897949219 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.9s finished


iteracion 74 para 20 features
--- 0.0013289451599121094 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.4s finished


iteracion 75 para 20 features
--- 0.0008039474487304688 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.8s finished


iteracion 76 para 20 features
--- 0.0009849071502685547 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.8s finished


iteracion 77 para 20 features
--- 0.0014851093292236328 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.9s finished


iteracion 78 para 20 features
--- 0.000762939453125 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.6s finished


iteracion 79 para 20 features
--- 0.0007588863372802734 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.8s finished


iteracion 80 para 20 features
--- 0.0021088123321533203 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.6s finished


iteracion 81 para 20 features
--- 0.0009260177612304688 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.1s finished


iteracion 82 para 20 features
--- 0.036791086196899414 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.9s finished


iteracion 83 para 20 features
--- 0.0012309551239013672 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.9s finished


iteracion 84 para 20 features
--- 0.055280208587646484 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.4s finished


iteracion 85 para 20 features
--- 0.11529898643493652 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    3.3s finished


iteracion 86 para 20 features
--- 0.023931026458740234 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.2s finished


iteracion 87 para 20 features
--- 0.025162935256958008 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.8s finished


iteracion 88 para 20 features
--- 0.010129928588867188 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.0s finished


iteracion 89 para 20 features
--- 0.0008428096771240234 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.0s finished


iteracion 90 para 20 features
--- 0.04520988464355469 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.9s finished


iteracion 91 para 20 features
--- 0.027888059616088867 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.6s finished


iteracion 92 para 20 features
--- 0.0015149116516113281 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.1s finished


iteracion 93 para 20 features
--- 0.02198004722595215 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.3s finished


iteracion 94 para 20 features
--- 0.00518798828125 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.5s finished


iteracion 95 para 20 features
--- 0.014066934585571289 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    3.0s finished


iteracion 96 para 20 features
--- 0.02188396453857422 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    3.1s finished


iteracion 97 para 20 features
--- 0.01800084114074707 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    3.1s finished


iteracion 98 para 20 features
--- 0.14531588554382324 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.2s finished


iteracion 99 para 20 features
--- 0.029806852340698242 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.3s finished


iteracion 100 para 20 features
--- 0.0023031234741210938 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    2.1s finished


iteracion 101 para 20 features
--- 0.03101801872253418 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.8s finished


iteracion 102 para 20 features
--- 0.025790929794311523 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.8s finished


iteracion 103 para 20 features
--- 0.004480123519897461 seconds for feature selection ---
features selected
entro small iters
SVM-rbf
Fitting 5 folds for each of 64 candidates, totalling 320 fits


[Parallel(n_jobs=1)]: Done 320 out of 320 | elapsed:    1.7s finished


KeyError: 'y_poly'

In [None]:
# Reload the predictions written by the evaluation loop.
# `num` is the loop variable left over from that cell, so this loads the
# result for the last feature-set size that was evaluated.
save_file = os.path.realpath('../data_str_pr_general/')
tissue = 'EC'
feat_sel = 't_test'
# NOTE: pickle executes code on load; only open files produced by this project.
with open(save_file + "/pred_%s_%s_%d.p" % (tissue, feat_sel, num), "rb") as pred_handle:
    predictionsNOW = pickle.load(pred_handle)

In [None]:
# Load the predictions stored under ../DATA/t_test for the same tissue,
# feature-selection method and `num`.
# NOTE: this rebinds `save_file`; cells run afterwards will see the new directory.
save_file = os.path.realpath('../DATA/t_test')
tissue = 'EC'
feat_sel = 't_test'
# NOTE: pickle executes code on load; only open files produced by this project.
with open(save_file + "/pred_%s_%s_%d.p" % (tissue, feat_sel, num), "rb") as pred_handle:
    predictionsBEF = pickle.load(pred_handle)

In [31]:
def SVM_rbf(train, y_train, test, C_range = np.logspace(-2, 10, 13), gamma_range = np.logspace(-9, 3, 13),
            cv=5, random_state=1234):
    """Tune an RBF-kernel SVC by grid search and predict the first row of ``test``.

    Parameters
    ----------
    train : feature matrix used for fitting.
    y_train : labels aligned with the rows of ``train``.
    test : feature matrix to predict; only the prediction for its first row
        is returned.
    C_range, gamma_range : candidate values for ``C`` and ``gamma``. A single
        scalar is accepted as well and treated as a one-element grid.
    cv : cross-validation setting forwarded to ``GridSearchCV``.
    random_state : seed forwarded to ``svm.SVC``.

    Returns
    -------
    (y_rbf, c_rbf, gamma_rbf) : the predicted label for ``test``'s first row
        and the ``C`` / ``gamma`` values selected by the grid search.
    """
    print('SVM-rbf')
    param_grid = [{
        'C': np.atleast_1d(C_range),
        'gamma': np.atleast_1d(gamma_range),
        'kernel': ['rbf'],
    }]

    estimator = svm.SVC(random_state=random_state)
    clf = GridSearchCV(estimator, param_grid, cv=cv, verbose=1)
    clf.fit(train, y_train)

    y_rbf = clf.predict(test)[0]
    best = clf.best_params_
    return (y_rbf, best['C'], best['gamma'])