# Spurious Correlations of Highly Dimensional Big Data

This notebook aims to show how PCA and random projection can solve the problem of spurious correlations in Big Data.

In [1]:
import numpy as np
import pandas as pd
from sklearn.decomposition import PCA
from sklearn import random_projection
from sklearn.utils import shuffle

## DataFrame Creation

In [2]:
# User-defined parameters (edit here to resize the experiment)
#   x: number of rows of the full DataFrame (df)
#   y: number of columns of the full DataFrame (df)
#   z: number of rows kept in the reduced DataFrame (df2)
x, y, z = 5000, 100_000, 500

In [3]:
# Build the full DataFrame: x rows by y columns of random samples.
# NOTE: no random seed is set in this cell, so the values differ on every run.
df = pd.DataFrame(data=np.random.random_sample(size=(x, y)))
df

Unnamed: 0,0,1,2,3,4,5,6,7,8,9,...,99990,99991,99992,99993,99994,99995,99996,99997,99998,99999
0,0.558074,0.146873,0.194376,0.775783,0.683251,0.415910,0.340106,0.893966,0.838358,0.766523,...,0.533803,0.196517,0.302158,0.683084,0.727478,0.261291,0.675339,0.036686,0.512563,0.821115
1,0.442975,0.364266,0.120413,0.392387,0.982486,0.040099,0.283628,0.353170,0.304411,0.469894,...,0.463385,0.914663,0.328172,0.743567,0.704333,0.022282,0.665417,0.996602,0.847563,0.983614
2,0.108512,0.277351,0.034606,0.269334,0.280282,0.536049,0.486009,0.073816,0.669429,0.934776,...,0.596549,0.925016,0.291458,0.701571,0.498374,0.949404,0.631273,0.315561,0.425863,0.435383
3,0.057350,0.842868,0.694966,0.368945,0.094541,0.040207,0.452919,0.964794,0.804167,0.170156,...,0.440702,0.743454,0.098431,0.422255,0.680113,0.605082,0.275792,0.664262,0.053862,0.197751
4,0.653964,0.246600,0.604770,0.901564,0.047478,0.560173,0.639300,0.952426,0.284205,0.401732,...,0.574574,0.361121,0.949710,0.169760,0.620968,0.796997,0.795930,0.571932,0.488411,0.593988
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
4995,0.024019,0.349027,0.923871,0.741608,0.551494,0.840439,0.074507,0.821145,0.891022,0.329218,...,0.166387,0.334517,0.570511,0.194337,0.164196,0.977888,0.630438,0.277733,0.284135,0.757116
4996,0.604995,0.721532,0.289859,0.904756,0.457525,0.871019,0.737033,0.930697,0.358638,0.722931,...,0.182380,0.602360,0.131831,0.647140,0.268863,0.985441,0.767758,0.425082,0.987190,0.401223
4997,0.805926,0.331434,0.326477,0.134768,0.858607,0.174894,0.569535,0.041845,0.568255,0.932867,...,0.565931,0.395334,0.043295,0.720348,0.453616,0.694472,0.302853,0.840466,0.777154,0.166080
4998,0.320861,0.070816,0.559053,0.258198,0.232864,0.538174,0.686964,0.512688,0.280173,0.505906,...,0.594987,0.293719,0.556181,0.359171,0.176295,0.725837,0.269820,0.331039,0.664191,0.070739


To assess the correlations between the different parameters, the correlation between the column with index 0 and each of the next 1000 columns (columns 1 to 1000) is computed.

In [4]:
# Split the full DataFrame: column 0 is the reference variable (Y) and every
# other column is a candidate variable (X).
X_df = df.drop(columns=0)
Y_df = df[0]
print(Y_df)

# Flatten Y into a 1-D NumPy array so it can be passed directly to np.corrcoef
Y_df = np.array(Y_df).reshape(-1)
print(X_df.shape,Y_df.shape)

list_titles = X_df.columns

# Absolute correlation coefficient between column 0 and each of the first
# 1000 remaining columns.
list_corr_df1 = []
for i in list_titles[0:1000]:
    print(i)
    # Compute the coefficient once and reuse it for both the stored absolute
    # value and the printed (signed) value.
    corr = np.corrcoef(Y_df, X_df[i])[0][1]
    list_corr_df1.append(abs(corr))
    print('Correlation matrix for column 0 and and column' + str(i) + ': ' + str(corr))

0       0.558074
1       0.442975
2       0.108512
3       0.057350
4       0.653964
          ...   
4995    0.024019
4996    0.604995
4997    0.805926
4998    0.320861
4999    0.861687
Name: 0, Length: 5000, dtype: float64
(5000, 99999) (5000,)
1
Correlation matrix for column 0 and and column1: 0.02314597436713407
2
Correlation matrix for column 0 and and column2: -0.00793328194225734
3
Correlation matrix for column 0 and and column3: 7.685934515822803e-05
4
Correlation matrix for column 0 and and column4: 0.0007676901919735704
5
Correlation matrix for column 0 and and column5: -0.0025477726765214966
6
Correlation matrix for column 0 and and column6: 0.013882617550794623
7
Correlation matrix for column 0 and and column7: 0.021617773510114135
8
Correlation matrix for column 0 and and column8: -0.011054912345790615
9
Correlation matrix for column 0 and and column9: -0.00400912123743751
10
Correlation matrix for column 0 and and column10: 0.010761658277739606
11
Correlation matrix for c

Correlation matrix for column 0 and and column121: 0.009968816096632529
122
Correlation matrix for column 0 and and column122: 0.001721578742275054
123
Correlation matrix for column 0 and and column123: 0.00748899755205426
124
Correlation matrix for column 0 and and column124: -0.01148880163275305
125
Correlation matrix for column 0 and and column125: -0.015305823171607317
126
Correlation matrix for column 0 and and column126: -0.035454222514670335
127
Correlation matrix for column 0 and and column127: 0.0020678737944470654
128
Correlation matrix for column 0 and and column128: 0.022153343975135464
129
Correlation matrix for column 0 and and column129: -0.001960640157669343
130
Correlation matrix for column 0 and and column130: -0.011617642562331694
131
Correlation matrix for column 0 and and column131: -0.007396535653491021
132
Correlation matrix for column 0 and and column132: 0.01490010304032045
133
Correlation matrix for column 0 and and column133: 0.013957406823177115
134
Correlat

Correlation matrix for column 0 and and column233: 0.0017148573825680228
234
Correlation matrix for column 0 and and column234: -0.013096200959906202
235
Correlation matrix for column 0 and and column235: 0.01091519783830241
236
Correlation matrix for column 0 and and column236: 0.010248630981762928
237
Correlation matrix for column 0 and and column237: 0.004198325797913436
238
Correlation matrix for column 0 and and column238: -0.0012321385404495406
239
Correlation matrix for column 0 and and column239: -0.014054927182070905
240
Correlation matrix for column 0 and and column240: 0.015614261149572609
241
Correlation matrix for column 0 and and column241: -0.010999885592766845
242
Correlation matrix for column 0 and and column242: -0.008008239692023859
243
Correlation matrix for column 0 and and column243: -0.012318366829122402
244
Correlation matrix for column 0 and and column244: 0.0050456051635646235
245
Correlation matrix for column 0 and and column245: 0.0030320262629882654
246
Cor

Correlation matrix for column 0 and and column362: 0.0036186226731378317
363
Correlation matrix for column 0 and and column363: 0.0065968690563527
364
Correlation matrix for column 0 and and column364: 0.012291226253869322
365
Correlation matrix for column 0 and and column365: 0.024231081550472097
366
Correlation matrix for column 0 and and column366: 0.0023601519267048053
367
Correlation matrix for column 0 and and column367: -0.0060422377517470125
368
Correlation matrix for column 0 and and column368: -0.002701646731318528
369
Correlation matrix for column 0 and and column369: 0.01412802319883795
370
Correlation matrix for column 0 and and column370: -0.032153585250971985
371
Correlation matrix for column 0 and and column371: -0.0006683746619211012
372
Correlation matrix for column 0 and and column372: 0.007114894773349186
373
Correlation matrix for column 0 and and column373: 0.007858430550023682
374
Correlation matrix for column 0 and and column374: 0.008214231283281082
375
Correla

Correlation matrix for column 0 and and column506: 0.014015458928741651
507
Correlation matrix for column 0 and and column507: 0.024831398971468955
508
Correlation matrix for column 0 and and column508: -0.003513662347713052
509
Correlation matrix for column 0 and and column509: 0.007958815446381565
510
Correlation matrix for column 0 and and column510: 0.015050552263589437
511
Correlation matrix for column 0 and and column511: -0.0037533101566501943
512
Correlation matrix for column 0 and and column512: 0.015246356361224504
513
Correlation matrix for column 0 and and column513: -0.028596882718534007
514
Correlation matrix for column 0 and and column514: 0.032596672469259555
515
Correlation matrix for column 0 and and column515: 0.03431889873040239
516
Correlation matrix for column 0 and and column516: 0.009623895617239243
517
Correlation matrix for column 0 and and column517: -0.014402835477116996
518
Correlation matrix for column 0 and and column518: 0.008378741628589825
519
Correlat

Correlation matrix for column 0 and and column657: 0.006184576397577933
658
Correlation matrix for column 0 and and column658: -0.029295326171021773
659
Correlation matrix for column 0 and and column659: 0.03675034520396087
660
Correlation matrix for column 0 and and column660: 0.0020881591867648666
661
Correlation matrix for column 0 and and column661: 0.015047874488220233
662
Correlation matrix for column 0 and and column662: -0.02353634784435567
663
Correlation matrix for column 0 and and column663: -0.0034815656425784863
664
Correlation matrix for column 0 and and column664: -0.000254759211676073
665
Correlation matrix for column 0 and and column665: 0.0033451852632964624
666
Correlation matrix for column 0 and and column666: -0.018172170569000626
667
Correlation matrix for column 0 and and column667: 0.042488208139293604
668
Correlation matrix for column 0 and and column668: -0.03130744482029388
669
Correlation matrix for column 0 and and column669: 0.030295963433716384
670
Correl

Correlation matrix for column 0 and and column801: 0.006104523394897101
802
Correlation matrix for column 0 and and column802: 0.002390324028809278
803
Correlation matrix for column 0 and and column803: 0.03411338491910348
804
Correlation matrix for column 0 and and column804: -0.011510419527216709
805
Correlation matrix for column 0 and and column805: -0.0011755085086974028
806
Correlation matrix for column 0 and and column806: -0.025928951509990375
807
Correlation matrix for column 0 and and column807: 0.006738370255015089
808
Correlation matrix for column 0 and and column808: -0.005454358887780953
809
Correlation matrix for column 0 and and column809: 0.004584966269030434
810
Correlation matrix for column 0 and and column810: -0.002724436064404247
811
Correlation matrix for column 0 and and column811: 0.008584719060744409
812
Correlation matrix for column 0 and and column812: -0.0028260387963211257
813
Correlation matrix for column 0 and and column813: -0.0031571222806395815
814
Cor

Correlation matrix for column 0 and and column932: -0.007141938869019415
933
Correlation matrix for column 0 and and column933: 0.004973174849529831
934
Correlation matrix for column 0 and and column934: 0.0023529423321722275
935
Correlation matrix for column 0 and and column935: -0.008581765136012541
936
Correlation matrix for column 0 and and column936: 0.014438548343306516
937
Correlation matrix for column 0 and and column937: 0.013658565347122335
938
Correlation matrix for column 0 and and column938: 0.015500914903683459
939
Correlation matrix for column 0 and and column939: 0.0029386698444804223
940
Correlation matrix for column 0 and and column940: -0.01300989274546147
941
Correlation matrix for column 0 and and column941: 0.00019852901172126783
942
Correlation matrix for column 0 and and column942: 0.0049681429013808285
943
Correlation matrix for column 0 and and column943: 0.013427158249238843
944
Correlation matrix for column 0 and and column944: -0.008043913485396643
945
Corr

To see whether the correlations between the different parameters do indeed increase with the data size, the original DataFrame is compared to a subset DataFrame that contains only the first z rows of the original DataFrame. If the correlations in the original DataFrame are higher than in the smaller DataFrame, this would show that the bigger the data size, the more frequent the spurious correlations.

In [5]:
# Reduced DataFrame: keep only the first z rows of the original DataFrame
df2 = df.head(z)
df2

Unnamed: 0,0,1,2,3,4,5,6,7,8,9,...,99990,99991,99992,99993,99994,99995,99996,99997,99998,99999
0,0.558074,0.146873,0.194376,0.775783,0.683251,0.415910,0.340106,0.893966,0.838358,0.766523,...,0.533803,0.196517,0.302158,0.683084,0.727478,0.261291,0.675339,0.036686,0.512563,0.821115
1,0.442975,0.364266,0.120413,0.392387,0.982486,0.040099,0.283628,0.353170,0.304411,0.469894,...,0.463385,0.914663,0.328172,0.743567,0.704333,0.022282,0.665417,0.996602,0.847563,0.983614
2,0.108512,0.277351,0.034606,0.269334,0.280282,0.536049,0.486009,0.073816,0.669429,0.934776,...,0.596549,0.925016,0.291458,0.701571,0.498374,0.949404,0.631273,0.315561,0.425863,0.435383
3,0.057350,0.842868,0.694966,0.368945,0.094541,0.040207,0.452919,0.964794,0.804167,0.170156,...,0.440702,0.743454,0.098431,0.422255,0.680113,0.605082,0.275792,0.664262,0.053862,0.197751
4,0.653964,0.246600,0.604770,0.901564,0.047478,0.560173,0.639300,0.952426,0.284205,0.401732,...,0.574574,0.361121,0.949710,0.169760,0.620968,0.796997,0.795930,0.571932,0.488411,0.593988
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
495,0.223368,0.881053,0.707576,0.971805,0.760852,0.317258,0.599083,0.975095,0.984770,0.299032,...,0.087753,0.318703,0.382462,0.169939,0.103677,0.893924,0.517671,0.374775,0.766880,0.478400
496,0.542535,0.141542,0.142608,0.527549,0.090314,0.595009,0.084914,0.887192,0.301638,0.215686,...,0.370532,0.894899,0.462810,0.385923,0.280016,0.783014,0.917456,0.302043,0.625849,0.431223
497,0.116178,0.456436,0.266922,0.059559,0.823246,0.586194,0.673686,0.796881,0.196431,0.277549,...,0.477552,0.939067,0.841834,0.433350,0.762524,0.580428,0.227161,0.804237,0.320367,0.175748
498,0.271197,0.090007,0.719916,0.879129,0.643429,0.360167,0.122288,0.580904,0.553362,0.307162,...,0.555936,0.224383,0.680516,0.039773,0.810634,0.373424,0.188701,0.103498,0.063140,0.111218


In [6]:
# Split the reduced DataFrame: column 0 is the reference variable (Y) and
# every other column is a candidate variable (X).
X_df2 = df2.drop(columns=0)
Y_df2 = df2[0]
print(Y_df2)

# Flatten Y into a 1-D NumPy array so it can be passed directly to np.corrcoef
Y_df2 = np.array(Y_df2).reshape(-1)
print(X_df2.shape,Y_df2.shape)

list_titles = X_df2.columns

# Absolute correlation coefficient between column 0 and each of the first
# 1000 remaining columns.
list_corr_df2 = []
for i in list_titles[0:1000]:
    print(i)
    # Compute the coefficient once and reuse it for both the stored absolute
    # value and the printed (signed) value.
    corr = np.corrcoef(Y_df2, X_df2[i])[0][1]
    list_corr_df2.append(abs(corr))
    print('Correlation matrix for column 0 and and column' + str(i) + ': ' + str(corr))

0      0.558074
1      0.442975
2      0.108512
3      0.057350
4      0.653964
         ...   
495    0.223368
496    0.542535
497    0.116178
498    0.271197
499    0.004604
Name: 0, Length: 500, dtype: float64
(500, 99999) (500,)
1
Correlation matrix for column 0 and and column1: -0.04364590526355567
2
Correlation matrix for column 0 and and column2: -0.0055245515283112966
3
Correlation matrix for column 0 and and column3: -0.010385792699257365
4
Correlation matrix for column 0 and and column4: -0.05984027637516156
5
Correlation matrix for column 0 and and column5: 0.0404859885455979
6
Correlation matrix for column 0 and and column6: -0.060615629959973015
7
Correlation matrix for column 0 and and column7: 0.0487985121910718
8
Correlation matrix for column 0 and and column8: -0.02420685559697924
9
Correlation matrix for column 0 and and column9: 0.06972571267298595
10
Correlation matrix for column 0 and and column10: 0.07590728747219251
11
Correlation matrix for column 0 and and colu

Correlation matrix for column 0 and and column235: 0.06597181536874756
236
Correlation matrix for column 0 and and column236: 0.050642143147879445
237
Correlation matrix for column 0 and and column237: 0.05677306474700845
238
Correlation matrix for column 0 and and column238: 0.014341181392526586
239
Correlation matrix for column 0 and and column239: 0.022933720664840316
240
Correlation matrix for column 0 and and column240: -0.08435118562599288
241
Correlation matrix for column 0 and and column241: 0.0546345806056442
242
Correlation matrix for column 0 and and column242: -0.010483817709018888
243
Correlation matrix for column 0 and and column243: -0.04254685573281812
244
Correlation matrix for column 0 and and column244: 0.01084381438773266
245
Correlation matrix for column 0 and and column245: -0.02196128060265268
246
Correlation matrix for column 0 and and column246: 0.05523482938214486
247
Correlation matrix for column 0 and and column247: 0.05567302265128125
248
Correlation matrix

Correlation matrix for column 0 and and column435: 0.00502223217649026
436
Correlation matrix for column 0 and and column436: -0.007231152648440345
437
Correlation matrix for column 0 and and column437: -0.013700800940102767
438
Correlation matrix for column 0 and and column438: 0.01730683019919483
439
Correlation matrix for column 0 and and column439: 0.047668911198249016
440
Correlation matrix for column 0 and and column440: 0.0015775185172652035
441
Correlation matrix for column 0 and and column441: 0.09953409641635926
442
Correlation matrix for column 0 and and column442: -0.014220720752179474
443
Correlation matrix for column 0 and and column443: -0.005166261789069203
444
Correlation matrix for column 0 and and column444: -0.06417224294460114
445
Correlation matrix for column 0 and and column445: 0.019335938855030568
446
Correlation matrix for column 0 and and column446: -0.02701797762531689
447
Correlation matrix for column 0 and and column447: 0.11279567897652293
448
Correlation

630
Correlation matrix for column 0 and and column630: -0.07230155247108959
631
Correlation matrix for column 0 and and column631: 0.06192658254413668
632
Correlation matrix for column 0 and and column632: -0.006880243128079215
633
Correlation matrix for column 0 and and column633: 0.04562853816914245
634
Correlation matrix for column 0 and and column634: 0.05716963704601371
635
Correlation matrix for column 0 and and column635: -0.011763428664171901
636
Correlation matrix for column 0 and and column636: 0.06793567208691782
637
Correlation matrix for column 0 and and column637: -0.0001575409789538901
638
Correlation matrix for column 0 and and column638: -0.0822720582754899
639
Correlation matrix for column 0 and and column639: -0.0646518231906961
640
Correlation matrix for column 0 and and column640: 0.018968485680824765
641
Correlation matrix for column 0 and and column641: -0.04567162929808356
642
Correlation matrix for column 0 and and column642: 0.0705561022029827
643
Correlation 

Correlation matrix for column 0 and and column860: -0.018868557966149828
861
Correlation matrix for column 0 and and column861: -0.03854968765836934
862
Correlation matrix for column 0 and and column862: -0.022215386568594418
863
Correlation matrix for column 0 and and column863: -0.05978527410724426
864
Correlation matrix for column 0 and and column864: -0.0014430139911228792
865
Correlation matrix for column 0 and and column865: 0.03862724110904599
866
Correlation matrix for column 0 and and column866: -0.023815487195569068
867
Correlation matrix for column 0 and and column867: -0.008445261643794954
868
Correlation matrix for column 0 and and column868: 0.10868469224621267
869
Correlation matrix for column 0 and and column869: 0.0011473546036171
870
Correlation matrix for column 0 and and column870: -0.010538466511511692
871
Correlation matrix for column 0 and and column871: -0.07577944133066478
872
Correlation matrix for column 0 and and column872: -0.028460947824938455
873
Correlat

We now compare, column by column, which of the two correlation lists holds the larger absolute correlation.

In [7]:
# Column-by-column comparison of the absolute correlations.
#   a: number of columns where the value from list_corr_df1 is larger
#   b: number of columns where the value from list_corr_df2 is larger
a = 0
b = 0
# Pair the two lists with zip instead of hard-coding their length (1000), so
# the cell keeps working if the number of compared columns changes.
for corr_df1, corr_df2 in zip(list_corr_df1, list_corr_df2):
    if abs(corr_df1) > abs(corr_df2):
        a += 1
    elif abs(corr_df1) < abs(corr_df2):
        b += 1
    else:
        # Tie: neither counter is incremented; a blank line is printed
        print()

print(a)
print(b)

207
793


In [8]:
# Count, for each list, the entries whose absolute correlation exceeds 0.01
a = sum(1 for corr in list_corr_df1 if abs(corr) > 0.01)
b = sum(1 for corr in list_corr_df2 if abs(corr) > 0.01)

# Report each count as a percentage of the corresponding list length
print("Percentage of correlations in df1:",(a/len(list_corr_df1)*100),"%")

print("Percentage of correlations in df2:",(b/len(list_corr_df2)*100),"%")

Percentage of correlations in df1: 46.300000000000004 %
Percentage of correlations in df2: 80.7 %


Clearly, the lower the number of observations, the higher the frequency of spurious correlations. However, the number of spurious correlations present in the bigger DataFrame is still very significant.

To counter spurious correlations, random projection can be used.

## Random Projection eps = 0.1

In [9]:
# Project the original DataFrame (df) with a Gaussian random projection to
# obtain a new, reduced DataFrame. n_components="auto" is the library default,
# written out here for clarity.
transformer = random_projection.GaussianRandomProjection(n_components="auto", eps=0.1)
df_new = pd.DataFrame(data=transformer.fit_transform(df))
df_new

Unnamed: 0,0,1,2,3,4,5,6,7,8,9,...,7290,7291,7292,7293,7294,7295,7296,7297,7298,7299
0,-0.128362,0.817648,1.241955,-0.872799,-1.868267,1.541777,-0.027354,-0.567468,-2.599919,-1.988877,...,-0.720649,0.895238,-3.590158,1.222767,-1.057153,1.418575,-0.922029,-2.264503,-0.583607,1.207703
1,0.553699,-0.237677,-0.125647,-2.342176,-1.916403,2.029114,-1.700311,-1.111416,-1.161022,-2.582140,...,-2.447773,-1.449137,-5.750021,-0.310218,0.053238,2.343667,-1.127257,-1.795590,-0.524429,2.426150
2,1.159617,2.547392,2.330427,-3.043360,-0.742959,0.479377,-0.683320,-2.546391,-3.359355,-1.208370,...,-2.620150,-0.062721,-4.320984,2.351188,0.018352,0.550837,0.715337,-2.664801,-1.015692,1.661312
3,1.927495,0.720345,0.922932,-0.564959,-2.226839,1.753817,-0.712425,-0.742290,-0.191014,-0.777285,...,-3.258309,-1.775065,-5.461386,-1.264483,0.015380,1.356115,-0.198016,-2.697311,2.148320,2.837279
4,1.411960,1.301391,0.290096,-1.422156,-1.164816,2.174815,0.398986,-0.612970,-1.612210,-2.613369,...,0.282244,-0.087570,-3.900833,-0.478888,-0.317812,0.718787,-0.705241,-1.886241,2.238937,0.693207
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
4995,2.864636,0.472198,1.087439,-0.490655,-1.808591,1.432861,0.548080,1.551048,0.210490,-2.211085,...,-1.585997,0.204686,-3.532977,-1.282475,-2.051200,2.453373,-0.314776,-1.032843,1.521577,2.950749
4996,0.253804,0.905608,0.800554,-1.742974,-0.290230,3.029215,0.310151,-1.067118,0.100052,-1.657885,...,-3.992088,-0.776798,-5.493631,-0.017286,-1.547238,1.648767,1.401075,-0.877622,0.519174,1.692601
4997,0.044828,-1.280083,-0.205799,-1.424158,-1.324524,1.565390,1.013948,-0.970467,-0.907614,-2.225273,...,-1.211267,0.277194,-3.790778,-0.590092,-1.595265,1.871978,0.467176,-2.979432,0.217973,2.106058
4998,-0.247888,2.120055,3.522785,-1.643004,-0.983278,2.225134,-0.835447,-2.625912,-1.718619,-3.046819,...,-2.556106,0.963618,-4.412617,-1.650420,-0.629229,1.525345,-1.558076,-2.995993,-0.179425,2.038479


In [10]:
# Split the projected DataFrame: column 0 is the reference variable (Y) and
# every other column is a candidate variable (X).
X_df_new = df_new.drop(columns=0)
Y_df_new = df_new[0]
print(Y_df_new)

# Flatten Y into a 1-D NumPy array so it can be passed directly to np.corrcoef
Y_df_new = np.array(Y_df_new).reshape(-1)
print(X_df_new.shape,Y_df_new.shape)

list_titles = X_df_new.columns

# Absolute correlation coefficient between column 0 and every remaining
# column of the projected DataFrame.
list_corr_df_new = []
for i in list_titles:
    print(i)
    # Compute the coefficient once and reuse it for both the stored absolute
    # value and the printed (signed) value.
    corr = np.corrcoef(Y_df_new, X_df_new[i])[0][1]
    list_corr_df_new.append(abs(corr))
    print('Correlation matrix for column 0 and and column' + str(i) + ': ' + str(corr))

0      -0.128362
1       0.553699
2       1.159617
3       1.927495
4       1.411960
          ...   
4995    2.864636
4996    0.253804
4997    0.044828
4998   -0.247888
4999    1.224505
Name: 0, Length: 5000, dtype: float64
(5000, 7299) (5000,)
1
Correlation matrix for column 0 and and column1: 0.02186155011883491
2
Correlation matrix for column 0 and and column2: 0.006923115412907284
3
Correlation matrix for column 0 and and column3: -0.007064477026262293
4
Correlation matrix for column 0 and and column4: 0.01117413934196592
5
Correlation matrix for column 0 and and column5: 0.0063859221084106785
6
Correlation matrix for column 0 and and column6: 0.029122905479867886
7
Correlation matrix for column 0 and and column7: -0.020223527867335507
8
Correlation matrix for column 0 and and column8: -0.0018318318192047977
9
Correlation matrix for column 0 and and column9: 0.004747650862631521
10
Correlation matrix for column 0 and and column10: -0.011186010293024715
11
Correlation matrix for co

193
Correlation matrix for column 0 and and column193: -0.029758251560699632
194
Correlation matrix for column 0 and and column194: -0.015306120945476901
195
Correlation matrix for column 0 and and column195: -0.025260057264700663
196
Correlation matrix for column 0 and and column196: 0.021004551756656182
197
Correlation matrix for column 0 and and column197: 0.0046236106873612185
198
Correlation matrix for column 0 and and column198: 0.006610908962700525
199
Correlation matrix for column 0 and and column199: -0.032281609594807414
200
Correlation matrix for column 0 and and column200: -0.018482915316836105
201
Correlation matrix for column 0 and and column201: -0.0013077831707360482
202
Correlation matrix for column 0 and and column202: 0.001879427495855727
203
Correlation matrix for column 0 and and column203: 0.006959251609713091
204
Correlation matrix for column 0 and and column204: -0.003847480109284455
205
Correlation matrix for column 0 and and column205: 0.026086027713356243
206

350
Correlation matrix for column 0 and and column350: 0.0022056316930853317
351
Correlation matrix for column 0 and and column351: 0.009836000697450522
352
Correlation matrix for column 0 and and column352: 0.0020309068360854525
353
Correlation matrix for column 0 and and column353: 0.002111134566889632
354
Correlation matrix for column 0 and and column354: -0.02633978549801253
355
Correlation matrix for column 0 and and column355: 0.034257916849449385
356
Correlation matrix for column 0 and and column356: -0.007429949204258204
357
Correlation matrix for column 0 and and column357: -0.026036891200339096
358
Correlation matrix for column 0 and and column358: -0.011616860244941567
359
Correlation matrix for column 0 and and column359: -0.01926204215080936
360
Correlation matrix for column 0 and and column360: 0.03162310040536307
361
Correlation matrix for column 0 and and column361: -0.004622325834196339
362
Correlation matrix for column 0 and and column362: 0.015060423214645412
363
Cor

Correlation matrix for column 0 and and column510: -0.0025485949484463466
511
Correlation matrix for column 0 and and column511: 0.017885138220321336
512
Correlation matrix for column 0 and and column512: -0.013928417551094894
513
Correlation matrix for column 0 and and column513: 0.002761788709001681
514
Correlation matrix for column 0 and and column514: -0.020220286069819567
515
Correlation matrix for column 0 and and column515: 0.0010165117309624597
516
Correlation matrix for column 0 and and column516: 0.011235273390591424
517
Correlation matrix for column 0 and and column517: 0.0030006750157097516
518
Correlation matrix for column 0 and and column518: -0.01635900409976668
519
Correlation matrix for column 0 and and column519: 0.01261667420320169
520
Correlation matrix for column 0 and and column520: 0.015833220838560525
521
Correlation matrix for column 0 and and column521: 0.005046936803828048
522
Correlation matrix for column 0 and and column522: 0.013975669994098354
523
Correla

Correlation matrix for column 0 and and column672: -0.0026069711361659557
673
Correlation matrix for column 0 and and column673: 0.035653659230355246
674
Correlation matrix for column 0 and and column674: 0.02296565094468194
675
Correlation matrix for column 0 and and column675: 0.015406531855930756
676
Correlation matrix for column 0 and and column676: -0.01634515047568241
677
Correlation matrix for column 0 and and column677: 0.017098411757065737
678
Correlation matrix for column 0 and and column678: -0.00022117038748696049
679
Correlation matrix for column 0 and and column679: 0.00960362887338575
680
Correlation matrix for column 0 and and column680: -0.013957644302815906
681
Correlation matrix for column 0 and and column681: 0.02053414660699989
682
Correlation matrix for column 0 and and column682: -0.024159408695653105
683
Correlation matrix for column 0 and and column683: -0.00893917281403396
684
Correlation matrix for column 0 and and column684: -0.008582383712418758
685
Correla

Correlation matrix for column 0 and and column829: 0.004903906096244253
830
Correlation matrix for column 0 and and column830: 0.021289994204422773
831
Correlation matrix for column 0 and and column831: -0.020887204117463018
832
Correlation matrix for column 0 and and column832: 0.02285297116617496
833
Correlation matrix for column 0 and and column833: -0.00527991702602847
834
Correlation matrix for column 0 and and column834: -0.005364122768185003
835
Correlation matrix for column 0 and and column835: 0.0002283391512896184
836
Correlation matrix for column 0 and and column836: 0.0032637685652502123
837
Correlation matrix for column 0 and and column837: -0.009188469572707568
838
Correlation matrix for column 0 and and column838: 0.01616950954060041
839
Correlation matrix for column 0 and and column839: 0.004373945698710276
840
Correlation matrix for column 0 and and column840: 0.02156785806168743
841
Correlation matrix for column 0 and and column841: 0.013415481738053295
842
Correlatio

Correlation matrix for column 0 and and column981: 0.0009013818175975932
982
Correlation matrix for column 0 and and column982: -0.02630333552661926
983
Correlation matrix for column 0 and and column983: 0.00233044474872342
984
Correlation matrix for column 0 and and column984: -0.008686598581450362
985
Correlation matrix for column 0 and and column985: 0.009014802627970102
986
Correlation matrix for column 0 and and column986: 0.011510982667873496
987
Correlation matrix for column 0 and and column987: -0.0031673672577460276
988
Correlation matrix for column 0 and and column988: -0.009392926649352514
989
Correlation matrix for column 0 and and column989: 0.017048864850945335
990
Correlation matrix for column 0 and and column990: -0.0230588205794134
991
Correlation matrix for column 0 and and column991: 0.006463998599808438
992
Correlation matrix for column 0 and and column992: 0.01402614328102264
993
Correlation matrix for column 0 and and column993: -0.008228191301168431
994
Correlati

1142
Correlation matrix for column 0 and and column1142: 0.002767288926846841
1143
Correlation matrix for column 0 and and column1143: -0.013270297758663539
1144
Correlation matrix for column 0 and and column1144: 0.022960478049170046
1145
Correlation matrix for column 0 and and column1145: -0.025117721112280677
1146
Correlation matrix for column 0 and and column1146: 0.004913700340848785
1147
Correlation matrix for column 0 and and column1147: -0.0062843938007331145
1148
Correlation matrix for column 0 and and column1148: 0.004664387515299502
1149
Correlation matrix for column 0 and and column1149: 0.01144485144358661
1150
Correlation matrix for column 0 and and column1150: 0.008703357488923699
1151
Correlation matrix for column 0 and and column1151: -0.0003958940711831421
1152
Correlation matrix for column 0 and and column1152: 0.019798491837968068
1153
Correlation matrix for column 0 and and column1153: -0.002408571376657334
1154
Correlation matrix for column 0 and and column1154: 0

1305
Correlation matrix for column 0 and and column1305: 0.0030502636464552957
1306
Correlation matrix for column 0 and and column1306: 0.016666419511218934
1307
Correlation matrix for column 0 and and column1307: 0.017800645822688702
1308
Correlation matrix for column 0 and and column1308: 0.005908699955944196
1309
Correlation matrix for column 0 and and column1309: -0.0028220081745124327
1310
Correlation matrix for column 0 and and column1310: -0.010464960511516812
1311
Correlation matrix for column 0 and and column1311: 0.004169782566335938
1312
Correlation matrix for column 0 and and column1312: -0.009869053079508808
1313
Correlation matrix for column 0 and and column1313: -0.001162733993770827
1314
Correlation matrix for column 0 and and column1314: -0.004602196631755992
1315
Correlation matrix for column 0 and and column1315: -0.00036052834975002087
1316
Correlation matrix for column 0 and and column1316: -0.010546288601228231
1317
Correlation matrix for column 0 and and column13

1468
Correlation matrix for column 0 and and column1468: 0.026023714644457085
1469
Correlation matrix for column 0 and and column1469: 0.007481895023815485
1470
Correlation matrix for column 0 and and column1470: -0.01604625231262037
1471
Correlation matrix for column 0 and and column1471: 0.00135428465141366
1472
Correlation matrix for column 0 and and column1472: -0.004263678944618372
1473
Correlation matrix for column 0 and and column1473: 0.032311560508560544
1474
Correlation matrix for column 0 and and column1474: -0.007360741942041787
1475
Correlation matrix for column 0 and and column1475: 0.032212729661570884
1476
Correlation matrix for column 0 and and column1476: -0.006275912723052799
1477
Correlation matrix for column 0 and and column1477: 0.021152205093270218
1478
Correlation matrix for column 0 and and column1478: -0.017211344711036518
1479
Correlation matrix for column 0 and and column1479: -0.014069695766855279
1480
Correlation matrix for column 0 and and column1480: -0.

Correlation matrix for column 0 and and column1623: -0.0196615051019492
1624
Correlation matrix for column 0 and and column1624: 0.002363353366775366
1625
Correlation matrix for column 0 and and column1625: -0.0005366309254908124
1626
Correlation matrix for column 0 and and column1626: 0.003840685592640545
1627
Correlation matrix for column 0 and and column1627: 0.003375043792954491
1628
Correlation matrix for column 0 and and column1628: 0.005801936642986844
1629
Correlation matrix for column 0 and and column1629: 0.002830436714517052
1630
Correlation matrix for column 0 and and column1630: 0.0003126078082685732
1631
Correlation matrix for column 0 and and column1631: 0.00954680509285313
1632
Correlation matrix for column 0 and and column1632: -0.015227138913462574
1633
Correlation matrix for column 0 and and column1633: -0.0044752392874702045
1634
Correlation matrix for column 0 and and column1634: 0.00854557931411772
1635
Correlation matrix for column 0 and and column1635: 0.0022146

Correlation matrix for column 0 and and column1786: -0.003746673022172295
1787
Correlation matrix for column 0 and and column1787: 0.015872057910022448
1788
Correlation matrix for column 0 and and column1788: -0.0035297463217332107
1789
Correlation matrix for column 0 and and column1789: 0.009295905281193997
1790
Correlation matrix for column 0 and and column1790: 0.01627048544317716
1791
Correlation matrix for column 0 and and column1791: -0.0031527708034992754
1792
Correlation matrix for column 0 and and column1792: -0.031135326782795257
1793
Correlation matrix for column 0 and and column1793: -0.009761490083726785
1794
Correlation matrix for column 0 and and column1794: 0.006862439765687909
1795
Correlation matrix for column 0 and and column1795: -0.007116477571020462
1796
Correlation matrix for column 0 and and column1796: 0.015460721023696456
1797
Correlation matrix for column 0 and and column1797: 0.01468563015064018
1798
Correlation matrix for column 0 and and column1798: 0.0254

Correlation matrix for column 0 and and column1948: -0.000505589854972826
1949
Correlation matrix for column 0 and and column1949: -0.009091785404570047
1950
Correlation matrix for column 0 and and column1950: 0.004092278313261978
1951
Correlation matrix for column 0 and and column1951: -0.014537072092170195
1952
Correlation matrix for column 0 and and column1952: 0.012013601427428655
1953
Correlation matrix for column 0 and and column1953: 0.007941043395737746
1954
Correlation matrix for column 0 and and column1954: -0.00205039110598917
1955
Correlation matrix for column 0 and and column1955: 0.0005414618014731113
1956
Correlation matrix for column 0 and and column1956: -0.02770989636101999
1957
Correlation matrix for column 0 and and column1957: 0.007973036130785963
1958
Correlation matrix for column 0 and and column1958: 0.0031332034049507233
1959
Correlation matrix for column 0 and and column1959: -0.020070377469032556
1960
Correlation matrix for column 0 and and column1960: -0.019

Correlation matrix for column 0 and and column2110: 0.013012392618536012
2111
Correlation matrix for column 0 and and column2111: 0.01878375679792723
2112
Correlation matrix for column 0 and and column2112: -0.007356407305656953
2113
Correlation matrix for column 0 and and column2113: 0.022611677245816312
2114
Correlation matrix for column 0 and and column2114: 0.011681203479142206
2115
Correlation matrix for column 0 and and column2115: 0.02635759324717297
2116
Correlation matrix for column 0 and and column2116: -0.01595343486673634
2117
Correlation matrix for column 0 and and column2117: 0.02855028441735885
2118
Correlation matrix for column 0 and and column2118: 0.004145032452978334
2119
Correlation matrix for column 0 and and column2119: -0.02559907992622852
2120
Correlation matrix for column 0 and and column2120: -0.006808286852287073
2121
Correlation matrix for column 0 and and column2121: 0.014644002404390045
2122
Correlation matrix for column 0 and and column2122: -0.0030896273

Correlation matrix for column 0 and and column2274: 0.018271609689694306
2275
Correlation matrix for column 0 and and column2275: -0.0022412557654254224
2276
Correlation matrix for column 0 and and column2276: -0.01394580620399998
2277
Correlation matrix for column 0 and and column2277: 0.0004860904459749214
2278
Correlation matrix for column 0 and and column2278: -0.02471383729034653
2279
Correlation matrix for column 0 and and column2279: 0.020415955615903685
2280
Correlation matrix for column 0 and and column2280: -0.018680800035283576
2281
Correlation matrix for column 0 and and column2281: 0.006980442370530687
2282
Correlation matrix for column 0 and and column2282: -0.013236871958853699
2283
Correlation matrix for column 0 and and column2283: -0.011510648255690077
2284
Correlation matrix for column 0 and and column2284: -0.01601455281661371
2285
Correlation matrix for column 0 and and column2285: 0.010365402580248099
2286
Correlation matrix for column 0 and and column2286: -0.006

2430
Correlation matrix for column 0 and and column2430: 0.00342899624548756
2431
Correlation matrix for column 0 and and column2431: -0.011645877033090285
2432
Correlation matrix for column 0 and and column2432: 0.03206086888818681
2433
Correlation matrix for column 0 and and column2433: 0.00704892661063211
2434
Correlation matrix for column 0 and and column2434: 0.009403936009105942
2435
Correlation matrix for column 0 and and column2435: 0.013929181290942507
2436
Correlation matrix for column 0 and and column2436: 0.0029687532961772925
2437
Correlation matrix for column 0 and and column2437: -0.0024902789038903504
2438
Correlation matrix for column 0 and and column2438: -0.001389847565509864
2439
Correlation matrix for column 0 and and column2439: -0.005208253058477614
2440
Correlation matrix for column 0 and and column2440: 0.017506256617657454
2441
Correlation matrix for column 0 and and column2441: 0.006041953492582917
2442
Correlation matrix for column 0 and and column2442: 0.01

Correlation matrix for column 0 and and column2575: 0.013318951959478461
2576
Correlation matrix for column 0 and and column2576: -0.00279701912727388
2577
Correlation matrix for column 0 and and column2577: 0.004446450996546239
2578
Correlation matrix for column 0 and and column2578: -0.015083021238893964
2579
Correlation matrix for column 0 and and column2579: -0.007860251821215416
2580
Correlation matrix for column 0 and and column2580: 0.009172096983492955
2581
Correlation matrix for column 0 and and column2581: -0.008766266327299032
2582
Correlation matrix for column 0 and and column2582: 0.005100148180684397
2583
Correlation matrix for column 0 and and column2583: -0.010968969252662381
2584
Correlation matrix for column 0 and and column2584: -0.0115979487358934
2585
Correlation matrix for column 0 and and column2585: -0.01064263106845309
2586
Correlation matrix for column 0 and and column2586: 0.01897031070551278
2587
Correlation matrix for column 0 and and column2587: 0.02977960

2732
Correlation matrix for column 0 and and column2732: 0.0018891400413675891
2733
Correlation matrix for column 0 and and column2733: -0.022860734429741632
2734
Correlation matrix for column 0 and and column2734: -0.00455763313804976
2735
Correlation matrix for column 0 and and column2735: 0.005254778938027227
2736
Correlation matrix for column 0 and and column2736: -0.028754604709903004
2737
Correlation matrix for column 0 and and column2737: -0.024999232538121436
2738
Correlation matrix for column 0 and and column2738: 0.033291934719903014
2739
Correlation matrix for column 0 and and column2739: 0.002244555945307444
2740
Correlation matrix for column 0 and and column2740: 0.0060620161037501985
2741
Correlation matrix for column 0 and and column2741: 0.01016567199271947
2742
Correlation matrix for column 0 and and column2742: 0.009160260809843522
2743
Correlation matrix for column 0 and and column2743: -0.006968210031187241
2744
Correlation matrix for column 0 and and column2744: 0.

Correlation matrix for column 0 and and column2883: -0.026175683633249996
2884
Correlation matrix for column 0 and and column2884: 0.013833945174513583
2885
Correlation matrix for column 0 and and column2885: 0.0006724610498619633
2886
Correlation matrix for column 0 and and column2886: 0.008597403839754148
2887
Correlation matrix for column 0 and and column2887: 0.011777180555665654
2888
Correlation matrix for column 0 and and column2888: -0.00031251512540613965
2889
Correlation matrix for column 0 and and column2889: 0.023667362706697725
2890
Correlation matrix for column 0 and and column2890: -0.021108524992110217
2891
Correlation matrix for column 0 and and column2891: -0.013544477074629203
2892
Correlation matrix for column 0 and and column2892: 0.023335780384237465
2893
Correlation matrix for column 0 and and column2893: -0.0009263778953951859
2894
Correlation matrix for column 0 and and column2894: 0.010570236372932432
2895
Correlation matrix for column 0 and and column2895: -0.

Correlation matrix for column 0 and and column3041: -0.006890917323660042
3042
Correlation matrix for column 0 and and column3042: -0.020127592796993957
3043
Correlation matrix for column 0 and and column3043: 0.0009019449228604869
3044
Correlation matrix for column 0 and and column3044: 0.013320701243070946
3045
Correlation matrix for column 0 and and column3045: -0.024364972920294835
3046
Correlation matrix for column 0 and and column3046: -0.0023571292808934846
3047
Correlation matrix for column 0 and and column3047: 0.009079158754675052
3048
Correlation matrix for column 0 and and column3048: -0.0034733966130295305
3049
Correlation matrix for column 0 and and column3049: 0.010586674587536373
3050
Correlation matrix for column 0 and and column3050: -0.016564859965879045
3051
Correlation matrix for column 0 and and column3051: -0.03884069071751326
3052
Correlation matrix for column 0 and and column3052: 0.0016107243397905137
3053
Correlation matrix for column 0 and and column3053: -0

3204
Correlation matrix for column 0 and and column3204: 0.005183915396267064
3205
Correlation matrix for column 0 and and column3205: 0.02923359579503477
3206
Correlation matrix for column 0 and and column3206: 0.00017521967182515898
3207
Correlation matrix for column 0 and and column3207: -0.010251679888580474
3208
Correlation matrix for column 0 and and column3208: -0.014745114529466448
3209
Correlation matrix for column 0 and and column3209: -0.009180122826466063
3210
Correlation matrix for column 0 and and column3210: 0.00010752761761820651
3211
Correlation matrix for column 0 and and column3211: 0.004028116686561831
3212
Correlation matrix for column 0 and and column3212: -0.003461199030106405
3213
Correlation matrix for column 0 and and column3213: -0.013963860002683477
3214
Correlation matrix for column 0 and and column3214: -0.011214125875153936
3215
Correlation matrix for column 0 and and column3215: 0.000493506239145206
3216
Correlation matrix for column 0 and and column3216

Correlation matrix for column 0 and and column3355: 0.00544404593573206
3356
Correlation matrix for column 0 and and column3356: 0.008661591444818291
3357
Correlation matrix for column 0 and and column3357: -0.00380594055349353
3358
Correlation matrix for column 0 and and column3358: 0.003320920029412995
3359
Correlation matrix for column 0 and and column3359: 0.007996885896015462
3360
Correlation matrix for column 0 and and column3360: -0.0025955577912550273
3361
Correlation matrix for column 0 and and column3361: -0.03324154408390391
3362
Correlation matrix for column 0 and and column3362: 0.018723702662966434
3363
Correlation matrix for column 0 and and column3363: 0.008917240584257545
3364
Correlation matrix for column 0 and and column3364: 0.01648298455069448
3365
Correlation matrix for column 0 and and column3365: -0.01612090128255823
3366
Correlation matrix for column 0 and and column3366: 0.006207014230107349
3367
Correlation matrix for column 0 and and column3367: 0.0291870141

Correlation matrix for column 0 and and column3519: -0.00837707061421417
3520
Correlation matrix for column 0 and and column3520: -0.007374870294518553
3521
Correlation matrix for column 0 and and column3521: -0.007167801645222658
3522
Correlation matrix for column 0 and and column3522: 0.01726409664129208
3523
Correlation matrix for column 0 and and column3523: 0.018831925298068087
3524
Correlation matrix for column 0 and and column3524: 0.01209440985002633
3525
Correlation matrix for column 0 and and column3525: -0.0012123699366222414
3526
Correlation matrix for column 0 and and column3526: 0.016814391558540434
3527
Correlation matrix for column 0 and and column3527: -0.016814404995811695
3528
Correlation matrix for column 0 and and column3528: -0.04274191378383655
3529
Correlation matrix for column 0 and and column3529: 0.005204630513973236
3530
Correlation matrix for column 0 and and column3530: 0.022218348660757906
3531
Correlation matrix for column 0 and and column3531: 0.0163433

Correlation matrix for column 0 and and column3681: 0.020724010365519005
3682
Correlation matrix for column 0 and and column3682: -0.009149967216961567
3683
Correlation matrix for column 0 and and column3683: -0.0005309497393331472
3684
Correlation matrix for column 0 and and column3684: 0.017926993749514952
3685
Correlation matrix for column 0 and and column3685: -0.0012664542759019991
3686
Correlation matrix for column 0 and and column3686: -0.0017682034780658893
3687
Correlation matrix for column 0 and and column3687: -0.01108414676952709
3688
Correlation matrix for column 0 and and column3688: 0.006686183932531333
3689
Correlation matrix for column 0 and and column3689: -0.0011435257199186
3690
Correlation matrix for column 0 and and column3690: -0.020226876966669072
3691
Correlation matrix for column 0 and and column3691: 0.010882442696666387
3692
Correlation matrix for column 0 and and column3692: 0.021016187058775157
3693
Correlation matrix for column 0 and and column3693: -0.00

3844
Correlation matrix for column 0 and and column3844: -0.029490761380533546
3845
Correlation matrix for column 0 and and column3845: -0.00692413667087716
3846
Correlation matrix for column 0 and and column3846: -0.018069375080009442
3847
Correlation matrix for column 0 and and column3847: -0.01726056366042104
3848
Correlation matrix for column 0 and and column3848: -0.013147685256274425
3849
Correlation matrix for column 0 and and column3849: -3.313190064382882e-05
3850
Correlation matrix for column 0 and and column3850: 0.00033460946178192605
3851
Correlation matrix for column 0 and and column3851: -0.014609805625519027
3852
Correlation matrix for column 0 and and column3852: -0.015497612300988195
3853
Correlation matrix for column 0 and and column3853: -0.0035896158594140065
3854
Correlation matrix for column 0 and and column3854: 0.01778091751456393
3855
Correlation matrix for column 0 and and column3855: 0.00448992772764995
3856
Correlation matrix for column 0 and and column3856

Correlation matrix for column 0 and and column4007: -0.013110279940965912
4008
Correlation matrix for column 0 and and column4008: 0.016476018093818042
4009
Correlation matrix for column 0 and and column4009: -0.009758675289894879
4010
Correlation matrix for column 0 and and column4010: -0.018858214748936817
4011
Correlation matrix for column 0 and and column4011: -0.013400492678815983
4012
Correlation matrix for column 0 and and column4012: 0.011384082173832943
4013
Correlation matrix for column 0 and and column4013: -0.002096327608105479
4014
Correlation matrix for column 0 and and column4014: 0.004176572138097447
4015
Correlation matrix for column 0 and and column4015: -0.0050764208877590415
4016
Correlation matrix for column 0 and and column4016: -0.0057761211791804365
4017
Correlation matrix for column 0 and and column4017: -0.015518743126451547
4018
Correlation matrix for column 0 and and column4018: -0.012854835265087535
4019
Correlation matrix for column 0 and and column4019: 0

Correlation matrix for column 0 and and column4135: 0.008155806645930899
4136
Correlation matrix for column 0 and and column4136: -0.0004847153003027253
4137
Correlation matrix for column 0 and and column4137: -0.015520802518584793
4138
Correlation matrix for column 0 and and column4138: 0.005716295139192639
4139
Correlation matrix for column 0 and and column4139: 0.0002806143431839805
4140
Correlation matrix for column 0 and and column4140: 0.01891281446050922
4141
Correlation matrix for column 0 and and column4141: -0.014018822285440331
4142
Correlation matrix for column 0 and and column4142: -0.0038274257558297406
4143
Correlation matrix for column 0 and and column4143: -0.04248480707414867
4144
Correlation matrix for column 0 and and column4144: 0.020386030811618387
4145
Correlation matrix for column 0 and and column4145: 0.004242889113348091
4146
Correlation matrix for column 0 and and column4146: -0.011886215835837237
4147
Correlation matrix for column 0 and and column4147: 0.006

Correlation matrix for column 0 and and column4293: -0.006095972948763304
4294
Correlation matrix for column 0 and and column4294: -0.01061127578034576
4295
Correlation matrix for column 0 and and column4295: -0.006056878217189089
4296
Correlation matrix for column 0 and and column4296: 0.01656067212850548
4297
Correlation matrix for column 0 and and column4297: 0.0015604639971359643
4298
Correlation matrix for column 0 and and column4298: 0.01777593708200344
4299
Correlation matrix for column 0 and and column4299: 0.0034571194275691106
4300
Correlation matrix for column 0 and and column4300: 0.01181545723247308
4301
Correlation matrix for column 0 and and column4301: -0.012521103072087595
4302
Correlation matrix for column 0 and and column4302: 0.001173069031973771
4303
Correlation matrix for column 0 and and column4303: 0.01409335144976937
4304
Correlation matrix for column 0 and and column4304: 0.002878860373202294
4305
Correlation matrix for column 0 and and column4305: -0.00957946

Correlation matrix for column 0 and and column4453: 0.018946158075776844
4454
Correlation matrix for column 0 and and column4454: 0.011184286727127932
4455
Correlation matrix for column 0 and and column4455: -0.01025535669355376
4456
Correlation matrix for column 0 and and column4456: 0.0038259728443665233
4457
Correlation matrix for column 0 and and column4457: -0.010097370156916143
4458
Correlation matrix for column 0 and and column4458: 0.013404013186210957
4459
Correlation matrix for column 0 and and column4459: -0.003012591131689127
4460
Correlation matrix for column 0 and and column4460: -0.008137107786709716
4461
Correlation matrix for column 0 and and column4461: 0.047379156889277796
4462
Correlation matrix for column 0 and and column4462: -0.0012346849182830715
4463
Correlation matrix for column 0 and and column4463: -0.02519965932620209
4464
Correlation matrix for column 0 and and column4464: 0.005286670404338192
4465
Correlation matrix for column 0 and and column4465: 0.0067

Correlation matrix for column 0 and and column4613: -0.003449852262010013
4614
Correlation matrix for column 0 and and column4614: 0.004437247986369211
4615
Correlation matrix for column 0 and and column4615: 0.012717407194055645
4616
Correlation matrix for column 0 and and column4616: 0.011598456409492443
4617
Correlation matrix for column 0 and and column4617: 0.019374639964614804
4618
Correlation matrix for column 0 and and column4618: -0.005259182760086609
4619
Correlation matrix for column 0 and and column4619: 0.01604668344439581
4620
Correlation matrix for column 0 and and column4620: 0.015806464502742878
4621
Correlation matrix for column 0 and and column4621: -0.005241038951975257
4622
Correlation matrix for column 0 and and column4622: -0.002933887574482598
4623
Correlation matrix for column 0 and and column4623: -0.0027462054576577848
4624
Correlation matrix for column 0 and and column4624: 0.005447858249436
4625
Correlation matrix for column 0 and and column4625: 0.00550007

4779
Correlation matrix for column 0 and and column4779: -0.005433822299860022
4780
Correlation matrix for column 0 and and column4780: -0.019222300578960738
4781
Correlation matrix for column 0 and and column4781: -0.01559356966906543
4782
Correlation matrix for column 0 and and column4782: 0.028766953720691654
4783
Correlation matrix for column 0 and and column4783: 0.018834377746795968
4784
Correlation matrix for column 0 and and column4784: 0.013168484551786779
4785
Correlation matrix for column 0 and and column4785: 0.008233482664014422
4786
Correlation matrix for column 0 and and column4786: 0.02463640338004494
4787
Correlation matrix for column 0 and and column4787: -0.01741834340625152
4788
Correlation matrix for column 0 and and column4788: 0.012819359643135766
4789
Correlation matrix for column 0 and and column4789: 0.0006933409014057572
4790
Correlation matrix for column 0 and and column4790: -0.02430762846809343
4791
Correlation matrix for column 0 and and column4791: 0.017

Correlation matrix for column 0 and and column4941: 0.003964194001370567
4942
Correlation matrix for column 0 and and column4942: -0.01171291306202165
4943
Correlation matrix for column 0 and and column4943: -0.018743002284246604
4944
Correlation matrix for column 0 and and column4944: -0.0014790046935563683
4945
Correlation matrix for column 0 and and column4945: -0.01242268939044181
4946
Correlation matrix for column 0 and and column4946: 0.018235794388315317
4947
Correlation matrix for column 0 and and column4947: 0.028641976850738302
4948
Correlation matrix for column 0 and and column4948: -0.036681421205065
4949
Correlation matrix for column 0 and and column4949: -0.013750305949121324
4950
Correlation matrix for column 0 and and column4950: 0.0016373704774526763
4951
Correlation matrix for column 0 and and column4951: -0.0034686183240487892
4952
Correlation matrix for column 0 and and column4952: -0.035327265703525346
4953
Correlation matrix for column 0 and and column4953: -0.004

Correlation matrix for column 0 and and column5096: -0.01437737926319226
5097
Correlation matrix for column 0 and and column5097: -0.01716749069823099
5098
Correlation matrix for column 0 and and column5098: 0.003993268953900459
5099
Correlation matrix for column 0 and and column5099: -0.008354138095436954
5100
Correlation matrix for column 0 and and column5100: -0.003493071846779758
5101
Correlation matrix for column 0 and and column5101: 0.0024981218310594607
5102
Correlation matrix for column 0 and and column5102: -0.01317213278537384
5103
Correlation matrix for column 0 and and column5103: -0.004392514879941991
5104
Correlation matrix for column 0 and and column5104: 0.022998368718153864
5105
Correlation matrix for column 0 and and column5105: -0.002127461813379614
5106
Correlation matrix for column 0 and and column5106: -0.009352240186476716
5107
Correlation matrix for column 0 and and column5107: 0.018475818755750013
5108
Correlation matrix for column 0 and and column5108: 0.0142

Correlation matrix for column 0 and and column5258: -0.006456915899343391
5259
Correlation matrix for column 0 and and column5259: -0.014312128615529164
5260
Correlation matrix for column 0 and and column5260: -0.00030882770552936303
5261
Correlation matrix for column 0 and and column5261: -0.021371140670618963
5262
Correlation matrix for column 0 and and column5262: -0.002267093557410997
5263
Correlation matrix for column 0 and and column5263: -0.0003795555838738998
5264
Correlation matrix for column 0 and and column5264: -0.0065431963695725395
5265
Correlation matrix for column 0 and and column5265: -0.026771308296639203
5266
Correlation matrix for column 0 and and column5266: -0.004119505722561278
5267
Correlation matrix for column 0 and and column5267: -0.014937913594544688
5268
Correlation matrix for column 0 and and column5268: -0.006268197615497133
5269
Correlation matrix for column 0 and and column5269: 0.0027875736810187546
5270
Correlation matrix for column 0 and and column52

Correlation matrix for column 0 and and column5419: 0.00729337371886688
5420
Correlation matrix for column 0 and and column5420: 0.009148025435229908
5421
Correlation matrix for column 0 and and column5421: -0.0075376454728840305
5422
Correlation matrix for column 0 and and column5422: -0.008542002987331328
5423
Correlation matrix for column 0 and and column5423: 0.014213893059597155
5424
Correlation matrix for column 0 and and column5424: 0.006552170692006023
5425
Correlation matrix for column 0 and and column5425: 0.010230449058682076
5426
Correlation matrix for column 0 and and column5426: -0.016509620269561227
5427
Correlation matrix for column 0 and and column5427: -0.00307192509936948
5428
Correlation matrix for column 0 and and column5428: 0.007705594100533621
5429
Correlation matrix for column 0 and and column5429: -0.004829758992941267
5430
Correlation matrix for column 0 and and column5430: -0.014070081926362945
5431
Correlation matrix for column 0 and and column5431: -0.0112

Correlation matrix for column 0 and and column5579: -0.0028860131719995407
5580
Correlation matrix for column 0 and and column5580: 0.0005270234786618761
5581
Correlation matrix for column 0 and and column5581: 0.007020553351411903
5582
Correlation matrix for column 0 and and column5582: 0.007398121149130891
5583
Correlation matrix for column 0 and and column5583: -0.0075565711459271885
5584
Correlation matrix for column 0 and and column5584: 0.011318339955988358
5585
Correlation matrix for column 0 and and column5585: 5.201010274506945e-05
5586
Correlation matrix for column 0 and and column5586: 0.009908402156154003
5587
Correlation matrix for column 0 and and column5587: 0.019592814255565864
5588
Correlation matrix for column 0 and and column5588: -0.004355549651094933
5589
Correlation matrix for column 0 and and column5589: 0.0018610365445771034
5590
Correlation matrix for column 0 and and column5590: 0.025062438004043595
5591
Correlation matrix for column 0 and and column5591: -0.0

5740
Correlation matrix for column 0 and and column5740: -0.00951168375576674
5741
Correlation matrix for column 0 and and column5741: -0.024011877366964317
5742
Correlation matrix for column 0 and and column5742: -0.027662319579245857
5743
Correlation matrix for column 0 and and column5743: -0.005498059144527088
5744
Correlation matrix for column 0 and and column5744: -0.001745589388442449
5745
Correlation matrix for column 0 and and column5745: 0.0021939028110391913
5746
Correlation matrix for column 0 and and column5746: -0.025934787725837412
5747
Correlation matrix for column 0 and and column5747: 0.032440609534312846
5748
Correlation matrix for column 0 and and column5748: -0.00641914661183759
5749
Correlation matrix for column 0 and and column5749: 0.012706717145701393
5750
Correlation matrix for column 0 and and column5750: -0.03406266042270289
5751
Correlation matrix for column 0 and and column5751: -0.010907136450364105
5752
Correlation matrix for column 0 and and column5752: 

Correlation matrix for column 0 and and column5891: -0.0005335406562388847
5892
Correlation matrix for column 0 and and column5892: 0.013360440245114636
5893
Correlation matrix for column 0 and and column5893: -0.006885042448351817
5894
Correlation matrix for column 0 and and column5894: 0.0019389249966802954
5895
Correlation matrix for column 0 and and column5895: 0.013462032254317042
5896
Correlation matrix for column 0 and and column5896: -0.004566246082058716
5897
Correlation matrix for column 0 and and column5897: 0.0011153462182710357
5898
Correlation matrix for column 0 and and column5898: -0.011410621912296108
5899
Correlation matrix for column 0 and and column5899: -0.01017991125903515
5900
Correlation matrix for column 0 and and column5900: -0.001988325590250998
5901
Correlation matrix for column 0 and and column5901: -0.01165492087465503
5902
Correlation matrix for column 0 and and column5902: 0.008476423839385407
5903
Correlation matrix for column 0 and and column5903: 0.01

Correlation matrix for column 0 and and column6052: 0.021911463141578876
6053
Correlation matrix for column 0 and and column6053: 0.02552760754855854
6054
Correlation matrix for column 0 and and column6054: 0.017713537987896218
6055
Correlation matrix for column 0 and and column6055: 0.0036737680111870053
6056
Correlation matrix for column 0 and and column6056: 0.008952525442101952
6057
Correlation matrix for column 0 and and column6057: 0.012195878107878963
6058
Correlation matrix for column 0 and and column6058: 0.017576276335843518
6059
Correlation matrix for column 0 and and column6059: -0.02213276452280137
6060
Correlation matrix for column 0 and and column6060: -0.006887251815545705
6061
Correlation matrix for column 0 and and column6061: 0.015276723505073121
6062
Correlation matrix for column 0 and and column6062: -0.007663269483035286
6063
Correlation matrix for column 0 and and column6063: 0.00877193731002588
6064
Correlation matrix for column 0 and and column6064: -0.01065053

Correlation matrix for column 0 and and column6212: 0.02367561374567531
6213
Correlation matrix for column 0 and and column6213: 0.02100308407534944
6214
Correlation matrix for column 0 and and column6214: 0.012016702344385665
6215
Correlation matrix for column 0 and and column6215: -0.0044185415987814695
6216
Correlation matrix for column 0 and and column6216: -0.007015075065961251
6217
Correlation matrix for column 0 and and column6217: 0.00858406805088879
6218
Correlation matrix for column 0 and and column6218: 0.0027582795005064438
6219
Correlation matrix for column 0 and and column6219: -0.0010115496546379897
6220
Correlation matrix for column 0 and and column6220: 0.010137325725615966
6221
Correlation matrix for column 0 and and column6221: 0.009417582205716998
6222
Correlation matrix for column 0 and and column6222: -0.020412982912051434
6223
Correlation matrix for column 0 and and column6223: 0.0016532504293611929
6224
Correlation matrix for column 0 and and column6224: -0.0294

Correlation matrix for column 0 and and column6376: -0.028109322822823354
6377
Correlation matrix for column 0 and and column6377: -0.010623747517975507
6378
Correlation matrix for column 0 and and column6378: 0.01996780256897293
6379
Correlation matrix for column 0 and and column6379: 0.012537496735752492
6380
Correlation matrix for column 0 and and column6380: 0.009727586139840413
6381
Correlation matrix for column 0 and and column6381: 0.0034405635769563445
6382
Correlation matrix for column 0 and and column6382: 0.02979133566227124
6383
Correlation matrix for column 0 and and column6383: -0.0005158928558597155
6384
Correlation matrix for column 0 and and column6384: 0.00019727666807444722
6385
Correlation matrix for column 0 and and column6385: 0.011757190187691646
6386
Correlation matrix for column 0 and and column6386: 0.022382479921125666
6387
Correlation matrix for column 0 and and column6387: -0.010986726066095926
6388
Correlation matrix for column 0 and and column6388: 0.0122

Correlation matrix for column 0 and and column6539: 0.042700001578388054
6540
Correlation matrix for column 0 and and column6540: -0.0038816335195773835
6541
Correlation matrix for column 0 and and column6541: 0.015611103869201984
6542
Correlation matrix for column 0 and and column6542: 0.01676731751723396
6543
Correlation matrix for column 0 and and column6543: -0.013282442461469037
6544
Correlation matrix for column 0 and and column6544: 0.0048572042714142075
6545
Correlation matrix for column 0 and and column6545: 0.002177244110896442
6546
Correlation matrix for column 0 and and column6546: 0.01781259370277626
6547
Correlation matrix for column 0 and and column6547: 0.0021086254066294
6548
Correlation matrix for column 0 and and column6548: -0.006871689026754384
6549
Correlation matrix for column 0 and and column6549: 0.013006814066438473
6550
Correlation matrix for column 0 and and column6550: 0.0006872603601838957
6551
Correlation matrix for column 0 and and column6551: 0.01404604

Correlation matrix for column 0 and and column6686: -0.00035816467524810207
6687
Correlation matrix for column 0 and and column6687: 0.017013204651046745
6688
Correlation matrix for column 0 and and column6688: 0.01770634652285275
6689
Correlation matrix for column 0 and and column6689: -0.015139818435657728
6690
Correlation matrix for column 0 and and column6690: -0.021535219903312853
6691
Correlation matrix for column 0 and and column6691: -0.023091439452308068
6692
Correlation matrix for column 0 and and column6692: -0.005535953283684938
6693
Correlation matrix for column 0 and and column6693: -0.0008966732854451675
6694
Correlation matrix for column 0 and and column6694: 0.024247500599579978
6695
Correlation matrix for column 0 and and column6695: -0.024900654728928155
6696
Correlation matrix for column 0 and and column6696: -0.01928524768903073
6697
Correlation matrix for column 0 and and column6697: 0.014872429010900362
6698
Correlation matrix for column 0 and and column6698: 0.0

Correlation matrix for column 0 and and column6847: 0.0029601713172189227
6848
Correlation matrix for column 0 and and column6848: 0.0018083672545228734
6849
Correlation matrix for column 0 and and column6849: -0.004436081282698351
6850
Correlation matrix for column 0 and and column6850: -0.004753726175952196
6851
Correlation matrix for column 0 and and column6851: 0.017616505855934023
6852
Correlation matrix for column 0 and and column6852: 0.012336998822254653
6853
Correlation matrix for column 0 and and column6853: -0.021130548512725132
6854
Correlation matrix for column 0 and and column6854: -0.006989217817015745
6855
Correlation matrix for column 0 and and column6855: 0.007604487018305495
6856
Correlation matrix for column 0 and and column6856: 0.003164454078787439
6857
Correlation matrix for column 0 and and column6857: 0.020823127142140206
6858
Correlation matrix for column 0 and and column6858: 0.01051606706150482
6859
Correlation matrix for column 0 and and column6859: -0.0098

Correlation matrix for column 0 and and column7010: -0.010209642948472543
7011
Correlation matrix for column 0 and and column7011: 0.0003267529948275133
7012
Correlation matrix for column 0 and and column7012: 0.0006200659325218668
7013
Correlation matrix for column 0 and and column7013: 0.009003937454814565
7014
Correlation matrix for column 0 and and column7014: 0.003802310831492354
7015
Correlation matrix for column 0 and and column7015: -0.004382818200725225
7016
Correlation matrix for column 0 and and column7016: -0.0090706460095083
7017
Correlation matrix for column 0 and and column7017: 0.012227293187055987
7018
Correlation matrix for column 0 and and column7018: 0.029915116090099076
7019
Correlation matrix for column 0 and and column7019: 0.0037790630666873063
7020
Correlation matrix for column 0 and and column7020: 0.016590245284959726
7021
Correlation matrix for column 0 and and column7021: -0.012439580620159062
7022
Correlation matrix for column 0 and and column7022: -0.0320

Correlation matrix for column 0 and and column7172: -0.006985569598924909
7173
Correlation matrix for column 0 and and column7173: 0.01591577842322913
7174
Correlation matrix for column 0 and and column7174: -0.002069324336671767
7175
Correlation matrix for column 0 and and column7175: 0.016740563446995045
7176
Correlation matrix for column 0 and and column7176: -0.008515890777695509
7177
Correlation matrix for column 0 and and column7177: 0.0016910471597005815
7178
Correlation matrix for column 0 and and column7178: 0.01777526232256592
7179
Correlation matrix for column 0 and and column7179: 0.05699983005099229
7180
Correlation matrix for column 0 and and column7180: -0.012253419774139872
7181
Correlation matrix for column 0 and and column7181: -0.016566945135141016
7182
Correlation matrix for column 0 and and column7182: -3.0395895721200878e-05
7183
Correlation matrix for column 0 and and column7183: 0.02385515343408042
7184
Correlation matrix for column 0 and and column7184: 0.00401

In [11]:
# Count how many stored correlation values exceed 0.01 in absolute value,
# for each of the two lists built in earlier cells, and report the share
# of such values as a percentage of the list length.
a = sum(1 for corr in list_corr_df1 if abs(corr) > 0.01)
b = sum(1 for corr in list_corr_df_new if abs(corr) > 0.01)

pct_df1 = a/len(list_corr_df1)*100
pct_df_new = b/len(list_corr_df_new)*100

print("Percentage of correlations in df1:",(pct_df1),"%")

print("Percentage of correlations in df_new:",(pct_df_new),"%")

Percentage of correlations in df1: 46.300000000000004 %
Percentage of correlations in df_new: 47.8832716810522 %


## Random Projection eps = 0.5

In [12]:
# Reduce `df` with a Gaussian random projection (eps = 0.5) and wrap the
# projected array in a new DataFrame. n_components is left at its default,
# so scikit-learn chooses the output width from eps and the number of rows.
# NOTE(review): the previous comment referred to "df1", but the frame that is
# actually projected here is `df` -- confirm which one is intended.
transformer = random_projection.GaussianRandomProjection(eps=0.5)
projected = transformer.fit_transform(df)
df_new = pd.DataFrame(projected)
df_new

Unnamed: 0,0,1,2,3,4,5,6,7,8,9,...,398,399,400,401,402,403,404,405,406,407
0,4.393873,-5.418870,-18.804631,-8.756233,-2.894961,-28.460906,6.498153,5.382570,1.494611,-12.505758,...,14.568440,7.115923,-1.092132,2.118208,-2.256701,-1.070940,18.447298,-4.253091,-0.295686,-0.048403
1,6.513317,-8.598065,-18.862545,-2.679299,-10.444649,-23.852196,2.970171,4.582985,-1.740843,-5.813995,...,1.773110,0.019862,1.973441,4.012337,-5.715563,3.564803,17.271407,-7.640295,0.476062,4.472542
2,0.467242,-9.960916,-14.490054,-4.748114,-4.836908,-19.017380,-4.788136,-0.206744,12.692724,-11.082344,...,7.881596,5.657443,5.547112,8.807565,7.719181,-1.709014,13.859097,-3.451287,1.868450,2.347666
3,5.234576,-16.513798,-15.791535,-3.937882,-12.143270,-20.819429,-10.585996,0.740352,2.581232,-0.953379,...,6.277563,5.351048,6.738107,12.394177,11.740391,-0.939854,14.629208,-5.494908,3.374834,2.713411
4,10.408715,-10.260841,-9.870698,1.462573,-3.737125,-25.604084,-3.606723,-1.301646,3.598168,-7.722082,...,14.630930,3.848384,0.903191,9.567900,0.392781,-0.945019,7.688441,-8.536405,1.128304,4.137700
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
4995,5.887463,-6.278177,-15.128034,-7.876788,-1.742725,-25.665281,7.890721,3.295730,5.383875,-1.343779,...,4.340008,4.163532,0.101050,-2.546813,-5.742349,-3.790223,7.892898,0.300802,8.944671,5.361549
4996,4.077137,-2.354803,-18.151604,-4.440123,-8.787833,-24.103703,5.541465,4.687959,9.539368,-0.653738,...,4.712374,3.635433,5.638101,7.833833,-1.241566,5.693987,12.625935,-5.403219,-0.135564,-1.851855
4997,5.468390,2.364466,-13.400492,-6.133005,-3.532374,-27.814375,-3.412852,0.081685,7.925154,-9.907500,...,7.654710,16.197803,-2.618574,5.018329,4.096011,-0.866468,7.780802,-8.816029,2.000661,1.122377
4998,0.472801,-10.924625,-8.415826,5.812143,-7.709488,-20.373467,-2.194205,-1.611080,4.954928,-7.325797,...,8.293716,4.458438,1.532285,8.818166,3.028416,0.740922,17.871133,-1.554829,0.852225,0.512098


In [13]:
# Split the projected frame into a target (column 0) and the remaining
# columns, then measure how each remaining column correlates with the target.

# X: every column of df_new except column 0
X_df_new = df_new.drop(columns=0)

# Y: column 0 (a pandas Series at this point)
Y_df_new = df_new[0]
print(Y_df_new)

# Flatten Y into a 1-D NumPy array (not a Python list) before calling np.corrcoef
Y_df_new = np.array(Y_df_new).reshape(-1)
print(X_df_new.shape,Y_df_new.shape)

list_titles = X_df_new.columns

# Absolute correlation coefficient between Y and each of (at most) the
# first 1000 columns of X; the signed value is printed, the absolute value stored.
list_corr_df_new = []
for i in list_titles[0:1000]:
    print(i)
    # Compute the coefficient once and reuse it for both the list and the
    # printout; the off-diagonal entry [0][1] of the 2x2 matrix is corr(Y, X[i]).
    corr = np.corrcoef(Y_df_new, X_df_new[i])[0][1]
    list_corr_df_new.append(abs(corr))
    print('Correlation matrix for column 0 and and column' + str(i) + ': ' + str(corr))

0        4.393873
1        6.513317
2        0.467242
3        5.234576
4       10.408715
          ...    
4995     5.887463
4996     4.077137
4997     5.468390
4998     0.472801
4999     9.074463
Name: 0, Length: 5000, dtype: float64
(5000, 407) (5000,)
1
Correlation matrix for column 0 and and column1: -0.0028870620189320596
2
Correlation matrix for column 0 and and column2: 0.007806281930038427
3
Correlation matrix for column 0 and and column3: 0.0005280609396455487
4
Correlation matrix for column 0 and and column4: 0.012219055381986484
5
Correlation matrix for column 0 and and column5: -0.0039031504486875712
6
Correlation matrix for column 0 and and column6: -0.032501077527416454
7
Correlation matrix for column 0 and and column7: 0.017670529471172803
8
Correlation matrix for column 0 and and column8: 0.004958643691837147
9
Correlation matrix for column 0 and and column9: 0.002809632746095086
10
Correlation matrix for column 0 and and column10: 0.005133677037260717
11
Correlation m

Correlation matrix for column 0 and and column165: 0.009886653147963533
166
Correlation matrix for column 0 and and column166: 5.0283927213131584e-05
167
Correlation matrix for column 0 and and column167: 0.020276822944402886
168
Correlation matrix for column 0 and and column168: -0.021262263993357903
169
Correlation matrix for column 0 and and column169: -0.02326140373973558
170
Correlation matrix for column 0 and and column170: 0.007257629821749707
171
Correlation matrix for column 0 and and column171: -0.007287459827457389
172
Correlation matrix for column 0 and and column172: -0.012114896794749745
173
Correlation matrix for column 0 and and column173: 0.02445528967985027
174
Correlation matrix for column 0 and and column174: -0.01509733411714978
175
Correlation matrix for column 0 and and column175: 0.030018909264297185
176
Correlation matrix for column 0 and and column176: -0.016208204852069065
177
Correlation matrix for column 0 and and column177: 0.025025269844965767
178
Correla

Correlation matrix for column 0 and and column293: 0.016250488326983285
294
Correlation matrix for column 0 and and column294: -0.0022392021897495533
295
Correlation matrix for column 0 and and column295: 0.00035707736984074654
296
Correlation matrix for column 0 and and column296: 0.009394383470505455
297
Correlation matrix for column 0 and and column297: -0.014146119788638544
298
Correlation matrix for column 0 and and column298: -0.023387545730737373
299
Correlation matrix for column 0 and and column299: -0.007531510996882473
300
Correlation matrix for column 0 and and column300: -0.036432601081910806
301
Correlation matrix for column 0 and and column301: 0.00950154097977583
302
Correlation matrix for column 0 and and column302: 0.028049772516251473
303
Correlation matrix for column 0 and and column303: -0.016759398932995485
304
Correlation matrix for column 0 and and column304: 0.007013892435121382
305
Correlation matrix for column 0 and and column305: 0.02272615758562774
306
Corre

In [14]:
# Tally the entries whose absolute value is above 0.01 in list_corr_df1 and
# in list_corr_df_new (the latter rebuilt by the preceding correlation cell),
# then print each tally as a percentage of its list's length.
a = len([value for value in list_corr_df1 if abs(value) > 0.01])
b = len([value for value in list_corr_df_new if abs(value) > 0.01])

share_df1 = a/len(list_corr_df1)*100
share_df_new = b/len(list_corr_df_new)*100

print("Percentage of correlations in df1:",(share_df1),"%")

print("Percentage of correlations in df_new:",(share_df_new),"%")

Percentage of correlations in df1: 46.300000000000004 %
Percentage of correlations in df_new: 44.47174447174447 %
