# Exome Aggregation Consortium CNV Map & eQTLs

### Background

Enrichment for eQTLs of genes affected by CNVs according to ExAC exome sequencing data

### Imports

In [2]:
import pandas as pd
import re
import os.path

### Functions

In [2]:
def removeGeneIDVersions(text):
    """Return the first Ensembl gene ID found in ``text`` without its version suffix.

    Example: ``'ENSG00000138131.3'`` -> ``'ENSG00000138131'``.

    Parameters
    ----------
    text : str
        String containing an ``ENSG<digits>`` identifier, optionally followed
        by a ``.<version>`` suffix or other characters.

    Returns
    -------
    str
        The ``ENSG<digits>`` part of the first identifier in ``text``.

    Raises
    ------
    IndexError
        If ``text`` contains no ``ENSG<digits>`` token. The exception type is
        unchanged from the earlier ``re.findall(...)[0]`` implementation; it
        now carries a message naming the offending value.
    """
    # Raw string: in a plain literal '\d' is an invalid escape sequence, which
    # newer Python versions warn about.
    match = re.search(r'ENSG\d+', text)
    if match is None:
        raise IndexError('no Ensembl gene ID (ENSG<digits>) found in %r' % (text,))
    return match.group(0)

### Input/Output files

---

### Prepare CNV data

ExAC CNV gene scores available from ftp://ftp.broadinstitute.org/pub/ExAC_release/release0.3.1/cnv/exac-final-cnv.gene.scores071316

In [3]:
# Read the tab-separated ExAC per-gene CNV score table.
ExAC = pd.read_csv(
    '../datasets/ExACCNVGenes/exac-final-cnv.gene.scores071316.txt',
    sep='\t',
)
# Derive a version-free gene ID (e.g. 'ENSG00000138131.3' -> 'ENSG00000138131')
# to use as the join key against the other tables.
ExAC['Ensembl Gene ID'] = ExAC['gene'].map(removeGeneIDVersions)
ExAC.head(n=5)

Unnamed: 0,gene,chr,start,end,gene_symbol,mean_rd,gc_content,complexity,cds_len,gene_length,...,dup,del.sing,dup.sing,del.sing.score,dup.sing.score,del.score,dup.score,cnv.score,flag,Ensembl Gene ID
0,ENSG00000138131.3,10,100007447,100028007,LOXL4,68.73759,0.599301,168.214286,2355,20560,...,2,1,0,-0.343404,0.618145,0.163146,0.339478,0.339117,0,ENSG00000138131
1,ENSG00000119943.6,10,100143322,100174941,PYROXD2,84.115106,0.586477,116.0,1856,31619,...,0,1,0,-0.022225,0.918334,0.422492,1.23837,1.104569,0,ENSG00000119943
2,ENSG00000107521.14,10,100175955,100206684,HPS1,91.062743,0.607213,129.176471,2196,30729,...,0,0,0,1.035914,1.026984,1.078684,1.327732,1.533227,0,ENSG00000107521
3,ENSG00000172987.8,10,100218875,100995619,HPSE2,101.726677,0.494474,145.230769,1888,776744,...,0,1,0,0.566906,1.521308,0.68056,1.280794,1.246748,0,ENSG00000172987
4,ENSG00000119946.9,10,101088856,101154087,CNNM1,48.409783,0.547731,274.272727,3017,65231,...,1,1,1,-0.82642,-0.573062,-0.207902,0.371796,0.220174,0,ENSG00000119946


In [4]:
# List every column of the ExAC table, including the derived 'Ensembl Gene ID'.
ExAC.columns

Index(['gene', 'chr', 'start', 'end', 'gene_symbol', 'mean_rd', 'gc_content',
       'complexity', 'cds_len', 'gene_length', 'num_targ', 'segdups', 'dip',
       'del', 'dup', 'del.sing', 'dup.sing', 'del.sing.score',
       'dup.sing.score', 'del.score', 'dup.score', 'cnv.score', 'flag',
       'Ensembl Gene ID'],
      dtype='object')

In [5]:
# Number of rows in the ExAC table.
ExAC.shape[0]

15734

In [6]:
# Summary statistics of the numeric ExAC columns, computed separately per chromosome.
ExAC.groupby('chr').describe()

Unnamed: 0_level_0,cds_len,cds_len,cds_len,cds_len,cds_len,cds_len,cds_len,cds_len,cnv.score,cnv.score,...,segdups,segdups,start,start,start,start,start,start,start,start
Unnamed: 0_level_1,count,mean,std,min,25%,50%,75%,max,count,mean,...,75%,max,count,mean,std,min,25%,50%,75%,max
chr,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2,Unnamed: 9_level_2,Unnamed: 10_level_2,Unnamed: 11_level_2,Unnamed: 12_level_2,Unnamed: 13_level_2,Unnamed: 14_level_2,Unnamed: 15_level_2,Unnamed: 16_level_2,Unnamed: 17_level_2,Unnamed: 18_level_2,Unnamed: 19_level_2,Unnamed: 20_level_2,Unnamed: 21_level_2
1,1698.0,1855.590695,1742.782637,138.0,921.0,1423.5,2275.5,28379.0,1698.0,0.091826,...,0.0,3.0,1698.0,115047400.0,75317030.0,860260.0,40442077.75,114496938.5,171653100.0,249200395.0
2,1044.0,2046.978927,1746.983571,138.0,1004.5,1549.5,2522.25,14796.0,1044.0,-0.048687,...,0.0,5.0,1044.0,125101600.0,75093080.0,38814.0,61376666.25,114179190.0,198467200.0,242811752.0
3,956.0,1964.401674,1562.574109,162.0,970.5,1573.0,2431.25,13360.0,956.0,0.22028,...,0.0,3.0,956.0,96677740.0,58061680.0,3111233.0,47621003.75,100067910.0,142204900.0,197676858.0
4,630.0,1957.147619,1783.697117,180.0,939.75,1468.5,2500.5,15939.0,630.0,-0.070909,...,0.0,8.0,630.0,89599880.0,55696830.0,264464.0,46782862.25,84352790.5,140187900.0,189060573.0
5,734.0,1968.121253,1726.853363,168.0,948.25,1561.0,2479.0,19706.0,734.0,0.222072,...,0.0,14.0,734.0,109371800.0,51500730.0,140373.0,68517857.25,130670400.0,148747600.0,180681417.0
6,899.0,1834.938821,2097.678605,165.0,807.0,1357.0,2072.5,29261.0,899.0,0.097688,...,0.0,2.0,899.0,68423700.0,48621530.0,485133.0,30777587.0,43612783.0,111237900.0,170884383.0
7,724.0,1868.828729,1641.149832,57.0,911.5,1487.5,2364.25,15715.0,724.0,-0.053805,...,1.0,8.0,724.0,84933610.0,47347270.0,536895.0,42967964.25,95307338.5,128356700.0,158820866.0
8,538.0,1963.704461,1766.31234,218.0,972.5,1431.5,2364.0,14901.0,538.0,-0.017002,...,0.0,2.0,538.0,76694000.0,44635660.0,182137.0,37625510.5,74771868.0,117927400.0,146155744.0
9,646.0,1911.30031,1594.896898,170.0,900.5,1365.5,2426.75,11061.0,646.0,-0.01924,...,0.0,3.0,646.0,92747190.0,44687670.0,470291.0,37511302.75,107534860.5,131005000.0,140513444.0
10,623.0,1946.951846,1542.118266,248.0,1026.0,1494.0,2404.0,14015.0,623.0,0.084499,...,0.0,5.0,623.0,75995540.0,38428460.0,180405.0,45099843.0,85954410.0,104172700.0,135192695.0


In [7]:
# Distribution of the 'dip' column over all rows.
# NOTE(review): presumably the per-gene count of diploid (copy-neutral) samples; confirm against the ExAC CNV README.
ExAC['dip'].describe()

count    15734.000000
mean     58975.659845
std        162.401432
min      57455.000000
25%      58891.000000
50%      58992.000000
75%      59075.000000
max      59885.000000
Name: dip, dtype: float64

In [8]:
# Distribution of the 'dup' column over all rows.
# NOTE(review): presumably the per-gene count of duplications; confirm against the ExAC CNV README.
ExAC['dup'].describe()

count    15734.000000
mean         6.648786
std         18.125443
min          0.000000
25%          1.000000
50%          2.000000
75%          6.000000
max        454.000000
Name: dup, dtype: float64

In [9]:
# Distribution of the 'del' column over all rows.
# NOTE(review): presumably the per-gene count of deletions; confirm against the ExAC CNV README.
ExAC['del'].describe()

count    15734.000000
mean         3.108809
std         12.514256
min          0.000000
25%          0.000000
50%          1.000000
75%          3.000000
max        512.000000
Name: del, dtype: float64

* Note: ExAC CNV data are only available for autosomes.

### eQTL affected tissues per gene

In [10]:
# Load the per-gene table of tissue counts ('expressedTissues') for genes tested for eQTLs.
genesTestedForeQTLsWithNumberOfTissues = pd.read_csv(
    '../outputFiles/GTExV7/genesTestedWithNumberOfTissues.csv',
)
genesTestedForeQTLsWithNumberOfTissues.head(n=5)

Unnamed: 0,expressedTissues,Ensembl Gene ID
0,48,ENSG00000272186
1,48,ENSG00000117748
2,48,ENSG00000130856
3,48,ENSG00000169446
4,48,ENSG00000013573


In [11]:
# Load the equivalent per-gene tissue-count table built on merged tissues.
genesTestedForeQTLsWithNumberOfMergedTissues = pd.read_csv(
    '../outputFiles/GTExV7/genesTestedWithNumberOfMergedTissues.csv',
)
genesTestedForeQTLsWithNumberOfMergedTissues.head(n=5)

Unnamed: 0,expressedTissues,Ensembl Gene ID
0,26,ENSG00000170604
1,26,ENSG00000178458
2,26,ENSG00000141425
3,26,ENSG00000117115
4,26,ENSG00000105204


In [12]:
# Load the tab-separated Ensembl gene list with chromosome, coordinates and strand.
PCGenes = pd.read_csv(
    '../datasets/geneLists/Ensembl/EnsV75ProteinCodingGenes1-Y.txt',
    sep='\t',
)
PCGenes.head(n=5)

Unnamed: 0,Ensembl Gene ID,Chromosome Name,Gene Start (bp),Gene End (bp),Strand
0,ENSG00000215405,15,20737094,20747114,-1
1,ENSG00000268343,15,21004687,21005367,1
2,ENSG00000230031,15,21040701,21071643,-1
3,ENSG00000138593,15,49280673,49338760,-1
4,ENSG00000268531,15,22011370,22012050,1


In [13]:
# Keep only tested genes that also appear in PCGenes, attaching their coordinates.
# NOTE: both names are rebound to the merged result, so re-running this cell
# without reloading the inputs merges PCGenes in a second time.
genesTestedForeQTLsWithNumberOfTissues = genesTestedForeQTLsWithNumberOfTissues.merge(
    PCGenes,
    how='inner',
    on="Ensembl Gene ID",
)
genesTestedForeQTLsWithNumberOfMergedTissues = genesTestedForeQTLsWithNumberOfMergedTissues.merge(
    PCGenes,
    how='inner',
    on="Ensembl Gene ID",
)

In [14]:
# Row count after restricting to genes present in PCGenes.
genesTestedForeQTLsWithNumberOfTissues.shape[0]

19067

In [17]:
# Remove chromosome X genes from both tested-gene tables, in place.
# NOTE(review): only 'X' is filtered. If the gene list also holds chromosome Y
# genes (its file name ends in "1-Y"), they stay in these tables; confirm
# whether that is intended given the autosome-only ExAC data.
for testedGenes in (
    genesTestedForeQTLsWithNumberOfTissues,
    genesTestedForeQTLsWithNumberOfMergedTissues,
):
    chrXRows = testedGenes[testedGenes['Chromosome Name'] == 'X'].index
    testedGenes.drop(chrXRows, inplace=True)

In [18]:
# Row count after removing chromosome X genes.
genesTestedForeQTLsWithNumberOfTissues.shape[0]

18301

##### Bonferroni-corrected

In [27]:
# Load the per-gene 'affectedTissues' counts for the Bonferroni-corrected eQTL calls.
# The first CSV column is the saved row index.
genesWitheQTLTissueCountBonferroni = pd.read_csv(
    '../outputFiles/GTExV7/genesWithNumberOfBonferroniAffectedTissues.csv',
    index_col=0,
)
genesWitheQTLTissueCountBonferroni.head(n=5)

Unnamed: 0,Ensembl Gene ID,affectedTissues
0,ENSG00000138593,4
1,ENSG00000166351,1
2,ENSG00000168675,1
3,ENSG00000188992,13
4,ENSG00000185272,8


In [28]:
# Right join: keep every tested gene. Genes missing from the eQTL table get
# NaN in 'affectedTissues'.
genesWitheQTLTissueCountBonferroni = genesWitheQTLTissueCountBonferroni.merge(
    genesTestedForeQTLsWithNumberOfTissues,
    how='right',
    on='Ensembl Gene ID',
)
genesWitheQTLTissueCountBonferroni

Unnamed: 0,Ensembl Gene ID,affectedTissues,expressedTissues,Chromosome Name,Gene Start (bp),Gene End (bp),Strand
0,ENSG00000138593,4.0,48,15,49280673,49338760,-1
1,ENSG00000166351,1.0,1,21,14982498,15013906,1
2,ENSG00000168675,1.0,47,18,13217497,13652754,1
3,ENSG00000188992,13.0,30,21,15481134,15583166,-1
4,ENSG00000185272,8.0,48,21,15588451,15600693,1
5,ENSG00000182974,1.0,1,15,22368478,22369561,1
6,ENSG00000155304,1.0,48,21,15743436,15755805,-1
7,ENSG00000153575,8.0,48,15,22833395,22873892,1
8,ENSG00000180530,2.0,48,21,16333556,16437321,-1
9,ENSG00000137824,9.0,48,15,41028082,41048049,-1


In [29]:
# Tested genes with no entry in the eQTL table have NaN here after the right
# join; count them as 0 affected tissues.
# Assign the result back instead of calling fillna(inplace=True) on the column
# selection: that chained in-place form is deprecated and does not update the
# parent frame under pandas Copy-on-Write.
genesWitheQTLTissueCountBonferroni['affectedTissues'] = genesWitheQTLTissueCountBonferroni['affectedTissues'].fillna(0)

##### Tested for CNV

In [30]:
# Inner join: keep only genes that also have a row in the ExAC CNV table.
genesWitheQTLTissueCountBonferroni = genesWitheQTLTissueCountBonferroni.merge(
    ExAC,
    how='inner',
    on='Ensembl Gene ID',
)

In [31]:
# Display the merged eQTL + ExAC table (pandas truncates long frames in the rendered output).
genesWitheQTLTissueCountBonferroni

Unnamed: 0,Ensembl Gene ID,affectedTissues,expressedTissues,Chromosome Name,Gene Start (bp),Gene End (bp),Strand,gene,chr,start,...,del,dup,del.sing,dup.sing,del.sing.score,dup.sing.score,del.score,dup.score,cnv.score,flag
0,ENSG00000138593,4.0,48,15,49280673,49338760,-1,ENSG00000138593.4,15,49280673,...,0,0,0,0,1.006221,0.976367,1.092999,1.275552,1.523702,0
1,ENSG00000168675,1.0,47,18,13217497,13652754,1,ENSG00000168675.14,18,13217497,...,0,3,0,0,0.620675,0.737930,0.723574,-0.029705,0.297903,0
2,ENSG00000185272,8.0,48,21,15588451,15600693,1,ENSG00000185272.9,21,15588451,...,0,9,0,0,0.187194,0.266138,0.728772,-1.183084,-0.702303,1
3,ENSG00000155304,1.0,48,21,15743436,15755805,-1,ENSG00000155304.4,21,15743436,...,0,3,0,0,0.416765,0.407245,0.962883,0.202447,0.548186,0
4,ENSG00000180530,2.0,48,21,16333556,16437321,-1,ENSG00000180530.5,21,16333556,...,0,0,0,0,0.093782,0.097961,0.577557,0.553032,0.719674,0
5,ENSG00000137824,9.0,48,15,41028082,41048049,-1,ENSG00000137824.11,15,41028082,...,3,2,3,0,-1.590585,0.776270,-0.421097,0.534328,0.192307,0
6,ENSG00000137880,1.0,48,15,41056218,41059906,1,ENSG00000137880.4,15,41056218,...,0,2,0,0,-0.066143,-0.003908,0.323604,0.019842,0.207774,0
7,ENSG00000104129,9.0,48,15,41060067,41099675,-1,ENSG00000104129.5,15,41060067,...,0,3,0,0,0.648261,0.707249,0.779957,0.110761,0.418014,0
8,ENSG00000177150,4.0,48,18,13663346,13726662,-1,ENSG00000177150.8,18,13663346,...,1,4,0,0,0.344554,0.375130,0.364536,-0.110495,0.069348,1
9,ENSG00000155313,1.0,48,21,17102344,17252377,1,ENSG00000155313.11,21,17102344,...,1,3,1,2,0.642495,0.144497,1.087454,0.740681,0.981162,0


In [32]:
# Flag each gene: 'Y' if it has any deletion or duplication count, 'N' only
# when both 'del' and 'dup' are zero.
genesWitheQTLTissueCountBonferroni['CNV'] = 'Y'
genesWitheQTLTissueCountBonferroni.loc[
    (genesWitheQTLTissueCountBonferroni['del'] == 0)
    & (genesWitheQTLTissueCountBonferroni['dup'] == 0),
    'CNV',
] = 'N'

In [37]:
# Ratio of 'affectedTissues' to 'expressedTissues' for each gene.
genesWitheQTLTissueCountBonferroni['propOfExpressedAffectedByeQTL'] = (
    genesWitheQTLTissueCountBonferroni['affectedTissues']
    .div(genesWitheQTLTissueCountBonferroni['expressedTissues'])
)

In [38]:
# Summary statistics of the numeric columns, split by CNV flag ('N' vs 'Y').
genesWitheQTLTissueCountBonferroni.groupby('CNV').describe()

Unnamed: 0_level_0,Gene End (bp),Gene End (bp),Gene End (bp),Gene End (bp),Gene End (bp),Gene End (bp),Gene End (bp),Gene End (bp),Gene Start (bp),Gene Start (bp),...,segdups,segdups,start,start,start,start,start,start,start,start
Unnamed: 0_level_1,count,mean,std,min,25%,50%,75%,max,count,mean,...,75%,max,count,mean,std,min,25%,50%,75%,max
CNV,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2,Unnamed: 9_level_2,Unnamed: 10_level_2,Unnamed: 11_level_2,Unnamed: 12_level_2,Unnamed: 13_level_2,Unnamed: 14_level_2,Unnamed: 15_level_2,Unnamed: 16_level_2,Unnamed: 17_level_2,Unnamed: 18_level_2,Unnamed: 19_level_2,Unnamed: 20_level_2,Unnamed: 21_level_2
N,1813.0,79451950.0,55635940.0,683385.0,38069245.0,59486827.0,117956726.0,244220778.0,1813.0,79404690.0,...,0.0,12.0,1813.0,79404690.0,55626970.0,676392.0,38059189.0,59475296.0,117816444.0,244214585.0
Y,13337.0,74470310.0,56052040.0,46870.0,31732622.0,58671688.0,111349466.0,249214145.0,13337.0,74394830.0,...,0.0,14.0,13337.0,74394830.0,56044100.0,38814.0,31667450.0,58570607.0,111286889.0,249200395.0


In [39]:
# Same per-CNV-flag summary, restricted to rows whose 'affectedTissues' is above zero.
genesWitheQTLTissueCountBonferroni.loc[
    genesWitheQTLTissueCountBonferroni['affectedTissues'].gt(0)
].groupby('CNV').describe()

Unnamed: 0_level_0,Gene End (bp),Gene End (bp),Gene End (bp),Gene End (bp),Gene End (bp),Gene End (bp),Gene End (bp),Gene End (bp),Gene Start (bp),Gene Start (bp),...,segdups,segdups,start,start,start,start,start,start,start,start
Unnamed: 0_level_1,count,mean,std,min,25%,50%,75%,max,count,mean,...,75%,max,count,mean,std,min,25%,50%,75%,max
CNV,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2,Unnamed: 9_level_2,Unnamed: 10_level_2,Unnamed: 11_level_2,Unnamed: 12_level_2,Unnamed: 13_level_2,Unnamed: 14_level_2,Unnamed: 15_level_2,Unnamed: 16_level_2,Unnamed: 17_level_2,Unnamed: 18_level_2,Unnamed: 19_level_2,Unnamed: 20_level_2,Unnamed: 21_level_2
N,1416.0,80341110.0,55483750.0,1036979.0,38287485.5,62167084.0,119286000.0,244220778.0,1416.0,80288210.0,...,0.0,12.0,1416.0,80288210.0,55472870.0,1031808.0,38249332.75,62117134.5,119256900.0,244214585.0
Y,11341.0,74473600.0,56086890.0,46870.0,31605548.0,59838601.0,111366000.0,249153343.0,11341.0,74392630.0,...,0.0,14.0,11341.0,74392630.0,56078670.0,38814.0,31535157.0,59710800.0,111293800.0,249144205.0


In [40]:
# Write the annotated Bonferroni table to disk (row index included by default).
# NOTE(review): the file is tab-separated despite its .csv extension, so readers must pass sep='\t'.
genesWitheQTLTissueCountBonferroni.to_csv("../outputFiles/genesWitheQTLTissueCountBonferroniAndCNVExACStatus.csv", sep='\t')

##### Metasoft

In [42]:
# Metasoft eQTL calls: the same steps as the Bonferroni section, in one cell.

# Load per-gene 'affectedTissues' counts; the first CSV column is the saved row index.
genesWitheQTLTissueCountMetasoft = pd.read_csv('../outputFiles/GTExV7/genesWithNumberOfMetasoftAffectedTissues.csv', index_col = 0)

# Right join: keep every tested gene; genes missing from the eQTL table get NaN.
genesWitheQTLTissueCountMetasoft = pd.merge(genesWitheQTLTissueCountMetasoft, genesTestedForeQTLsWithNumberOfTissues, on='Ensembl Gene ID', how='right')

# Count those missing genes as 0 affected tissues. Assign back instead of
# calling fillna(inplace=True) on the column selection: that chained in-place
# form is deprecated and does not update the parent frame under pandas
# Copy-on-Write.
genesWitheQTLTissueCountMetasoft['affectedTissues'] = genesWitheQTLTissueCountMetasoft['affectedTissues'].fillna(0)

# Inner join: keep only genes that also have a row in the ExAC CNV table.
genesWitheQTLTissueCountMetasoft = pd.merge(genesWitheQTLTissueCountMetasoft, ExAC, on='Ensembl Gene ID', how='inner')

# Flag genes with any deletion or duplication count as 'Y', all others as 'N'.
genesWitheQTLTissueCountMetasoft['CNV'] = 'N'
genesWitheQTLTissueCountMetasoft.loc[(genesWitheQTLTissueCountMetasoft['del'] != 0) | (genesWitheQTLTissueCountMetasoft['dup'] != 0) , 'CNV'] = 'Y'

# Ratio of 'affectedTissues' to 'expressedTissues' for each gene.
genesWitheQTLTissueCountMetasoft['propOfExpressedAffectedByeQTL'] = genesWitheQTLTissueCountMetasoft['affectedTissues'] / genesWitheQTLTissueCountMetasoft['expressedTissues']
genesWitheQTLTissueCountMetasoft

Unnamed: 0,Ensembl Gene ID,affectedTissues,expressedTissues,Chromosome Name,Gene Start (bp),Gene End (bp),Strand,gene,chr,start,...,del.sing,dup.sing,del.sing.score,dup.sing.score,del.score,dup.score,cnv.score,flag,CNV,propOfExpressedAffectedByeQTL
0,ENSG00000138593,24.0,48,15,49280673,49338760,-1,ENSG00000138593.4,15,49280673,...,0,0,1.006221,0.976367,1.092999,1.275552,1.523702,0,N,0.500000
1,ENSG00000168675,10.0,47,18,13217497,13652754,1,ENSG00000168675.14,18,13217497,...,0,0,0.620675,0.737930,0.723574,-0.029705,0.297903,0,Y,0.212766
2,ENSG00000185272,48.0,48,21,15588451,15600693,1,ENSG00000185272.9,21,15588451,...,0,0,0.187194,0.266138,0.728772,-1.183084,-0.702303,1,Y,1.000000
3,ENSG00000155304,23.0,48,21,15743436,15755805,-1,ENSG00000155304.4,21,15743436,...,0,0,0.416765,0.407245,0.962883,0.202447,0.548186,0,Y,0.479167
4,ENSG00000166200,44.0,48,15,49398268,49447858,-1,ENSG00000166200.10,15,49398268,...,0,0,0.888225,0.898726,0.989254,1.167378,1.407464,0,N,0.916667
5,ENSG00000155307,4.0,48,21,15857549,15955723,-1,ENSG00000155307.13,21,15857549,...,1,1,-0.156759,0.002268,0.617652,-0.134204,0.146159,1,Y,0.083333
6,ENSG00000180530,12.0,48,21,16333556,16437321,-1,ENSG00000180530.5,21,16333556,...,0,0,0.093782,0.097961,0.577557,0.553032,0.719674,0,N,0.250000
7,ENSG00000137824,47.0,48,15,41028082,41048049,-1,ENSG00000137824.11,15,41028082,...,3,0,-1.590585,0.776270,-0.421097,0.534328,0.192307,0,Y,0.979167
8,ENSG00000137880,3.0,48,15,41056218,41059906,1,ENSG00000137880.4,15,41056218,...,0,0,-0.066143,-0.003908,0.323604,0.019842,0.207774,0,Y,0.062500
9,ENSG00000104129,48.0,48,15,41060067,41099675,-1,ENSG00000104129.5,15,41060067,...,0,0,0.648261,0.707249,0.779957,0.110761,0.418014,0,Y,1.000000


In [43]:
# Summary statistics of the numeric columns, split by CNV flag ('N' vs 'Y').
genesWitheQTLTissueCountMetasoft.groupby('CNV').describe()

Unnamed: 0_level_0,Gene End (bp),Gene End (bp),Gene End (bp),Gene End (bp),Gene End (bp),Gene End (bp),Gene End (bp),Gene End (bp),Gene Start (bp),Gene Start (bp),...,segdups,segdups,start,start,start,start,start,start,start,start
Unnamed: 0_level_1,count,mean,std,min,25%,50%,75%,max,count,mean,...,75%,max,count,mean,std,min,25%,50%,75%,max
CNV,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2,Unnamed: 9_level_2,Unnamed: 10_level_2,Unnamed: 11_level_2,Unnamed: 12_level_2,Unnamed: 13_level_2,Unnamed: 14_level_2,Unnamed: 15_level_2,Unnamed: 16_level_2,Unnamed: 17_level_2,Unnamed: 18_level_2,Unnamed: 19_level_2,Unnamed: 20_level_2,Unnamed: 21_level_2
N,1813.0,79451950.0,55635940.0,683385.0,38069245.0,59486827.0,117956726.0,244220778.0,1813.0,79404690.0,...,0.0,12.0,1813.0,79404690.0,55626970.0,676392.0,38059189.0,59475296.0,117816444.0,244214585.0
Y,13337.0,74470310.0,56052040.0,46870.0,31732622.0,58671688.0,111349466.0,249214145.0,13337.0,74394830.0,...,0.0,14.0,13337.0,74394830.0,56044100.0,38814.0,31667450.0,58570607.0,111286889.0,249200395.0


In [44]:
# Same per-CNV-flag summary, restricted to rows whose 'affectedTissues' is above zero.
genesWitheQTLTissueCountMetasoft.loc[
    genesWitheQTLTissueCountMetasoft['affectedTissues'].gt(0)
].groupby('CNV').describe()

Unnamed: 0_level_0,Gene End (bp),Gene End (bp),Gene End (bp),Gene End (bp),Gene End (bp),Gene End (bp),Gene End (bp),Gene End (bp),Gene Start (bp),Gene Start (bp),...,segdups,segdups,start,start,start,start,start,start,start,start
Unnamed: 0_level_1,count,mean,std,min,25%,50%,75%,max,count,mean,...,75%,max,count,mean,std,min,25%,50%,75%,max
CNV,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2,Unnamed: 9_level_2,Unnamed: 10_level_2,Unnamed: 11_level_2,Unnamed: 12_level_2,Unnamed: 13_level_2,Unnamed: 14_level_2,Unnamed: 15_level_2,Unnamed: 16_level_2,Unnamed: 17_level_2,Unnamed: 18_level_2,Unnamed: 19_level_2,Unnamed: 20_level_2,Unnamed: 21_level_2
N,1716.0,79319990.0,55901730.0,683385.0,37566692.25,59575849.5,117599500.0,244220778.0,1716.0,79271810.0,...,0.0,12.0,1716.0,79271810.0,55891590.0,676392.0,37546510.0,59551686.5,117574187.0,244214585.0
Y,12769.0,74631590.0,56078700.0,46870.0,31869769.0,59070327.0,111349500.0,249214145.0,12769.0,74553730.0,...,0.0,14.0,12769.0,74553730.0,56070700.0,38814.0,31802385.0,59024897.0,111286889.0,249200395.0


In [45]:
# Write the annotated Metasoft table to disk (row index included by default).
# NOTE(review): the file is tab-separated despite its .csv extension, so readers must pass sep='\t'.
genesWitheQTLTissueCountMetasoft.to_csv("../outputFiles/genesWitheQTLTissueCountMetasoftAndCNVExACStatus.csv", sep='\t')