### Output pandas DataFrame to LaTeX tables

Assumes the simulation summary tables (the `.tsv` files under `../tables/`) have already been generated.

The printed tables are edited afterwards in LaTeX to improve their design.

In [1]:
import seaborn as sns
import matplotlib.pyplot as plt
import numpy as np
import scipy
import pandas as pd

## Erdős–Rényi tables

In [56]:
# Settings that select which Erdos-Renyi summary file to load.
# Alternative `ne` values (swap in as needed):
#   ne = 'three-phase-2000G.ne'
#   ne = 'bottleneck-1000G.ne'
ne = 'constant-100k-2000G.ne'
size = 2000
cM = 2.0
sim = 250
rep = 500
suf = '../tables/erdosrenyi-'  # NOTE: used as a path *prefix*, despite the name
filename = f'{ne}-size{size}-cM{cM}-sim{sim}-rep{rep}'

# Read the tab-separated summary; it must have exactly six columns, which are
# relabelled here before the feature name is moved into the row index.
out = pd.read_csv(f'{suf}{filename}.tsv', sep='\t')
out.columns = ['Feature', 'Avg', 'Var', 'Min', 'Max', 'S.W.']
out = out.set_index('Feature')

# Two decimals with a thousands separator, then emit the LaTeX tabular.
outstyle = out.style.format(decimal='.', thousands=',', precision=2)
print(outstyle.to_latex())

\begin{tabular}{lrrrrr}
 & Avg & Var & Min & Max & S.W. \\
Feature &  &  &  &  &  \\
Tracts & 1,979.21 & 1,982.63 & 1,780.00 & 2,162.00 & 0.08 \\
Largest & 212.26 & 13,869.14 & 35.00 & 931.00 & 1.00 \\
Tree2 & 273.49 & 272.37 & 199.00 & 348.00 & 0.08 \\
Tree3 & 100.68 & 101.14 & 59.00 & 154.00 & 0.16 \\
Complete>= 3 & 150.06 & 149.86 & 95.00 & 211.00 & 0.17 \\
\end{tabular}



## IBD tables

In [55]:
# Settings that select which IBD structures summary file to load.
# Alternative `ne` values (swap in as needed):
#   ne = 'three-phase-2000G.ne'
#   ne = 'bottleneck-1000G.ne'
ne = 'constant-100k-2000G.ne'
size = 2000
cM = 2.0
sim = 250
rep = 500
suf = '../tables/structures-'  # NOTE: used as a path *prefix*, despite the name
filename = f'{ne}-size{size}-cM{cM}-sim{sim}-rep{rep}'

# Read the tab-separated summary; it must have exactly six columns, which are
# relabelled here before the feature name is moved into the row index.
out = pd.read_csv(f'{suf}{filename}.tsv', sep='\t')
out.columns = ['Feature', 'Avg', 'Var', 'Min', 'Max', 'S.W.']
out = out.set_index('Feature')

# Two decimals with a thousands separator, then emit the LaTeX tabular.
outstyle = out.style.format(decimal='.', thousands=',', precision=2)
print(outstyle.to_latex())

\begin{tabular}{lrrrrr}
 & Avg & Var & Min & Max & S.W. \\
Feature &  &  &  &  &  \\
Tracts & 1,954.07 & 5,534.83 & 1,639.00 & 2,304.00 & 0.24 \\
Largest & 10.43 & 3.23 & 6.00 & 27.00 & 1.00 \\
Tree2 & 502.59 & 383.90 & 415.00 & 582.00 & 0.08 \\
Tree3 & 34.44 & 33.41 & 13.00 & 63.00 & 0.67 \\
Complete>= 3 & 179.44 & 144.65 & 131.00 & 232.00 & 0.08 \\
\end{tabular}



## Selection tables

In [53]:
# Settings that select which selection (isweep) summary file to load.
# Alternative `ne` value (swap in as needed):
#   ne = 'three-phase-2000G.ne'
ne = 'constant-100k-2000G.ne'
size = 2000
cM = 3.0
sim = 250
rep = 500
# Alternative selection coefficients (swap in as needed):
#   selcoef = 0.02
#   selcoef = 0.015
#   selcoef = 0.01
selcoef = 0.005
suf = '../tables/isweepsel'  # NOTE: used as a path *prefix*, despite the name
filename = (
    f'-selcoef{selcoef}-freq0.33-{ne}'
    f'-size{size}-cM{cM}-sim{sim}-rep{rep}'
)

# Read the tab-separated summary; it must have exactly six columns, which are
# relabelled here before the feature name is moved into the row index.
out = pd.read_csv(f'{suf}{filename}.tsv', sep='\t')
out.columns = ['Feature', 'Avg', 'Var', 'Min', 'Max', 'S.W.']
out = out.set_index('Feature')

# Two decimals with a thousands separator, then emit the LaTeX tabular.
outstyle = out.style.format(decimal='.', thousands=',', precision=2)
print(outstyle.to_latex())

\begin{tabular}{lrrrrr}
 & Avg & Var & Min & Max & S.W. \\
Feature &  &  &  &  &  \\
Tracts & 1,290.81 & 2,740.70 & 1,083.00 & 1,618.00 & 0.17 \\
Largest & 8.22 & 1.97 & 5.00 & 22.00 & 1.00 \\
Tree2 & 482.86 & 347.66 & 406.00 & 564.00 & 0.04 \\
Tree3 & 29.49 & 28.50 & 11.00 & 55.00 & 0.76 \\
Complete>=3 & 136.09 & 111.95 & 83.00 & 183.00 & 0.16 \\
\end{tabular}

