## LaTeX Tables

**For figures, see the R script**

In [1]:
import pandas as pd

In [2]:
# Load the model-comparison results, give the columns their presentation
# names, drop the unweighted random-sample column, and round to two decimals.
# Written as a single chain so the cell never mutates a frame in place.
tab1 = (
    pd.read_csv("../tabs/table_1.csv")
    .rename(
        columns={
            "Models": "Model",
            "Complete Test set": "Test Set",
            "3k weighted unique random": "Weighted Random (3k)",
            "Bottom - 3k": "Bottom-3k",
        }
    )
    .drop(columns="3k unique random")
    .round(2)
)
tab1

Unnamed: 0,Model,Test Set,Weighted Random (3k),Top-3k,Bottom-3k
0,RNN,65.27,65.4,62.7,62.3
1,LSTM,75.91,75.36,73.1,72.4
2,GRU,85.3,84.13,82.4,81.96


In [3]:
# Build the Styler for the model-comparison table. Styler methods configure
# the object and return it, so the whole setup is one parenthesised chain.
tab1_style = (
    tab1.style
    # Show the four accuracy columns with one decimal place.
    .format(
        subset=["Test Set", "Weighted Random (3k)", "Top-3k", "Bottom-3k"],
        precision=1,
    )
    # Escape LaTeX-special characters in the column headers and row labels.
    .format_index(escape="latex", axis=1)
    .format_index(escape="latex", axis=0)
    # Leave the row index out of the rendered table.
    .hide(level=0, axis=0)
)

# Render the styled table to LaTeX source (captioned, labelled, centred,
# with horizontal rules).
tab1_tex = tab1_style.to_latex(
    caption="Accuracy of Different Models on the Test Set",
    label="model_comparison",
    position_float="centering",
    hrules=True,
    multicol_align="|c|",
    convert_css=True,
)

In [4]:
# Save the LaTeX source of the model-comparison table. The context manager
# closes the file even if the write raises, so no handle is leaked.
with open("../tabs/model_comparison.tex", "w") as f:
    f.write(tab1_tex)

In [5]:
# Load the per-state accuracy table and normalise the state labels:
# capitalise the first letter, then expand abbreviated labels to full names.
tab2 = pd.read_csv("../tabs/stratified_by_state.csv")
tab2["state"] = tab2["state"].str.capitalize()

# Abbreviated label (as it looks after capitalisation) -> full state name.
# Labels not listed here pass through rename_categories unchanged.
# NOTE(review): 'Dadra' and 'Daman' are not expanded, and 'Uttaranchal' is the
# former name of Uttarakhand -- confirm these are the intended table labels.
state_full_names = {
    "Andaman": "Andaman and Nicobar",
    "Andhra": "Andhra Pradesh",
    "Arunachal": "Arunachal Pradesh",
    "Guj": "Gujarat",
    "Har": "Haryana",
    "Jk": "Jammu and Kashmir",
    "Jha": "Jharkhand",
    "Kar": "Karnataka",
    "Mp": "Madhya Pradesh",
    "Odi": "Odisha",
    "Tel": "Telangana",  # was misspelled "Telengana"
    "Up": "Uttar Pradesh",
    "Utt": "Uttaranchal",
}
tab2["state"] = (
    tab2["state"].astype("category").cat.rename_categories(state_full_names)
)
tab2

Unnamed: 0,state,RNN,LSTM,GRU
0,Andaman and Nicobar,50.2,69.2,66.9
1,Andhra Pradesh,65.2,70.1,80.4
2,Arunachal Pradesh,60.0,81.7,81.2
3,Assam,73.4,93.6,89.0
4,Bihar,25.7,36.5,90.2
5,Chandigarh,18.6,23.3,88.4
6,Dadra,69.7,76.9,79.7
7,Daman,44.8,50.9,61.1
8,Delhi,22.4,36.2,37.6
9,Goa,34.5,48.1,53.5


In [6]:
# Build the Styler for the per-state accuracy table. Styler methods configure
# the object and return it, so the whole setup is one parenthesised chain.
tab2_style = (
    tab2.style
    # Show the three model columns with one decimal place.
    .format(subset=["RNN", "LSTM", "GRU"], precision=1)
    # Leave the row index out of the rendered table.
    .hide(level=0, axis=0)
    # Escape LaTeX-special characters in the column headers and row labels.
    .format_index(escape="latex", axis=1)
    .format_index(escape="latex", axis=0)
)

# Render the styled table to LaTeX source (captioned, labelled, centred,
# with horizontal rules).
tab2_tex = tab2_style.to_latex(
    caption="Accuracy of Different Models By State of Residence",
    label="accuracy_by_state",
    position_float="centering",
    hrules=True,
    multicol_align="|c|",
    convert_css=True,
)

In [7]:
# Save the LaTeX source of the per-state accuracy table. The context manager
# closes the file even if the write raises, so no handle is leaked.
with open("../tabs/accuracy_by_state.tex", "w") as f:
    f.write(tab2_tex)