In [1]:
%matplotlib inline
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from drs_sentani import get_survey
survey = get_survey()
import pysentani as sti

We can use `value_counts` to get a quick summary of how many households reported each village name. `value_counts` returns a pandas Series indexed by village name, ordered from the most to the least frequently reported village.

In [14]:
# Tally how many survey rows carry each village name; the resulting
# Series is displayed as the cell's output.
(
    survey['village_name']
    .value_counts()
)

Ayapo           120
Sosiri           96
Puai             74
Flafow           71
Babrongko        67
Simporo          62
Yakonde          59
Kheleubulow      52
Donday           50
Yoboi            49
Abar             46
Yokiwa           43
Kampung_Baru     36
Ebunfauw         36
Atamali          35
Yobeh            34
Kalio            30
Kwadeware        30
Asei             29
Yoka             28
Evale            22
Hobong           20
Kensio           19
Khageuw          16
Ajau             14
Khamayakha       14
Pantai_Yahim     13
Obolyo           11
Burawai           8
dtype: int64

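If we convert this Series into a DataFrame, we can call its `to_latex()` method, which returns a string containing a LaTeX `tabular` environment. The column header `0` in the output below appears because the counts column has no name. If we save this string to a file, the paper could read it in.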

In [15]:
# Turn the per-village counts into a one-column frame and print the
# LaTeX source that to_latex() generates for it.
print(
    survey['village_name']
    .value_counts()
    .to_frame()
    .to_latex()
)

\begin{tabular}{lr}
\toprule
{} &    0 \\
\midrule
Ayapo        &  120 \\
Sosiri       &   96 \\
Puai         &   74 \\
Flafow       &   71 \\
Babrongko    &   67 \\
Simporo      &   62 \\
Yakonde      &   59 \\
Kheleubulow  &   52 \\
Donday       &   50 \\
Yoboi        &   49 \\
Abar         &   46 \\
Yokiwa       &   43 \\
Kampung\_Baru &   36 \\
Ebunfauw     &   36 \\
Atamali      &   35 \\
Yobeh        &   34 \\
Kalio        &   30 \\
Kwadeware    &   30 \\
Asei         &   29 \\
Yoka         &   28 \\
Evale        &   22 \\
Hobong       &   20 \\
Kensio       &   19 \\
Khageuw      &   16 \\
Ajau         &   14 \\
Khamayakha   &   14 \\
Pantai\_Yahim &   13 \\
Obolyo       &   11 \\
Burawai      &    8 \\
\bottomrule
\end{tabular}



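We can also use the `tabulate` library to produce a pipe-delimited table that we can paste into a Markdown document. No `headers` argument is passed here, so the output starts directly with the alignment row; add a header row above it if your Markdown renderer requires one.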

In [23]:
from tabulate import tabulate

# Print the per-village counts as a pipe-delimited table.
# NOTE(review): no headers= argument is given, so the printed table has
# no header row and begins with the column-alignment line.
print(
    tabulate(
        survey['village_name'].value_counts().to_frame(),
        tablefmt='pipe',
    )
)

|:-------------|----:|
| Ayapo        | 120 |
| Sosiri       |  96 |
| Puai         |  74 |
| Flafow       |  71 |
| Babrongko    |  67 |
| Simporo      |  62 |
| Yakonde      |  59 |
| Kheleubulow  |  52 |
| Donday       |  50 |
| Yoboi        |  49 |
| Abar         |  46 |
| Yokiwa       |  43 |
| Kampung_Baru |  36 |
| Ebunfauw     |  36 |
| Atamali      |  35 |
| Yobeh        |  34 |
| Kalio        |  30 |
| Kwadeware    |  30 |
| Asei         |  29 |
| Yoka         |  28 |
| Evale        |  22 |
| Hobong       |  20 |
| Kensio       |  19 |
| Khageuw      |  16 |
| Ajau         |  14 |
| Khamayakha   |  14 |
| Pantai_Yahim |  13 |
| Obolyo       |  11 |
| Burawai      |   8 |
