### POPULATION AND SAMPLE
---

### Libraries

In [1]:
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np

np.random.seed(10)

### Functions

In [2]:
def get_statistics(pd_series, sample=0):
    '''
    input: pandas Series object and sample (ddof for variance and std)
    output: list containing mean, var and std
    description: calculates the statistics for a population of numbers
    '''
    mean = pd_series.mean()
    var = pd_series.var(ddof=sample)
    std = pd_series.std(ddof=sample)
    return [mean, var, std]
    

In [3]:
def print_statistics(statistics, rounded_cases=4):
    '''
    input: get_statistics output (list) and number of desired cases (int)
    output: 
    description: print the statistics for a population of numbers
    '''
    print("Mean is: {0}".format(round(statistics[0], rounded_cases)))
    print("Var is: {0}".format(round(statistics[1], rounded_cases)))
    print("Std is: {0}".format(round(statistics[2], rounded_cases)))

### Analisys

In [4]:
population = [np.random.randint(10, 100) for i in range(10)] 
data = pd.DataFrame({"Population": population})

In [5]:
statistics = get_statistics(data["Population"], sample=0)
print_statistics(statistics)

Mean is: 45.5
Var is: 833.85
Std is: 28.8765


In [6]:
with_replacement = data["Population"].sample(5, replace=False)
statistics = get_statistics(with_replacement, sample=1)
print_statistics(statistics)

Mean is: 54.2
Var is: 580.7
Std is: 24.0977
