# In [None]:
import numpy as np
import fetchmaker
from scipy.stats import binom_test
from scipy.stats import f_oneway
from statsmodels.stats.multicomp import pairwise_tukeyhsd
from scipy.stats import chi2_contingency

# Fetch the rottweiler tail-length sample, then print its mean followed by
# its standard deviation (np.std defaults to ddof=0, the population form).
rottweiler_tl = fetchmaker.get_tail_length("rottweiler")
for statistic in (np.mean, np.std):
    print(statistic(rottweiler_tl))

# DATA TO THE RESCUE

# Test whether the observed share of rescued whippets is consistent with a
# null-hypothesis proportion of 0.08.
whippet_rescue = fetchmaker.get_is_rescue("whippet")

# Count of non-zero entries (presumably 1 marks a rescue and 0 a non-rescue;
# confirm against fetchmaker).
num_whippet_rescues = np.count_nonzero(whippet_rescue)
print(num_whippet_rescues)

# Total number of samples in the whippet set.
num_whippets = np.size(whippet_rescue)
print(num_whippets)

# scipy.stats.binom_test was deprecated in SciPy 1.10 and removed in 1.12.
# Its replacement, binomtest (available since SciPy 1.7), returns a result
# object whose .pvalue attribute holds the same two-sided p-value.
# NOTE(review): the top-level `from scipy.stats import binom_test` still
# fails to import on SciPy >= 1.12; drop it once nothing else uses it.
from scipy.stats import binomtest

pval = binomtest(num_whippet_rescues, n=num_whippets, p=0.08).pvalue
print(pval)


# SIZE DOES MATTER

# Weight samples for the three breeds under comparison.
whippets_weights = fetchmaker.get_weight("whippet")
terriers_weights = fetchmaker.get_weight("terrier")
pitbulls_weights = fetchmaker.get_weight("pitbull")

# Pair every sample with the group label it carries into the post-hoc test.
weights_by_breed = (
    ("whippet", whippets_weights),
    ("terrier", terriers_weights),
    ("pitbull", pitbulls_weights),
)

# One-way ANOVA (F-test) across the three samples; only the p-value is kept.
anova_result = f_oneway(whippets_weights, terriers_weights, pitbulls_weights)
pval_anova = anova_result.pvalue
print(pval_anova)

# Tukey's HSD needs one pooled array of observations plus a parallel list
# naming the group each observation came from, in the same order.
dog_weights = np.concatenate([sample for _, sample in weights_by_breed])
labels = [
    breed
    for breed, sample in weights_by_breed
    for _ in range(len(sample))
]
tukey_results = pairwise_tukeyhsd(endog=dog_weights, groups=labels, alpha=0.05)
print(tukey_results)


# CATEGORICAL DOG TEST

poodle_colors = fetchmaker.get_color("poodle")
shihtzu_colors = fetchmaker.get_color("shihtzu")

# Contingency table with one [poodle_count, shihtzu_count] row per colour.
# NOTE(review): `breed_colors == color` only counts matches element-wise if
# fetchmaker returns NumPy arrays (or similar); confirm against fetchmaker.
color_table = [
    [
        np.count_nonzero(breed_colors == color)
        for breed_colors in (poodle_colors, shihtzu_colors)
    ]
    for color in ("black", "brown", "gold", "gray", "white")
]
# Keep the per-colour rows available under their individual names.
num_black, num_brown, num_gold, num_gray, num_white = color_table
print(color_table)

# Chi-square test of independence; index 1 of the result is the p-value.
col_pval = chi2_contingency(color_table)[1]
print(col_pval)





