## **Pruebas de hipótesis en Python**

In [9]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
import scipy.stats as st
from scipy.stats import f_oneway
from scipy.stats import ttest_ind

In [3]:
url = 'https://archive.ics.uci.edu/ml/machine-learning-databases/iris/iris.data'
names = ['sepal-lenght', 'sepal-width', 'petal-lenght', 'petal-width', 'class']
data = pd.read_csv(url, names=names)
data.head()

Unnamed: 0,sepal-lenght,sepal-width,petal-lenght,petal-width,class
0,5.1,3.5,1.4,0.2,Iris-setosa
1,4.9,3.0,1.4,0.2,Iris-setosa
2,4.7,3.2,1.3,0.2,Iris-setosa
3,4.6,3.1,1.5,0.2,Iris-setosa
4,5.0,3.6,1.4,0.2,Iris-setosa


### **Estándar error**

[![t-student.png](https://i.postimg.cc/XNcJ5C9w/t-student.png)](https://postimg.cc/5jybdj70)

In [4]:
# Error estándar
standard_error_length = data['sepal-lenght'].std() / np.sqrt(10)
print("Error estándar de length %.2f" % standard_error_length)

standard_error_width = data['sepal-width'].std() / np.sqrt(10)
print("Error estándar de width %.2f" % standard_error_width)

Error estándar de length 0.26
Error estándar de width 0.14


### **Desvío estándar**

[![desvio-est-ndar.png](https://i.postimg.cc/4xrP9qT2/desvio-est-ndar.png)](https://postimg.cc/CRsbyv5b)

In [5]:
# Desvío estándar
standard_deviation = np.sqrt((standard_error_length**2) + (standard_error_width**2))
print("Desvío estándar %.2f" % standard_deviation)

Desvío estándar 0.30


## **Prueba de t-Student**

[![t-student.png](https://i.postimg.cc/3xg4tcvc/t-student.png)](https://postimg.cc/4Yxxdww6)

In [6]:
# Prueba de t-Student
t_stat = (data['sepal-lenght'].mean() - data['sepal-width'].mean()) / standard_deviation
print("Prueba de t-Student %.2f" % t_stat)

Prueba de t-Student 9.44


In [7]:
p = ttest_ind(data['sepal-lenght'], data['sepal-width'])
p

Ttest_indResult(statistic=36.548157693982006, pvalue=3.987838114848222e-112)

### **Correlación y Coeficiente de Pearson**

In [8]:
correlation = data['sepal-lenght'].corr(data['sepal-width'])
print('Coeficiente de correlación %.2f' % correlation)

Coeficiente de correlación -0.11


In [12]:
pearson = st.pearsonr(data['sepal-lenght'], data['sepal-width'])
print('Coeficiente de Pearson %.2f' % pearson[0])

Coeficiente de Pearson -0.11


### **Análisis de la varianza (ANOVA)**

In [13]:
anova = f_oneway(data['sepal-lenght'], data['sepal-width'])
anova

F_onewayResult(statistic=1335.7678308241748, pvalue=3.9878381148486907e-112)