In [7]:
"""
T-Test (Small Sample, n = 10)

Dataset: t_test_data.csv
Industry Standard (μ0) = 50,000
Population Std Dev = Unknown → Use t-test
Significance Level (α) = 0.05

Questions:
1. Two-tailed test: Test whether the average salary of employees differs from the industry standard of $50,000.
   H0: μ = 50,000
   H1: μ ≠ 50,000

2. One-tailed test (Left-tailed): Test whether the average salary of employees is less than $50,000.
   H0: μ ≥ 50,000
   H1: μ < 50,000
"""

import pandas as pd
import numpy as np
from scipy import stats

# Load the sample; the "Salary" column holds the observations under test.
t_data = pd.read_csv("t_test_data.csv")

mu_0 = 50000  # hypothesised population mean (H0)
alpha = 0.05  # significance level

# Drop missing values once so that the mean, the standard deviation and the
# sample size all describe the same observations: pandas' mean()/std() skip
# NaN, whereas len(t_data) would still count those rows and distort both the
# standard error and the degrees of freedom.
salary_sample = t_data["Salary"].dropna()

n = len(salary_sample)
if n < 2:
    # With fewer than two observations the sample standard deviation (and
    # therefore the t-statistic) is undefined; fail loudly instead of
    # silently propagating NaN into a "fail to reject" message.
    raise ValueError(
        f"A one-sample t-test needs at least 2 observations, got {n}"
    )

sample_mean = salary_sample.mean()
sample_std = salary_sample.std(ddof=1)  # ddof=1 -> sample (n - 1) estimator

# t = (x_bar - mu_0) / (s / sqrt(n)), with n - 1 degrees of freedom.
t_stat = (sample_mean - mu_0) / (sample_std / np.sqrt(n))

# Two-tailed: probability mass in both tails beyond |t|.  The survival
# function sf(x) = 1 - cdf(x) is evaluated directly, which avoids the
# cancellation error of computing 1 - cdf(x) for large |t|.
p_value_two_tailed = 2 * stats.t.sf(abs(t_stat), df=n - 1)

# Left-tailed (H1: mu < mu_0): probability of a t value at or below the
# observed one.
p_value_one_tailed = stats.t.cdf(t_stat, df=n - 1)

# --- Summary of the sample and the test statistic ---
print("=== T-Test Results ===")
print(f"Sample Mean: {sample_mean:.2f}, Sample Std Dev: {sample_std:.2f}, n = {n}")
print(f"T-statistic: {t_stat:.4f}")

# --- Two-tailed decision (H1: mean differs from 50,000) ---
# H0 is rejected only when the p-value is strictly below alpha.
print(f"\nTwo-tailed p-value: {p_value_two_tailed:.4f}")
print(
    "➡ Reject H0: Mean salary differs from 50,000"
    if p_value_two_tailed < alpha
    else "➡ Fail to reject H0: No significant difference"
)

# --- Left-tailed decision (H1: mean is below 50,000) ---
print(f"\nOne-tailed p-value: {p_value_one_tailed:.4f}")
print(
    "➡ Reject H0: Mean salary is less than 50,000"
    if p_value_one_tailed < alpha
    else "➡ Fail to reject H0: Not enough evidence mean < 50,000"
)


=== T-Test Results ===
Sample Mean: 51250.00, Sample Std Dev: 1844.66, n = 10
T-statistic: 2.1429

Two-tailed p-value: 0.0607
➡ Fail to reject H0: No significant difference

One-tailed p-value: 0.9696
➡ Fail to reject H0: Not enough evidence mean < 50,000
