In [1]:
import numpy as np
import pandas as pd
from scipy import stats

In [2]:
# Seed NumPy's global (legacy) random generator so the simulated dataset
# drawn in the following cells is the same on every fresh run.
np.random.seed(seed=42)

In [3]:
# Group A is the control arm: candidates who used the standard interview
# preparation. Each of the 100 entries is a single Bernoulli trial
# (1 = success, 0 = failure) drawn with a 55% success probability.
group_a = np.random.binomial(n=1, p=0.55, size=100)

In [4]:
# Group B is the treatment arm: candidates who used the new interview prep
# strategy. Each of the 100 entries is a single Bernoulli trial
# (1 = success, 0 = failure) drawn with a 65% success probability.
group_b = np.random.binomial(n=1, p=0.65, size=100)

In [6]:
# Stack both arms into one long-format frame: one row per candidate, with the
# arm label in 'group' and the 0/1 outcome in 'success'. Group A rows come
# first, followed by Group B rows, matching the order of the concatenation.
data = pd.DataFrame(
    dict(
        group=[
            label
            for label, outcomes in (('A', group_a), ('B', group_b))
            for _ in outcomes
        ],
        success=np.concatenate((group_a, group_b)),
    )
)

In [7]:
# The mean of a 0/1 outcome column is the share of successes, so a single
# grouped mean yields both success rates. Selecting ['A', 'B'] explicitly
# fixes the order in which the two values are unpacked.
success_rate_a, success_rate_b = (
    data.groupby('group')['success'].mean().loc[['A', 'B']]
)

print(f"Success rate for Group A: {success_rate_a:.2f}")
print(f"Success rate for Group B: {success_rate_b:.2f}")

Success rate for Group A: 0.59
Success rate for Group B: 0.66


In [8]:
# Two-sided Welch's t-test on the 0/1 outcomes of the two groups.
# equal_var=False is used because the variance of a binary outcome is tied to
# its success rate, so groups with different rates should not be assumed to
# share a variance (the pooled-variance default makes that assumption).
# NOTE(review): for binary outcomes a two-proportion z-test or a chi-square
# test of independence is the more conventional choice; consider switching.
t_stat, p_value = stats.ttest_ind(
    data.loc[data['group'] == 'A', 'success'],
    data.loc[data['group'] == 'B', 'success'],
    equal_var=False,
)

print(f"T-statistic: {t_stat:.2f}")
print(f"P-value: {p_value:.4f}")

T-statistic: -1.02
P-value: 0.3090


In [9]:
# Decision rule at the 5% significance level: report a significant difference
# only when the p-value falls strictly below alpha; otherwise report that the
# null hypothesis could not be rejected.
alpha = 0.05
print(
    "We reject the null hypothesis, there's a significant difference between the two groups."
    if p_value < alpha
    else "We fail to reject the null hypothesis, no significant difference between the two groups."
)

We fail to reject the null hypothesis, no significant difference between the two groups.
