# Importing necessary libraries

In [8]:
import pandas as pd
import numpy as np
from scipy.stats import ttest_ind
from scipy.stats import f_oneway
import scipy.stats as stats
from scipy.stats import pearsonr
import warnings
warnings.filterwarnings('ignore')

# Q1) T-Test: Using the teachers' rating data set, does gender affect teaching evaluation rates?

## Objective:
To test whether the mean teaching evaluation score differs between male and female instructors.

## Hypotheses:

H₀: There is no significant difference in evaluation scores between genders.

H₁: There is a significant difference in evaluation scores between genders.

## Test Used:
Independent Samples t-test

In [9]:
# Load the teachers' rating data; later cells reuse `df`.
df = pd.read_csv("/content/teachers_rating_dataset.csv")

# Split the evaluation scores into one sample per gender using boolean masks.
is_male = df['Gender'].eq('Male')
is_female = df['Gender'].eq('Female')
male_eval = df.loc[is_male, 'Rating']
female_eval = df.loc[is_female, 'Rating']

# Independent two-sample t-test comparing the mean rating of the two groups.
t_stat, p_val = ttest_ind(male_eval, female_eval)
print("T-Statistic:", t_stat)
print("P-Value:", p_val)

T-Statistic: 1.4837493604624215
P-Value: 0.1405416278044922


Interpretation:

p-value (≈ 0.141) ≥ 0.05, so we fail to reject H₀ → there is no statistically significant evidence that mean evaluation scores differ between male and female instructors.

# Q2. ANOVA: Using the teachers' rating data set, does beauty score for instructors differ by age?

## Objective:
To check whether beauty scores differ significantly across different age groups.

## Hypotheses:

H₀: Mean beauty scores are equal across all age groups.

H₁: At least one group has a different mean beauty score.

## Test Used:
One-way ANOVA

In [10]:
# Bucket instructors into decade-wide age groups. pd.cut uses right-closed
# intervals by default, so '20s' holds ages in (20, 30], '30s' holds (30, 40],
# and so on; a missing Age or one outside (20, 70] gets a NaN group.
df['age_group'] = pd.cut(df['Age'], bins=[20,30,40,50,60,70], labels=['20s','30s','40s','50s','60s'])

# Rows without an age group cannot take part in the ANOVA. Report them rather
# than dropping them silently (nothing is printed when every row is binned).
n_unbinned = int(df['age_group'].isna().sum())
if n_unbinned:
    print("Rows excluded from ANOVA (Age missing or outside the bins):", n_unbinned)

# One Beauty sample per non-empty age group. groupby skips the NaN group, and
# observed=True skips labels that have no rows, so no manual emptiness check
# or per-label boolean filter is needed.
grouped = [scores for _, scores in df.groupby('age_group', observed=True)['Beauty']]

# One-way ANOVA across the age-group samples.
f_stat, p_val = f_oneway(*grouped)
print("F-Statistic:", f_stat)
print("P-Value:", p_val)


F-Statistic: 1.0055310276264144
P-Value: 0.39304586245221135


Interpretation:

p-value (≈ 0.393) ≥ 0.05, so we fail to reject H₀ → there is no statistically significant difference in mean beauty scores across the age groups.

# Q3. Chi-square: Using the teachers' rating data set, is there an association between tenure and gender?

## Objective:
To test whether tenure and gender are independent or associated.

## Hypotheses:

H₀: Tenure and gender are independent.

H₁: There is an association between tenure and gender.

## Test Used:
Chi-square test of independence

In [11]:
# Observed counts for every Tenure x Gender combination.
contingency_table = pd.crosstab(index=df['Tenure'], columns=df['Gender'])

# Chi-square test of independence on the observed counts. The call also
# returns the degrees of freedom and the expected frequencies.
chi2, p, dof, expected = stats.chi2_contingency(observed=contingency_table)
print("Chi-square:", chi2)
print("P-Value:", p)

Chi-square: 0.5661505300293848
P-Value: 0.4517926608589078


Interpretation:

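p-value (≈ 0.452) ≥ 0.05, so we fail to reject H₀ → there is no statistically significant evidence of an association between tenure and gender.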

# Q4. Correlation: Using the teachers' rating dataset, is teaching evaluation score correlated with beauty score?

## Objective:
To test whether there is a linear relationship between evaluation and beauty.

## Hypotheses:

H₀: There is no correlation between evaluation and beauty.

H₁: There is a correlation between evaluation and beauty.

## Test Used:
Pearson Correlation Coefficient

In [12]:
# Pearson correlation between teaching evaluation scores and beauty scores,
# together with the p-value for the null hypothesis of no correlation.
rating_scores = df['Rating']
beauty_scores = df['Beauty']
corr, p_val = pearsonr(rating_scores, beauty_scores)
print("Correlation Coefficient:", corr)
print("P-Value:", p_val)


Correlation Coefficient: -0.032977031987411566
P-Value: 0.7206715414451285


Interpretation:

p-value (≈ 0.721) > 0.05, so we fail to reject H₀ → there is no statistically significant linear correlation between evaluation and beauty scores.

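The sample coefficient is slightly negative (r ≈ −0.033), but it is very close to zero and not statistically significant, so it should not be read as evidence of a negative relationship.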