# In [None]:
import pandas as pd

def _percent_rich(rows):
    """Return the percentage of *rows* whose 'salary' is '>50K' (NaN when *rows* is empty)."""
    total = len(rows)
    if total == 0:
        # An empty group has no defined ratio; NaN matches what pandas'
        # .mean() yields for an empty selection elsewhere in this report.
        return float('nan')
    return (len(rows[rows['salary'] == '>50K']) / total) * 100


def analyze_demographics(file_path) -> dict:
    """Compute summary statistics from a demographic CSV.

    The CSV is loaded with ``pd.read_csv(file_path)`` and must provide the
    columns 'race', 'sex', 'age', 'education', 'salary', 'hours-per-week',
    'native-country' and 'occupation'.

    Returns:
        A dict with these keys:

        * ``race_counts`` - Series of row counts per 'race' value.
        * ``average_age_men`` - mean 'age' of rows where 'sex' is 'Male'.
        * ``percent_bachelors`` - percent of rows with 'education' equal to
          'Bachelors'.
        * ``percent_higher_edu_rich`` - percent earning '>50K' among rows with
          Bachelors/Masters/Doctorate education.
        * ``percent_lower_edu_rich`` - the same percent among all other rows.
        * ``min_hours`` - smallest 'hours-per-week' value.
        * ``rich_percentage_min_hours`` - percent earning '>50K' among rows
          that work ``min_hours``.
        * ``top_country`` / ``top_country_percentage`` - the 'native-country'
          with the highest share of '>50K' earners, and that share.
        * ``top_occupation_india`` - most frequent 'occupation' among '>50K'
          earners whose 'native-country' is 'India'.

        Percentages and the average age are rounded to one decimal. A
        percentage over an empty group is NaN; ``top_country`` and
        ``top_occupation_india`` are ``None`` when no row qualifies.
    """
    data = pd.read_csv(file_path)

    # Reused by every country/occupation filter below.
    is_rich = data['salary'] == '>50K'

    race_counts = data['race'].value_counts()

    average_age_men = data.loc[data['sex'] == 'Male', 'age'].mean()

    # The mean of a boolean mask is the fraction of True values.
    percent_bachelors = (data['education'] == 'Bachelors').mean() * 100

    higher_edu = ['Bachelors', 'Masters', 'Doctorate']
    has_higher_edu = data['education'].isin(higher_edu)
    percent_higher_edu_rich = _percent_rich(data[has_higher_edu])
    percent_lower_edu_rich = _percent_rich(data[~has_higher_edu])

    min_hours = data['hours-per-week'].min()
    min_workers = data[data['hours-per-week'] == min_hours]
    rich_percentage_min_hours = _percent_rich(min_workers)

    country_counts = data['native-country'].value_counts()
    rich_by_country = data.loc[is_rich, 'native-country'].value_counts()
    # Countries without any '>50K' earner are missing from rich_by_country and
    # come out of the aligned division as NaN; drop them so the lookup below
    # is well defined even when no country has a rich earner.
    rich_percentage_country = ((rich_by_country / country_counts) * 100).dropna()
    if rich_percentage_country.empty:
        top_country = None
        top_country_percentage = float('nan')
    else:
        top_country = rich_percentage_country.idxmax()
        top_country_percentage = round(rich_percentage_country.max(), 1)

    rich_indians = data[(data['native-country'] == 'India') & is_rich]
    # mode() returns an empty Series when there is nothing to count, so
    # indexing its first element unconditionally would raise.
    occupation_modes = rich_indians['occupation'].mode()
    top_occupation_india = None if occupation_modes.empty else occupation_modes.iloc[0]

    return {
        'race_counts': race_counts,
        'average_age_men': round(average_age_men, 1),
        'percent_bachelors': round(percent_bachelors, 1),
        'percent_higher_edu_rich': round(percent_higher_edu_rich, 1),
        'percent_lower_edu_rich': round(percent_lower_edu_rich, 1),
        'min_hours': min_hours,
        'rich_percentage_min_hours': round(rich_percentage_min_hours, 1),
        'top_country': top_country,
        'top_country_percentage': top_country_percentage,
        'top_occupation_india': top_occupation_india,
    }
if __name__ == "__main__":
    # Script entry point: analyze the CSV in the working directory and print
    # every metric as "name: value", one per line.
    summary = analyze_demographics('demographic_data.csv')
    for metric in summary:
        print(f"{metric}: {summary[metric]}")
