In [2]:
# Loading in required libraries
import pandas as pd
import seaborn as sns
import numpy as np

# Start coding here!
df = pd.read_csv("nobel.csv")

# Find the most commonly awarded gender
top_gender = df['sex'].mode()

# Find the most commonly awarded birth country
top_country = df['birth_country'].mode()

# Calculate the decade for each award
df['decade'] = (df['year'] // 10) * 10

# Calculate the ratio of US-born Nobel Prize winners to total winners for each decade
decade_counts = df['decade'].value_counts()
us_decade_counts = df[df['birth_country'] == 'USA']['decade'].value_counts()
ratio_us_decade = (us_decade_counts / decade_counts).fillna(0)

# Find the decade with the highest ratio of US-born winners
max_decade_usa = ratio_us_decade.idxmax()

# Calculate the proportion of female laureates for each decade and category combination
female_counts = df[df['sex'] == 'Female'].groupby(['decade', 'category']).size()
total_counts = df.groupby(['decade', 'category']).size()
proportion_female = (female_counts / total_counts).fillna(0)

# Find the decade and category combination with the highest proportion of female laureates
max_female_combination = proportion_female.idxmax()
max_female_dict = {max_female_combination: max_female_combination}

# Find the first woman to receive a Nobel Prize and in what category
first_woman = df[df['sex'] == 'Female'].sort_values(by='year').iloc[0]
first_woman_name = first_woman['full_name']
first_woman_category = first_woman['category']

# Find individuals or organizations that have won more than one Nobel Prize
repeat_winners = df['full_name'].value_counts()
repeat_list = repeat_winners[repeat_winners > 1].index.tolist()

print(f"The most commonly awarded gender is: {top_gender}")
print(f"The most commonly awarded birth country is: {top_country}")
print(f"The decade with the highest ratio of US-born Nobel Prize winners to total winners is: {max_decade_usa}")
print(f"The decade and category combination with the highest proportion of female laureates is: {max_female_dict}")
print(f"The first woman to receive a Nobel Prize is: {first_woman_name} in the category: {first_woman_category}")
print(f"Individuals or organizations that have won more than one Nobel Prize are: {repeat_list}")

The most commonly awarded gender is: 0    Male
Name: sex, dtype: object
The most commonly awarded birth country is: 0    United States of America
Name: birth_country, dtype: object
The decade with the highest ratio of US-born Nobel Prize winners to total winners is: 2010
The decade and category combination with the highest proportion of female laureates is: {(2020, 'Literature'): (2020, 'Literature')}
The first woman to receive a Nobel Prize is: "Marie Curie, née Sklodowska" in the category: Physics
Individuals or organizations that have won more than one Nobel Prize are: ['Comité international de la Croix Rouge (International Committee of the Red Cross)', 'Linus Carl Pauling', 'John Bardeen', 'Frederick Sanger', '"Marie Curie, née Sklodowska"', 'Office of the United Nations High Commissioner for Refugees (UNHCR)']
