In [1]:
import requests
from bs4 import BeautifulSoup

url = "https://en.wikipedia.org/wiki/List_of_Nobel_laureates#List_of_laureates"

response = requests.get(url)
response.raise_for_status()

soup = BeautifulSoup(response.text, 'html.parser')

tables = soup.find_all("table", {"class": "wikitable"})

links = []
for table in tables:
    for a_tag in table.find_all("a", href=True):
        href = a_tag["href"]
        # Ensure the link points to a Wikipedia article
        if href.startswith("/wiki/") and not href.startswith("/wiki/File:"):
            links.append("https://en.wikipedia.org" + href)

unique_links = sorted(set(links))

for link in unique_links:
    print(link)


https://en.wikipedia.org/wiki/%C3%89lie_Ducommun
https://en.wikipedia.org/wiki/%C3%89lie_Metchnikoff
https://en.wikipedia.org/wiki/%C3%93scar_Arias
https://en.wikipedia.org/wiki/14th_Dalai_Lama
https://en.wikipedia.org/wiki/Aage_Bohr
https://en.wikipedia.org/wiki/Aaron_Ciechanover
https://en.wikipedia.org/wiki/Aaron_Klug
https://en.wikipedia.org/wiki/Abdulrazak_Gurnah
https://en.wikipedia.org/wiki/Abdus_Salam
https://en.wikipedia.org/wiki/Abhijit_Banerjee
https://en.wikipedia.org/wiki/Abiy_Ahmed
https://en.wikipedia.org/wiki/Ada_Yonath
https://en.wikipedia.org/wiki/Adam_Riess
https://en.wikipedia.org/wiki/Adolf_Butenandt
https://en.wikipedia.org/wiki/Adolf_Windaus
https://en.wikipedia.org/wiki/Adolf_von_Baeyer
https://en.wikipedia.org/wiki/Adolfo_P%C3%A9rez_Esquivel
https://en.wikipedia.org/wiki/Ahmed_Zewail
https://en.wikipedia.org/wiki/Akira_Suzuki_(chemist)
https://en.wikipedia.org/wiki/Akira_Yoshino
https://en.wikipedia.org/wiki/Al_Gore
https://en.wikipedia.org/wiki/Alain_Aspect
ht

In [2]:
def scrape_education(url):
    response = requests.get(url)
    response.raise_for_status()

    soup = BeautifulSoup(response.text, 'html.parser')

    infobox = soup.find("table", {"class": "infobox"})
    if not infobox:
        return "Infobox not found."

    for row in infobox.find_all("tr"):
        header = row.find("th")
        if header and "Education" in header.text:
            education_data = row.find("td")
            if education_data:
                return education_data.get_text(separator="\n").strip()
            else:
                return "Education section is empty."

    return "Education section not found in the infobox."

url = "https://en.wikipedia.org/wiki/Bill_Gates"
education = scrape_education(url)
print(education)


Harvard University
 (dropped out)


In [3]:
import requests
from bs4 import BeautifulSoup

IVY_LEAGUE_COLLEGES = [
    "Harvard University", "Yale University", "Princeton University",
    "Columbia University", "University of Pennsylvania", "Dartmouth College",
    "Brown University", "Cornell University"
]

# Step 1: Scrape all Wikipedia links for Nobel laureates
def get_nobel_laureate_links():
    url = "https://en.wikipedia.org/wiki/List_of_Nobel_laureates#List_of_laureates"
    response = requests.get(url)
    response.raise_for_status()
    soup = BeautifulSoup(response.text, 'html.parser')

    tables = soup.find_all("table", {"class": "wikitable"})

    links = []
    for table in tables:
        for a_tag in table.find_all("a", href=True):
            href = a_tag["href"]
            # Ensure the link points to a Wikipedia article
            if href.startswith("/wiki/") and not href.startswith("/wiki/File:"):
                links.append("https://en.wikipedia.org" + href)

    return sorted(set(links))  # Remove duplicates and sort links

# Step 2: Scrape the education field from a person's Wikipedia page
def scrape_education(url):
    response = requests.get(url)
    response.raise_for_status()
    soup = BeautifulSoup(response.text, 'html.parser')

    # Check for infobox
    infobox = soup.find("table", {"class": "infobox"})
    if infobox:
        for row in infobox.find_all("tr"):
            header = row.find("th")
            if header and "Education" in header.text:
                education_data = row.find("td")
                if education_data:
                    education_text = education_data.get_text(separator="\n").strip()
                    for college in IVY_LEAGUE_COLLEGES:
                        if college in education_text:
                            return "ivy"
                    return "noivy"

    # If no education in the infobox, scan the entire page for Ivy League colleges
    page_text = soup.get_text()
    for college in IVY_LEAGUE_COLLEGES:
        if college in page_text:
            return "ivy"

    # Default response if no Ivy League colleges are found
    return "noivy"

# Step 3: Iterate through all laureate links and count Ivy vs No Ivy
def main():
    laureate_links = get_nobel_laureate_links()
    ivy_winner = 0
    noivy_winner = 0

    for link in laureate_links:
        try:
            print(f"Scraping: {link}")
            education = scrape_education(link)
            if education == "ivy":
                ivy_winner += 1
                print(f"Education: Ivy League winner")
            else:
                noivy_winner += 1
                print(f"Education: No Ivy League affiliation")
        except Exception as e:
            print(f"Error scraping {link}: {e}")

    print(f"\nSummary:")
    print(f"Ivy League winners: {ivy_winner}")
    print(f"No Ivy League affiliation: {noivy_winner}")

if __name__ == "__main__":
    main()

Scraping: https://en.wikipedia.org/wiki/%C3%89lie_Ducommun
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/%C3%89lie_Metchnikoff
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/%C3%93scar_Arias
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/14th_Dalai_Lama
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Aage_Bohr
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Aaron_Ciechanover
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Aaron_Klug
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Abdulrazak_Gurnah
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Abdus_Salam
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Abhijit_Banerjee
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Abiy_Ahmed
Education: No Ivy League affiliation
Scraping: https://en.w

Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Aung_San_Suu_Kyi
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Austen_Chamberlain
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Avram_Hershko
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Aziz_Sancar
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Barack_Obama
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Barbara_McClintock
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Barry_Barish
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Barry_Marshall
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Baruch_Samuel_Blumberg
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Baruj_Benacerraf
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Ben_Bernanke
Education: Ivy League winn

Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Dario_Fo
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Daron_Acemoglu
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/David_Baker_(biochemist)
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/David_Baltimore
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/David_Card
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/David_Gross
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/David_H._Hubel
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/David_J._Thouless
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/David_J._Wineland
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/David_Julius
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/David_Lee_(physicist)
Education: Ivy League winne

Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Felix_Bloch
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Feodor_Lynen
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Ferdinand_Buisson
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Ferenc_Krausz
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Ferid_Murad
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Finn_E._Kydland
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Fr%C3%A9d%C3%A9ric_Joliot-Curie
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Fr%C3%A9d%C3%A9ric_Mistral
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Fr%C3%A9d%C3%A9ric_Passy
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Fran%C3%A7ois_Englert
Education: Ivy League winner
Scraping: https://en.wikip

Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Guglielmo_Marconi
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Guido_Imbens
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Gunnar_Myrdal
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Gustaf_Dal%C3%A9n
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Gustav_Ludwig_Hertz
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Gustav_Stresemann
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/H._Robert_Horvitz
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Haldan_Keffer_Hartline
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Halld%C3%B3r_Laxness
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Hamilton_O._Smith
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Han_Kang
Education: 

Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/J._J._Thomson
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/J._M._Coetzee
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/J._M._G._Le_Cl%C3%A9zio
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/J._Michael_Bishop
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Jacinto_Benavente
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Jack_Kilby
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Jack_Steinberger
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Jack_W._Szostak
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Jacobus_Henricus_van_%27t_Hoff
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Jacques_Dubochet
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wi

Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Joseph_L._Goldstein
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Joseph_Murray
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Joseph_Rotblat
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Joseph_Stiglitz
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Joshua_Angrist
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Joshua_Lederberg
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Juan_Manuel_Santos
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Juan_Ram%C3%B3n_Jim%C3%A9nez
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Jules_A._Hoffmann
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Jules_Bordet
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Julian_Schwinger
Educatio

Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Maria_Ressa
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Marie_Curie
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Mario_Capecchi
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Mario_J._Molina
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Mario_Vargas_Llosa
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Marshall_Warren_Nirenberg
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Martin_Chalfie
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Martin_Evans
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Martin_Karplus
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Martin_Lewis_Perl
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Martin_Luther_King_Jr.
Education: No Ivy League affiliation
Scra

Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Owen_Willans_Richardson
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/P%C3%A4r_Lagerkvist
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Pablo_Neruda
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Patrick_Blackett
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Patrick_Modiano
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Patrick_White
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Paul_Berg
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Paul_D._Boyer
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Paul_Dirac
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Paul_Ehrlich
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Paul_Flory
Education: Ivy League 

Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Robert_Bruce_Merrifield
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Robert_Burns_Woodward
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Robert_C._Merton
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Robert_Cecil,_1st_Viscount_Cecil_of_Chelwood
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Robert_Coleman_Richardson
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Robert_Curl
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Robert_Edwards_(physiologist)
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Robert_F._Engle
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Robert_F._Furchgott
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Robert_Fogel
Education: Ivy League winner
Scraping: https://en.wikipedia.o

Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Takaaki_Kajita
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Tasuku_Honjo
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Tawakel_Karman
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Theodor_Mommsen
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Theodor_Svedberg
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Theodor_W._H%C3%A4nsch
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Theodore_Roosevelt
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Theodore_Schultz
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Theodore_William_Richards
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Thomas_A._Steitz
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki

Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Wolfgang_Paul
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Wolfgang_Pauli
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Woodrow_Wilson
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/World_Food_Programme
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Yang_Chen-Ning
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Yasser_Arafat
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Yasunari_Kawabata
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Yitzhak_Rabin
Education: Ivy League winner
Scraping: https://en.wikipedia.org/wiki/Yoichiro_Nambu
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Yoshinori_Ohsumi
Education: No Ivy League affiliation
Scraping: https://en.wikipedia.org/wiki/Yuan_T._Lee
Education: No Ivy League affili

In [5]:
ivy_winner / (noivy_winner + ivy_winner)

NameError: name 'ivy_winner' is not defined