## 1. Import Relevant Libraries¶

In [1]:
!pip install requests
!pip install beautifulsoup4



## 2. Perform HTTP Request¶

In [14]:
import requests
from bs4 import BeautifulSoup
import pandas as pd

In [16]:
url = "https://en.wikipedia.org/wiki/Apple_Inc."
response = requests.get(url)
html_content = response.text

## 3. Check the Request Status

In [17]:
if response.status_code == 200:
    print("Request successful!")

Request successful!


## 4. Build the Extraction Model

In [18]:
soup = BeautifulSoup(html_content, 'html.parser')

In [21]:
soup = BeautifulSoup(html_content, 'html.parser')

## 5. Extract Headings¶

In [22]:
headings = [heading.text.strip() for heading in soup.find_all(['h1', 'h2', 'h3'])]
print(headings)

['Contents', 'Apple Inc.', 'History', '1976–1980: Founding and incorporation', '1980–1990: Success with Macintosh', '1990–1997: Decline and restructuring', '1997–2007: Return to profitability', '2007–2011: Success with mobile devices', '2011–present: Post-Jobs era, Tim Cook', 'Products', 'Mac', 'iPhone', 'iPad', 'Other products', 'Services', 'Marketing', 'Branding', 'Advertising', 'Stores', 'Market power', 'Privacy', 'Corporate affairs', 'Business trends', 'Leadership', 'Ownership', 'Corporate culture', 'Offices', 'Litigation', 'Finances', 'Taxes', 'Charity', 'Environment', 'Apple Energy', 'Energy and resources', 'Toxins', 'Green bonds', 'Supply chain', 'Worker organizations', 'Democratic Republic of the Congo', 'See also', 'Notes', 'References', 'Bibliography', 'Further reading', 'External links']


## 6. Extract All Paragraphs¶

In [23]:
paragraphs = [p.text.strip() for p in soup.find_all('p')]
print(paragraphs)

['', 'Apple Inc. is an American multinational corporation and technology company headquartered in Cupertino, California, in Silicon Valley. It is best known for its consumer electronics, software, and services. Founded in 1976 as Apple Computer Company by Steve Jobs, Steve Wozniak and Ronald Wayne, the company was incorporated by Jobs and Wozniak as Apple Computer, Inc. the following year. It was renamed Apple Inc. in 2007 as the company had expanded its focus from computers to consumer electronics. Apple is the largest technology company by revenue, with US$391.04\xa0billion in the 2024 fiscal year.', 'The company was founded to produce and market Wozniak\'s Apple I personal computer. Its second computer, the Apple II, became a best seller as one of the first mass-produced microcomputers. Apple introduced the Lisa in 1983 and the Macintosh in 1984, as some of the first computers to use a graphical user interface and a mouse. By 1985, internal company problems led to Jobs leaving to fo

In [24]:
paragraphs = [p.text.strip() for p in soup.find_all('p')]
print(paragraphs)

['', 'Apple Inc. is an American multinational corporation and technology company headquartered in Cupertino, California, in Silicon Valley. It is best known for its consumer electronics, software, and services. Founded in 1976 as Apple Computer Company by Steve Jobs, Steve Wozniak and Ronald Wayne, the company was incorporated by Jobs and Wozniak as Apple Computer, Inc. the following year. It was renamed Apple Inc. in 2007 as the company had expanded its focus from computers to consumer electronics. Apple is the largest technology company by revenue, with US$391.04\xa0billion in the 2024 fiscal year.', 'The company was founded to produce and market Wozniak\'s Apple I personal computer. Its second computer, the Apple II, became a best seller as one of the first mass-produced microcomputers. Apple introduced the Lisa in 1983 and the Macintosh in 1984, as some of the first computers to use a graphical user interface and a mouse. By 1985, internal company problems led to Jobs leaving to fo

## 7. Extract All Links

In [48]:
links = [a['href'] for a in soup.find_all('a', href = True)]
print(links)

['#bodyContent', '/wiki/Main_Page', '/wiki/Wikipedia:Contents', '/wiki/Portal:Current_events', '/wiki/Special:Random', '/wiki/Wikipedia:About', '//en.wikipedia.org/wiki/Wikipedia:Contact_us', '/wiki/Help:Contents', '/wiki/Help:Introduction', '/wiki/Wikipedia:Community_portal', '/wiki/Special:RecentChanges', '/wiki/Wikipedia:File_upload_wizard', '/wiki/Special:SpecialPages', '/wiki/Main_Page', '/wiki/Special:Search', 'https://donate.wikimedia.org/?wmf_source=donate&wmf_medium=sidebar&wmf_campaign=en.wikipedia.org&uselang=en', '/w/index.php?title=Special:CreateAccount&returnto=Apple+Inc.', '/w/index.php?title=Special:UserLogin&returnto=Apple+Inc.', 'https://donate.wikimedia.org/?wmf_source=donate&wmf_medium=sidebar&wmf_campaign=en.wikipedia.org&uselang=en', '/w/index.php?title=Special:CreateAccount&returnto=Apple+Inc.', '/w/index.php?title=Special:UserLogin&returnto=Apple+Inc.', '/wiki/Help:Introduction', '/wiki/Special:MyContributions', '/wiki/Special:MyTalk', '#', '#History', '#1976–19

## 8. Extract Table

In [50]:
infobox = soup.find('table', class_ = 'infobox')

if infobox:
    rows = infobox.find_all('tr')
    
    data = {}
    for row in rows:
        header = row.find('th')
        value = row.find('td')
        if header and value:
            data[header.text.strip()] = value.text.strip()
        print(data)
else:
    print("Infobox table not found.")

{}
{}
{'Formerly': 'Apple Computer Company (1976–1977)Apple Computer, Inc. (1977–2007)'}
{'Formerly': 'Apple Computer Company (1976–1977)Apple Computer, Inc. (1977–2007)', 'Company type': 'Public'}
{'Formerly': 'Apple Computer Company (1976–1977)Apple Computer, Inc. (1977–2007)', 'Company type': 'Public', 'Traded as': 'Nasdaq:\xa0AAPLNasdaq-100 componentDJIA componentS&P 100 componentS&P 500 component'}
{'Formerly': 'Apple Computer Company (1976–1977)Apple Computer, Inc. (1977–2007)', 'Company type': 'Public', 'Traded as': 'Nasdaq:\xa0AAPLNasdaq-100 componentDJIA componentS&P 100 componentS&P 500 component', 'ISIN': 'US0378331005'}
{'Formerly': 'Apple Computer Company (1976–1977)Apple Computer, Inc. (1977–2007)', 'Company type': 'Public', 'Traded as': 'Nasdaq:\xa0AAPLNasdaq-100 componentDJIA componentS&P 100 componentS&P 500 component', 'ISIN': 'US0378331005', 'Industry': 'Consumer electronicsSoftware servicesOnline services'}
{'Formerly': 'Apple Computer Company (1976–1977)Apple Compu

## 9. Convert Table into a DataFrame¶

In [34]:
table = pd.DataFrame(list(data.items()), columns = ['Key', 'Value'])
table

Unnamed: 0,Key,Value
0,Formerly,Apple Computer Company (1976–1977)Apple Comput...
1,Company type,Public
2,Traded as,Nasdaq: AAPLNasdaq-100 componentDJIA component...
3,ISIN,US0378331005
4,Industry,Consumer electronicsSoftware servicesOnline se...
5,Founded,"April 1, 1976; 49 years ago (1976-04-01), in L..."
6,Founders,Steve JobsSteve WozniakRonald Wayne
7,Headquarters,"1 Apple Park Way, Cupertino, California, U.S."
8,Number of locations,535 Apple Stores (2025)
9,Area served,Worldwide


## 10. Export the Table¶

In [36]:
table.to_excel("apple_inc_summary_table.xlsx")