In [49]:
import requests # Imports the requests library, which allows you to send HTTP requests.
from bs4 import BeautifulSoup # It is used for parsing HTML and XML documents.

In [51]:
# Fetch the Wikipedia page
url = "https://en.wikipedia.org/wiki/Los_Angeles_Lakers"
response = requests.get(url) #it sends a GET request to the specified URL and stores the response.

In [53]:
soup = BeautifulSoup(response.text, 'html.parser')
print (soup)

<!DOCTYPE html>

<html class="client-nojs vector-feature-language-in-header-enabled vector-feature-language-in-main-page-header-disabled vector-feature-page-tools-pinned-disabled vector-feature-toc-pinned-clientpref-1 vector-feature-main-menu-pinned-disabled vector-feature-limited-width-clientpref-1 vector-feature-limited-width-content-enabled vector-feature-custom-font-size-clientpref-1 vector-feature-appearance-pinned-clientpref-1 vector-feature-night-mode-enabled skin-theme-clientpref-day vector-sticky-header-enabled vector-toc-available" dir="ltr" lang="en">
<head>
<meta charset="utf-8"/>
<title>Los Angeles Lakers - Wikipedia</title>
<script>(function(){var className="client-js vector-feature-language-in-header-enabled vector-feature-language-in-main-page-header-disabled vector-feature-page-tools-pinned-disabled vector-feature-toc-pinned-clientpref-1 vector-feature-main-menu-pinned-disabled vector-feature-limited-width-clientpref-1 vector-feature-limited-width-content-enabled vecto

In [55]:
# Parse the HTML content using BeautifulSoup
soup = BeautifulSoup(response.content, "html.parser")

In [67]:
# Extract the page title
title = soup.find('h1').text
print("Title:", title)

Title: Los Angeles Lakers


In [69]:
intro_paragraph = ""
for p in soup.select('p'):
    if p.text.strip():
        intro_paragraph = p.text.strip()
        break

print("Introductory Paragraph:\n", intro_paragraph)

Introductory Paragraph:
 The Los Angeles Lakers are an American professional basketball team based in Los Angeles. The Lakers compete in the National Basketball Association (NBA) as a member of the Pacific Division of the Western Conference. The Lakers play their home games at Crypto.com Arena, an arena they share with the Los Angeles Sparks of the Women's National Basketball Association (WNBA) and the Los Angeles Kings of the National Hockey League (NHL).[10] The Lakers are one of the most successful teams in the history of the NBA with 17 championships, the second most in the league behind the Boston Celtics.[11]


In [79]:
# Find the section containing the History content
history_section = soup.find("span", {"id": "History"})

# If the History section exists, get its content
if history_section:
    
    # Get the parent section (usually an <h2> tag)
    history_heading = history_section.find_parent("h2")
    
    # Initialize a list to store content paragraphs
    history_content = []
    
    # Get all sibling elements until the next <h2> tag and extract text
    next_sibling = history_heading.find_next_sibling()
    while next_sibling and next_sibling.name != "h2":
        if next_sibling.name == "p":
            history_content.append(next_sibling.get_text())
        next_sibling = next_sibling.find_next_sibling()
    
    print("History Content:")
    for paragraph in history_content:
        print(paragraph.strip())  # Strip to remove leading and trailing whitespaces
else:
    print("History section not found.")

History section not found.


In [81]:
# Extract the key sections of the page
sections = soup.find_all("h2")
for section in sections:
    section_title = section.text
    section_content_tag = section.find_next("p")
    if section_content_tag:
        section_content = section_content_tag.text
        print("Section Title:", section_title)
        print("Section Content:", section_content)
        print()

Section Title: Contents
Section Content: 


Section Title: History
Section Content: The franchise was founded in 1946 as the Detroit Gems and played in the National Basketball League (NBL) during the 1946–47 season where it finished last in the league with only 4 wins in 44 games. Though the team was scheduled to continue in the NBL the following season,[23] its ownership, faced with high losses due to low attendance and lack of homecourt, decided on selling the team to Ben Berger and Morris Chalfen of Minnesota for $15,000.[13][24]


Section Title: Rivalries
Section Content: The rivalry between the Boston Celtics and the Lakers involves the two most storied basketball franchises in National Basketball Association (NBA) history. It has been called the best rivalry in the NBA.[309] The two teams have met a record 12 times in the NBA Finals, starting with their first Finals meeting in 1959. They would go on to dominate the league in the 1960s and the 1980s, facing each other six times in

In [83]:
# Extract the external links
external_links = soup.find_all("a", {"class": "external text"})
print("External Links:")
for link in external_links:
    print(link.get("href"))

External Links:
https://www.nba.com/lakers
http://www.nba.com/lakers/roster/
https://www.nba.com/lakers/history/season-by-season-records
https://www.nba.com/stats/history
https://www.nba.com/stats/team/1610612747/seasons
https://web.archive.org/web/20221202035957/https://www.nba.com/stats/team/1610612747/seasons
https://lalweb.blob.core.windows.net/public/lakers/media-relations/2022-23-Lakers-Media-Guide.pdf#page=344
https://lalweb.blob.core.windows.net/public/lakers/media-relations/2022-23-Lakers-Media-Guide.pdf
https://web.archive.org/web/20221108010013/https://lalweb.blob.core.windows.net/public/lakers/media-relations/2022-23-Lakers-Media-Guide.pdf
https://www.nba.com/lakers/team/uniform-schedule/
https://web.archive.org/web/20221109160248/https://www.nba.com/lakers/team/uniform-schedule
https://cdn-assets-us.frontify.com/s3/frontify-enterprise-files-us/eyJwYXRoIjoibmJhXC9maWxlXC80TTJDeVBtaUwycjFLclJSQUNXRi5wZGYifQ:nba:0rvM6XAd_inP1medUf1_yAS9UGc7q32d5SvRE6QNinw
https://www.nba.com/