In [1]:
from bs4 import BeautifulSoup

In [2]:
# Sample HTML document used as parsing input for the cells below.
# It has one <h1>, a <blockquote>, and three <div class="section"> blocks
# (ids: start, documentation, community); each block holds an
# <h3 class="section-header"> title and a <ul> of <a href=...> links.
html = """
<!DOCTYPE html>
<html lang="en">

<head>
    <meta charset="UTF-8">
    <meta http-equiv="X-UA-Compatible" content="IE=edge">
    <meta name="viewport" content="width=device-width, initial-scale=1.0">
    <title>Document</title>
</head>

<body>
    <h1>pandas</h1>
    <blockquote>pandas is a powerful Python data analysis library. </blockquote>

    <div id="start" class="section">
        <h3 class="section-header">Getting Started</h3>
        <ul class="pandas-ul">
            <a href="https://pandas.pydata.org/getting_started.html">
                <li>Install pandas</li>
            </a>
            <a href="https://pandas.pydata.org/docs/getting_started/index.html">
                <li>Getting started</li>
            </a>
        </ul>
    </div>

    <div id="documentation" class="section">
        <h3 class="section-header">Documentation</h3>
        <ul class="pandas-ul">
            <a href="https://pandas.pydata.org/docs/user_guide/index.html">
                <li>User guide</li>
            </a>
            <a href="https://pandas.pydata.org/docs/reference/index.html">
                <li>API reference</li>
            </a>
            <a href="https://pandas.pydata.org/docs/development/index.html">
                <li>How to contribute to pandas</li>
            </a>
        </ul>
    </div>

    <div id="community" class="section">
        <h3 class="section-header">The pandas Community</h3>
        <ul class="pandas-ul">
            <a href="https://pandas.pydata.org/about/index.html">
                <li>More about pandas</li>
            </a>
            <a href="https://stackoverflow.com/questions/tagged/pandas">
                <li>Have questions?</li>
            </a>
            <a href="https://pandas.pydata.org/community/ecosystem.html">
                <li>The pandas ecosystem</li>
            </a>
        </ul>
    </div>
</body>

</html>
"""

In [3]:
# Parse the sample markup with Python's built-in HTML parser
soup = BeautifulSoup(html, features='html.parser')

In [4]:
# Collect every <h3> tag in the document and display the result
section_headers = soup.find_all('h3')
section_headers

[<h3 class="section-header">Getting Started</h3>,
 <h3 class="section-header">Documentation</h3>,
 <h3 class="section-header">The pandas Community</h3>]

In [5]:
# Print the text of every <h3> heading, one per line.
# The loop variable gets a real name: `_` is IPython's "last output"
# variable and by convention marks a value that is never read.
for header in soup.find_all('h3'):
    print(header.text)

Getting Started
Documentation
The pandas Community


In [6]:
# Look up the element whose id attribute is "start" and display it
start_section = soup.find(id='start')
start_section

<div class="section" id="start">
<h3 class="section-header">Getting Started</h3>
<ul class="pandas-ul">
<a href="https://pandas.pydata.org/getting_started.html">
<li>Install pandas</li>
</a>
<a href="https://pandas.pydata.org/docs/getting_started/index.html">
<li>Getting started</li>
</a>
</ul>
</div>

In [7]:
# Text of the first <h3> inside the element with id="start"
start_section = soup.find(id='start')
start_section.find('h3').text

'Getting Started'

In [8]:
# Every <a> tag nested inside the element with id="start"
start_section = soup.find(id='start')
start_section.find_all('a')

[<a href="https://pandas.pydata.org/getting_started.html">
 <li>Install pandas</li>
 </a>,
 <a href="https://pandas.pydata.org/docs/getting_started/index.html">
 <li>Getting started</li>
 </a>]

In [9]:
# Print the URL of every link inside the element with id="start".
# href=True limits the match to anchors that carry an href attribute, so the
# link['href'] lookup cannot raise KeyError. The loop variable is named
# instead of `_`, which IPython uses for the last cell output.
for link in soup.find(id='start').find_all('a', href=True):
    print(link['href'])


https://pandas.pydata.org/getting_started.html
https://pandas.pydata.org/docs/getting_started/index.html


In [10]:
# Print the URL of every link in the whole document.
# href=True limits the match to anchors that carry an href attribute, so the
# link['href'] lookup cannot raise KeyError. The loop variable is named
# instead of `_`, which IPython uses for the last cell output.
for link in soup.find_all('a', href=True):
    print(link['href'])

https://pandas.pydata.org/getting_started.html
https://pandas.pydata.org/docs/getting_started/index.html
https://pandas.pydata.org/docs/user_guide/index.html
https://pandas.pydata.org/docs/reference/index.html
https://pandas.pydata.org/docs/development/index.html
https://pandas.pydata.org/about/index.html
https://stackoverflow.com/questions/tagged/pandas
https://pandas.pydata.org/community/ecosystem.html


In [11]:
# BONUS: Compile a dictionary mapping each section title to its list of URLs
rows = soup.find_all('div', class_='section')

# One entry per <div class="section">: key is the <h3 class="section-header">
# text, value is the list of link URLs found inside that div.
# href=True limits the match to anchors that carry an href attribute, so the
# a['href'] lookup cannot raise KeyError.
pandas_info_dict = {
    section.find('h3', class_='section-header').text: [
        a['href'] for a in section.find_all('a', href=True)
    ]
    for section in rows
}

# Print each title followed by its links, one per line
for title, links in pandas_info_dict.items():
    print(title)
    for link in links:
        print(link)

Getting Started
https://pandas.pydata.org/getting_started.html
https://pandas.pydata.org/docs/getting_started/index.html
Documentation
https://pandas.pydata.org/docs/user_guide/index.html
https://pandas.pydata.org/docs/reference/index.html
https://pandas.pydata.org/docs/development/index.html
The pandas Community
https://pandas.pydata.org/about/index.html
https://stackoverflow.com/questions/tagged/pandas
https://pandas.pydata.org/community/ecosystem.html
