# Set-up and Workflow

### Importing the packages

In [1]:
# Load the packages
import requests
from bs4 import BeautifulSoup

### Making a GET request

In [2]:
# URL of the page to scrape
base_site = "https://en.wikipedia.org/wiki/Music"

# Make the GET request. requests never times out by default, so pass an
# explicit timeout (in seconds) to keep this cell from hanging forever
# if the server stalls.
response = requests.get(base_site, timeout=10)

# Show the HTTP status code of the reply (200 means the request succeeded)
response.status_code

200

In [3]:
# Pull the raw body of the reply out of the response object (a bytes object)
html = response.content

# Sanity check: peek at the first 100 bytes to confirm the reply really is HTML
html[0:100]

b'<!DOCTYPE html>\n<html class="client-nojs" lang="en" dir="ltr">\n<head>\n<meta charset="UTF-8"/>\n<title'

### Making the soup

In [4]:
# Wrap the raw HTML in a BeautifulSoup object so its content can be
# searched and extracted more easily.
# "html.parser" is the parser bundled with Python, so no extra install is needed.
soup = BeautifulSoup(markup=html, features="html.parser")

### Extracting text from the footer

In [10]:
# find_all() returns every matching element (not just the first one);
# here we collect all <footer> tags on the page
texts = soup.find_all(name="footer")
texts

[<footer class="mw-footer" id="footer" role="contentinfo">
 <ul id="footer-info">
 <li id="footer-info-lastmod"> This page was last edited on 30 July 2022, at 06:59<span class="anonymous-show"> (UTC)</span>.</li>
 <li id="footer-info-copyright">Text is available under the <a href="//en.wikipedia.org/wiki/Wikipedia:Text_of_Creative_Commons_Attribution-ShareAlike_3.0_Unported_License" rel="license">Creative Commons Attribution-ShareAlike License 3.0</a><a href="//creativecommons.org/licenses/by-sa/3.0/" rel="license" style="display:none;"></a>;
 additional terms may apply.  By using this site, you agree to the <a href="//foundation.wikimedia.org/wiki/Terms_of_Use">Terms of Use</a> and <a href="//foundation.wikimedia.org/wiki/Privacy_policy">Privacy Policy</a>. Wikipedia® is a registered trademark of the <a href="//www.wikimediafoundation.org/">Wikimedia Foundation, Inc.</a>, a non-profit organization.</li>
 </ul>
 <ul id="footer-places">
 <li id="footer-places-privacy"><a class="extiw" h

In [13]:
# Print every whitespace-stripped text fragment found inside the footer elements.
# repr() keeps the quotes and escape sequences (e.g. '\n') visible in the output.
for fragment in (piece for footer in texts for piece in footer.stripped_strings):
    print(repr(fragment))

'This page was last edited on 30 July 2022, at 06:59'
'(UTC)'
'.'
'Text is available under the'
'Creative Commons Attribution-ShareAlike License 3.0'
';\nadditional terms may apply.  By using this site, you agree to the'
'Terms of Use'
'and'
'Privacy Policy'
'. Wikipedia® is a registered trademark of the'
'Wikimedia Foundation, Inc.'
', a non-profit organization.'
'Privacy policy'
'About Wikipedia'
'Disclaimers'
'Contact Wikipedia'
'Mobile view'
'Developers'
'Statistics'
'Cookie statement'
