<a href="https://colab.research.google.com/github/carloslme/automating-boring-stuff/blob/main/Chapter_15_Project_Multithreaded_XKCD_Downloader.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

# Step 1: Modify the Program to Use a Function

In [4]:
#! python3
# multidownloadXkcd.py - Downloads XKCD comics using multiple threads.

import requests, os, bs4, threading
os.makedirs('xkcd', exist_ok=True) # store comics in ./xkcd
errors = []

def downloadXkcd(startComic, endComic):
    for urlNumber in range(startComic, endComic):
        try:
          # Download the page.
          print('Downloading page http://xkcd.com/%s...' % (urlNumber))
          res = requests.get('http://xkcd.com/%s' % (urlNumber))
          res.raise_for_status()

          soup = bs4.BeautifulSoup(res.text)

          # Find the URL of the comic image.
          comicElem = soup.select('#comic img')
          if comicElem == []:
              print('Could not find comic image.')
          else:
              comicUrl = comicElem[0].get('src')
              # Download the image.
              print('Downloading image %s...' % (comicUrl))
              res = requests.get(comicUrl)
              res.raise_for_status()

              # Save the image to ./xkcd
              imageFile = open(os.path.join('xkcd', os.path.basename(comicUrl)), 'wb')
              for chunk in res.iter_content(100000):
                  imageFile.write(chunk)
              imageFile.close()
        except Exception as e:
          errors.append(str(e))
          pass

# Create and start the Thread objects.
downloadThreads = [] # a list of all the Thread objects
for i in range(0, 1400, 100): # loops 14 times, creates 14 threads
    downloadThread = threading.Thread(target=downloadXkcd, args=(i, i + 99))
    downloadThreads.append(downloadThread)
    downloadThread.start()

# Wait for all threads to end.
for downloadThread in downloadThreads:
    downloadThread.join()
print(errors)
print('Done.')


Downloading page http://xkcd.com/0...
Downloading page http://xkcd.com/100...
Downloading page http://xkcd.com/200...
Downloading page http://xkcd.com/300...
Downloading page http://xkcd.com/400...
Downloading page http://xkcd.com/500...
Downloading page http://xkcd.com/600...
Downloading page http://xkcd.com/700...
Downloading page http://xkcd.com/800...
Downloading page http://xkcd.com/900...
Downloading page http://xkcd.com/1000...
Downloading page http://xkcd.com/1100...
Downloading page http://xkcd.com/1200...
Downloading page http://xkcd.com/1300...
Downloading page http://xkcd.com/1...
Downloading image //imgs.xkcd.com/comics/family_circus.jpg...
Downloading page http://xkcd.com/101...
Downloading image //imgs.xkcd.com/comics/complexion.png...
Downloading page http://xkcd.com/701...
Downloading image //imgs.xkcd.com/comics/religions.png...
Downloading page http://xkcd.com/901...
Downloading image //imgs.xkcd.com/comics/android_boyfriend.png...
Downloading page http://xkcd.com/60