In [2]:
from pathlib import Path, PurePosixPath
from urllib.parse import urlparse

import requests

def download_file(url: str, filename: str, timeout: float = 30.0) -> None:
    """
    Download a file from a specific URL and save it under ``../data``.

    The response body is streamed to disk in chunks instead of being held in
    memory. It is first written to a temporary ``<filename>.part`` file that
    is renamed onto the final path only after the transfer has completed, so
    an interrupted download never leaves a truncated file at the destination.

    Args:
        url: Address of the file to fetch.
        filename: Name (or relative path) of the file inside ``../data``,
            which is resolved against the current working directory. Missing
            parent directories are created.
        timeout: Seconds to wait for the server before giving up. Without a
            timeout ``requests`` may block indefinitely on a stalled server.

    Raises:
        requests.HTTPError: If the server answers with a 4xx/5xx status.
        requests.RequestException: On connection errors or timeouts.
        OSError: If the file cannot be written.
    """
    destination = Path("../data") / filename
    destination.parent.mkdir(parents=True, exist_ok=True)
    partial = destination.with_name(destination.name + ".part")

    with requests.get(url, stream=True, timeout=timeout) as response:
        response.raise_for_status()
        try:
            with open(partial, "wb") as f:
                for chunk in response.iter_content(chunk_size=64 * 1024):
                    f.write(chunk)
        except BaseException:
            # Do not leave a half-written temporary file behind.
            if partial.exists():
                partial.unlink()
            raise

    # Publish the file only once every byte has been written.
    partial.replace(destination)
    print(f"file download successfully to {destination}")

In [3]:
# The Almanack of Naval Ravikant (Eric Jorgenson), served from the book's S3 bucket.
navalmanack_url = "https://navalmanack.s3.amazonaws.com/Eric-Jorgenson_The-Almanack-of-Naval-Ravikant_Final.pdf"
download_file(
    url=navalmanack_url,
    filename="almanack_of_naval_ravikant.pdf",
)


file download successfully to ../data/almanack_of_naval_ravikant.pdf


In [8]:
# The Anthology of Balaji
balaji_url = "https://balajianthology.s3.us-east-2.amazonaws.com/The+Anthology+of+Balaji.pdf"
download_file(balaji_url, "anthology_of_balaji.pdf")

# Tao of Seneca, volumes 1-3: each file keeps the name it has in its URL.
letters_urls = [
    "https://tim.blog/wp-content/uploads/2017/07/taoofseneca_vol1-1.pdf",
    "https://tim.blog/wp-content/uploads/2017/07/taoofseneca_vol2.pdf",
    "https://tim.blog/wp-content/uploads/2017/07/taoofseneca_vol3.pdf",
]

for url in letters_urls:
    # Use only the URL's path component, so a query string or fragment can
    # never leak into the saved file name.
    filename = PurePosixPath(urlparse(url).path).name
    download_file(url, filename)

# Hackers & Painters (Paul Graham)
hackers_url ="https://digtvbg.com/files/books-for-hacking/Hackers%20%26%20Painters%20-%20Big%20Ideas%20From%20The%20Computer%20Age%20by%20Paul%20Graham.pdf"
download_file(hackers_url, "hackers_and_painters.pdf")



file download successfully to ../data/anthology_of_balaji.pdf
file download successfully to ../data/taoofseneca_vol1-1.pdf
file download successfully to ../data/taoofseneca_vol2.pdf
file download successfully to ../data/taoofseneca_vol3.pdf
file download successfully to ../data/hackers_and_painters.pdf


In [9]:
# Striking Thoughts (Bruce Lee). This mirror answered "404 Not Found" on the
# last recorded run, so a failed request is reported instead of stopping the
# notebook.
striking_thoughts = "https://eddierockerz.com/wp-content/uploads/2020/11/striking-thoughts_-bruce-lees-wisdom-for-daily-living-pdfdrive.com-.pdf"
try:
    download_file(striking_thoughts, filename="striking-thoughts.pdf")
except requests.RequestException as e:
    # Only network/HTTP failures are expected here; anything else (for
    # example a disk error) should still surface with a full traceback.
    print(f"download striking-thoughts fail: {e}")

download striking-thoughts fail: 404 Client Error: Not Found for url: https://eddierockerz.com/wp-content/uploads/2020/11/striking-thoughts_-bruce-lees-wisdom-for-daily-living-pdfdrive.com-.pdf


In [10]:
# Skin in the Game (Nassim Nicholas Taleb)
skin_in_game_url = "https://philosophiatopics.wordpress.com/wp-content/uploads/2018/10/skin-in-the-game-nassim-nicholas-taleb.pdf"
download_file(
    url=skin_in_game_url,
    filename="skin_in_the_game.pdf",
)



file download successfully to ../data/skin_in_the_game.pdf
