In [33]:
import pandas as pd
import requests
from pathlib import Path

## Load csv with all the information about the arts

In [6]:
artworks_csv = pd.read_csv("Artworks.csv")
artworks_csv.columns

Index(['Title', 'Artist', 'ConstituentID', 'ArtistBio', 'Nationality',
       'BeginDate', 'EndDate', 'Gender', 'Date', 'Medium', 'Dimensions',
       'CreditLine', 'AccessionNumber', 'Classification', 'Department',
       'DateAcquired', 'Cataloged', 'ObjectID', 'URL', 'ThumbnailURL',
       'Circumference (cm)', 'Depth (cm)', 'Diameter (cm)', 'Height (cm)',
       'Length (cm)', 'Weight (kg)', 'Width (cm)', 'Seat Height (cm)',
       'Duration (sec.)'],
      dtype='object')

## Display the art categories and picking the right ones

In [8]:
artworks_csv.Classification.unique()

array(['Architecture', 'Mies van der Rohe Archive', 'Design',
       'Illustrated Book', 'Print', 'Drawing', 'Periodical', 'Film',
       'Multiple', 'Installation', 'Film (object)', 'Photograph',
       'Painting', 'Ephemera', 'Photography Research/Reference', 'Video',
       'Media', 'Performance', 'Sculpture', 'Work on Paper', 'Poster',
       'Audio', '(not assigned)', 'Textile', 'Digital', 'Collage',
       'Graphic Design', 'Frank Lloyd Wright Archive',
       'Furniture and Interiors', 'Software', 'Architectural Model',
       'Publication'], dtype=object)

In [9]:
wanted_classification = ['Drawing', 'Painting', 'Poster']

In [12]:
artworks_filtered = artworks_csv.loc[artworks_csv.Classification.isin(wanted_classification)]
artworks_filtered.Classification.unique()

array(['Drawing', 'Painting', 'Poster'], dtype=object)

In [42]:
artworks_filtered = artworks_filtered[artworks_filtered.URL.notnull()]

## Downloading the images

In [43]:
artworks_filtered.head()

Unnamed: 0,Title,Artist,ConstituentID,ArtistBio,Nationality,BeginDate,EndDate,Gender,Date,Medium,...,ThumbnailURL,Circumference (cm),Depth (cm),Diameter (cm),Height (cm),Length (cm),Weight (kg),Width (cm),Seat Height (cm),Duration (sec.)
7957,"""Society of Monkeys"" diploma",Aleksei Remizov,14185,"(Russian, 1877–1957)",(),(1877),(1957),(Male),1922,"Watercolor, ink, cut-and-pasted colored and me...",...,http://www.moma.org/media/W1siZiIsIjI0OTM4NiJd...,,,,23.9,,,31.8,,
8007,Untitled,Kirill Zdanevich,11875,"(Russian, 1892–1969)",(Russian),(1892),(1969),(Male),1919,Pen and ink,...,http://www.moma.org/media/W1siZiIsIjY3ODg4Il0s...,,,,28.4,,,26.6,,
8009,Valia Zdanevich,Aleksei Kruchenykh,3263,"(Russian, 1886–1969)",(Russian),(1886),(1969),(Male),1923,"Collage with photograph, pencil and watercolor...",...,http://www.moma.org/media/W1siZiIsIjY3OTM4Il0s...,,,,33.5,,,21.5,,
8057,Untitled (Futurist Landscape),Olga Rozanova,5066,"(Russian, 1886–1918)",(Russian),(1886),(1918),(Female),1913,Pen and ink on paper,...,http://www.moma.org/media/W1siZiIsIjY4Nzc2Il0s...,,,,24.3,,,17.7,,
13051,Study for cover of Novyi LEF (New LEF),Aleksandr Rodchenko,4975,"(Russian, 1891–1956)",(Russian),(1891),(1956),(Male),1926,Pencil and colored pencil on graph paper,...,http://www.moma.org/media/W1siZiIsIjY4MTcxIl0s...,,,,26.9,,,8.0,,


In [44]:
def save_image_from_response(dest_dir, filename, response):
    
    path = Path.cwd() / dest_dir / filename
    
    print(path)
    
    if response.status_code == 200:
        with open(path, 'wb') as f:
            f.write(response.content)
    

In [50]:
downloaded_art_dir = "MoMA"
test = 0

for index, row in artworks_filtered.iterrows():
    
    art_title = row.Title
    response = requests.get(row.URL)
    print(row.ThumbnailURL)
    save_image_from_response(downloaded_art_dir, art_title, response)
    
    test = test + 1
    if test > 15:
        break

    

http://www.moma.org/media/W1siZiIsIjI0OTM4NiJdLFsicCIsImNvbnZlcnQiLCItcmVzaXplIDMwMHgzMDBcdTAwM2UiXV0.jpg?sha=7de0197cf5541691
/home/michal/FIT/StolenArtRecognition/MoMA/"Society of Monkeys" diploma
http://www.moma.org/media/W1siZiIsIjY3ODg4Il0sWyJwIiwiY29udmVydCIsIi1yZXNpemUgMzAweDMwMFx1MDAzZSJdXQ.jpg?sha=649e845c41e0cff5
/home/michal/FIT/StolenArtRecognition/MoMA/Untitled
http://www.moma.org/media/W1siZiIsIjY3OTM4Il0sWyJwIiwiY29udmVydCIsIi1yZXNpemUgMzAweDMwMFx1MDAzZSJdXQ.jpg?sha=8be92eecdd1572ab
/home/michal/FIT/StolenArtRecognition/MoMA/Valia Zdanevich
http://www.moma.org/media/W1siZiIsIjY4Nzc2Il0sWyJwIiwiY29udmVydCIsIi1yZXNpemUgMzAweDMwMFx1MDAzZSJdXQ.jpg?sha=8b4ef48fea7c11bd
/home/michal/FIT/StolenArtRecognition/MoMA/Untitled (Futurist Landscape)
http://www.moma.org/media/W1siZiIsIjY4MTcxIl0sWyJwIiwiY29udmVydCIsIi1yZXNpemUgMzAweDMwMFx1MDAzZSJdXQ.jpg?sha=37a96ae21082966a
/home/michal/FIT/StolenArtRecognition/MoMA/Study for cover of Novyi LEF (New LEF)
http://www.moma.org/media/W1siZ