# Download Quick, Draw! data

Download the classes from the quick, draw! dataset needed to test the lottery ticket hypothesis

In [14]:
import os
import requests
from tqdm import tqdm

In [15]:
# Configuration
path = "./data/quickdraw"
link = "https://storage.googleapis.com/quickdraw_dataset/full/numpy_bitmap/"

# Les 50 catégories (5 clusters x 10 classes)
categories = [
    # Animaux
    'cat', 'dog', 'fish', 'bird', 'bear', 'rabbit', 'elephant', 'lion', 'tiger', 'horse',
    # Véhicules
    'car', 'bus', 'truck', 'bicycle', 'motorbike', 'airplane', 'helicopter', 'sailboat', 'train', 'ambulance',
    # Nourriture
    'apple', 'banana', 'pizza', 'cake', 'ice cream', 'cookie', 'bread', 'hot dog', 'hamburger', 'grapes',
    # Objets du quotidien
    'chair', 'table', 'clock', 'book', 'cup', 'scissors', 'key', 'hammer', 'candle', 'broom',
    # Nature
    'tree', 'flower', 'cloud', 'sun', 'moon', 'star', 'mountain', 'ocean', 'rain', 'lightning',
    # Shape
    'circle', 'square', 'triangle', 'star', 'line', 'hexagon', 'octagon', 'diamond', 'zigzag', 'cloud'
]

os.makedirs(path, exist_ok=True)

In [16]:
def download_all():
    for cat in tqdm(categories, desc="Progression"):
        filepath = os.path.join(path, f"{cat}.npy")
        
        # Skip si déjà présent
        if os.path.exists(filepath):
            continue
        
        # Télécharger
        url = f"{link}{cat.replace(' ', '%20')}.npy"
        try:
            response = requests.get(url)
            response.raise_for_status()
            with open(filepath, 'wb') as f:
                f.write(response.content)
        except Exception as e:
            print(f"Erreur {cat}: {e}")
    
    # Vérification
    downloaded = [f.replace('.npy', '') for f in os.listdir(path) if f.endswith('.npy')]
    missing = set(categories) - set(downloaded)
    
    if missing:
        print(f"Manquant: {missing}")
    else:
        print(f"Terminé ! {len(categories)} catégories disponibles")

In [17]:
download_all()

Progression: 100%|██████████| 60/60 [00:00<00:00, 15587.38it/s]

Terminé ! 60 catégories disponibles



