# 📥 SUN RGB-D Dataset Downloader
This notebook downloads the SUN RGB-D dataset and extracts it to the `data/` folder.

> ⚠️ Note: The dataset is large (~16GB). Make sure you have a stable internet connection and enough free disk space for both the downloaded archive and its extracted contents.

In [None]:
# ✅ Ensure the data directory exists before anything is downloaded
import os

# Every later cell builds its paths relative to this folder.
DATA_DIR = "data"

# exist_ok=True keeps this cell safe to re-run: an existing folder is left untouched.
os.makedirs(DATA_DIR, exist_ok=True)

print(f"Data directory is ready: {DATA_DIR}")

In [None]:
# 📦 Download dataset using requests (or wget if preferred)
import requests
from tqdm import tqdm
import zipfile

def download_file(url, dest_path, chunk_size=1024 * 1024, timeout=30):
    """Stream ``url`` to ``dest_path`` while showing a tqdm progress bar.

    The payload is first written to ``dest_path`` + ".part" and only renamed
    to ``dest_path`` once the whole body has been received. An interrupted or
    failed download therefore never leaves a truncated file at ``dest_path``
    that a later "does the file exist?" check would mistake for a complete one.

    Args:
        url: HTTP(S) address of the file to fetch.
        dest_path: Final location of the downloaded file.
        chunk_size: Number of bytes requested per read from the response
            stream. Defaults to 1 MiB.
        timeout: Seconds to wait for the connection and for each read before
            giving up.

    Raises:
        requests.HTTPError: If the server answers with a 4xx/5xx status.
        requests.RequestException: On connection problems or timeouts.
        OSError: If the file cannot be written or renamed.
    """
    part_path = f"{dest_path}.part"
    try:
        # The context manager releases the connection even if writing fails.
        with requests.get(url, stream=True, timeout=timeout) as response:
            # Fail loudly instead of saving an HTML error page as the archive.
            response.raise_for_status()
            # A missing Content-Length becomes None so tqdm shows an open-ended counter.
            total = int(response.headers.get('content-length', 0)) or None
            with open(part_path, 'wb') as file, tqdm(
                desc=dest_path,
                total=total,
                unit='B',
                unit_scale=True,
                unit_divisor=1024,
            ) as bar:
                for data in response.iter_content(chunk_size=chunk_size):
                    bar.update(file.write(data))
        # Publish the finished file in one step.
        os.replace(part_path, dest_path)
    except BaseException:
        # BaseException so a notebook "interrupt kernel" (KeyboardInterrupt)
        # also cleans up the partial file; the error is always re-raised.
        try:
            os.remove(part_path)
        except OSError:
            pass
        raise

# SUN RGB-D archive: fetched once, then reused on later runs of this cell
url = "http://rgbd.cs.princeton.edu/data/SUNRGBD.zip"
output_path = os.path.join(DATA_DIR, "SUNRGBD.zip")

# Skip the transfer when the archive is already on disk.
if os.path.exists(output_path):
    print("Dataset already downloaded.")
else:
    download_file(url, output_path)

In [None]:
# 📂 Unzip the dataset (this may take a while)
import shutil

zip_path = os.path.join(DATA_DIR, "SUNRGBD.zip")
extract_path = os.path.join(DATA_DIR, "SUNRGBD")
# Extraction goes into a scratch folder that is renamed to extract_path only
# after every member has been written. Otherwise an interrupted run would
# leave a half-filled extract_path that the check below reports as
# "already extracted".
partial_path = extract_path + ".partial"

if not os.path.exists(extract_path):
    # Remove leftovers from a previously interrupted extraction, if any.
    shutil.rmtree(partial_path, ignore_errors=True)
    with zipfile.ZipFile(zip_path, 'r') as zip_ref:
        zip_ref.extractall(partial_path)
    # Publish the finished folder in one step.
    os.rename(partial_path, extract_path)
    print(f"Extracted to: {extract_path}")
else:
    print("Dataset already extracted.")