# Install required packages

In [0]:
%pip install kaggle
%pip install python-dotenv

In [0]:
%restart_python

In [0]:
import os
from dotenv import load_dotenv

In [0]:
# Load configuration from the ".env" file in the working directory.
# override=True lets values from the file replace variables that are
# already present in the process environment.
load_dotenv(dotenv_path=".env", override=True)

# Catalog/schema/volume names and Kaggle credentials used by later cells.
catalog_name = os.getenv("CATALOG")
schema_name = os.getenv("SCHEMA")
volume_name = os.getenv("VOLUME")
kaggle_username = os.getenv("KAGGLE_USERNAME")
kaggle_key = os.getenv("KAGGLE_KEY")

# Fail fast when a setting is absent or empty: os.getenv returns None for an
# unset variable, which would otherwise be interpolated as the text "None"
# into the SQL statements and volume path built later, and assigning None
# into os.environ raises an opaque TypeError.
required_settings = {
    "CATALOG": catalog_name,
    "SCHEMA": schema_name,
    "VOLUME": volume_name,
    "KAGGLE_USERNAME": kaggle_username,
    "KAGGLE_KEY": kaggle_key,
}
missing_settings = [key for key, value in required_settings.items() if not value]
if missing_settings:
    raise ValueError(
        "Missing required settings (define them in .env or the environment): "
        + ", ".join(missing_settings)
    )

# Only the non-secret settings are echoed; credentials are not printed.
print(f"Catalog: {catalog_name}, Schema: {schema_name}, Volume: {volume_name}")

# Set Kaggle credentials in environment

In [0]:
    # Export both Kaggle credentials to the process environment in one call;
    # keys are written in the order listed.
    os.environ.update(
        {
            "KAGGLE_USERNAME": kaggle_username,
            "KAGGLE_KEY": kaggle_key,
        }
    )


# Databricks SQL commands to create catalog, schema, and volume

In [0]:

# Build the qualified names once so each statement below reuses them.
schema_fqn = f"{catalog_name}.{schema_name}"
volume_fqn = f"{schema_fqn}.{volume_name}"

# Run the DDL from the outermost object inwards. Every statement uses
# IF NOT EXISTS, so re-running the cell does not fail on existing objects.
for ddl in (
    f"CREATE CATALOG IF NOT EXISTS {catalog_name}",
    f"CREATE SCHEMA IF NOT EXISTS {schema_fqn}",
    f"CREATE VOLUME IF NOT EXISTS {volume_fqn}",
):
    spark.sql(ddl)

print("Catalog, schema, and volume created successfully ✅")




In [0]:

import pathlib

# Directory inside the volume that the dataset download is written to.
volume_path = f"/Volumes/{catalog_name}/{schema_name}/{volume_name}/global_fashion"

# parents=True creates any missing intermediate directories; exist_ok=True
# keeps the cell re-runnable when the directory is already there.
dataset_dir = pathlib.Path(volume_path)
dataset_dir.mkdir(parents=True, exist_ok=True)

print(f"Local volume path created at: {volume_path}")

# Download Kaggle dataset

In [0]:
# NOTE(review): this import is kept here, after the cell that exports the
# Kaggle credentials — some kaggle releases may authenticate at import time;
# confirm before moving it into the top-level import cell.
from kaggle.api.kaggle_api_extended import KaggleApi

# Create the API client and authenticate it. Presumably this picks up the
# KAGGLE_USERNAME / KAGGLE_KEY environment variables set earlier — verify
# against the kaggle package documentation.
api = KaggleApi()
api.authenticate()

# Dataset identifier from Kaggle

In [0]:
# Identifier of the Kaggle dataset to download.
dataset = "ricgomes/global-fashion-retail-stores-dataset"

# Download into the volume directory; unzip=True asks the client to extract
# the downloaded archive.
api.dataset_download_files(dataset, path=volume_path, unzip=True)

print(f"Kaggle dataset downloaded successfully to {volume_path} ✅")