In [None]:
import os
import logging
from logging import getLogger

from pathlib import Path
from hydra import initialize, compose
from hydra.core.hydra_config import HydraConfig

from kaggle import KaggleApi
from src.utils.kaggle_utils import download_kaggle_competition_dataset

In [None]:
# Experiment number for this run: export EXPERIMENT in the environment before
# starting the kernel; "000" is used when the variable is not defined.
EXPERIMENT = os.environ.get("EXPERIMENT", "000")

In [None]:
# Fail fast on an unusable experiment id. A falsy check covers both None and
# the empty string (e.g. `EXPERIMENT=` exported with no value), which would
# otherwise produce an `experiment=` override with nothing after the equals sign.
if not EXPERIMENT:
    raise ValueError("EXPERIMENT is not set")

# Compose the Hydra config in-process (no @hydra.main entry point in a notebook).
# config_path is resolved by Hydra relative to this notebook's location.
with initialize(version_base=None, config_path="../../configs"):
    CFG = compose(
        config_name="config.yaml",
        return_hydra_config=True,
        overrides=[f"experiment={EXPERIMENT}"],
    )
    # Register the composed config with HydraConfig so code that reads
    # HydraConfig.get() (hydra job info) also works from the notebook.
    HydraConfig.instance().set_config(CFG)

# Make sure the root logger has a handler: without one, Python's last-resort
# handler only emits WARNING and above, so the INFO message below would be lost.
# basicConfig() does nothing when the root logger already has handlers.
logging.basicConfig(level=logging.DEBUG)
LOGGER = logging.getLogger()
LOGGER.setLevel(logging.DEBUG)

# Kaggle API client; authenticate() is called once here so later cells can
# reuse KAGGLE_CLIENT directly.
KAGGLE_CLIENT = KaggleApi()
KAGGLE_CLIENT.authenticate()

LOGGER.info("start experiment=%s 🚀", EXPERIMENT)

### load data


In [None]:
# Invoke the project's download helper with the Kaggle client created earlier,
# the competition taken from CFG.meta.competition, and CFG.paths.input_dir
# (wrapped in a Path) as the output directory.
download_kaggle_competition_dataset(
    out_dir=Path(CFG.paths.input_dir),
    competition=CFG.meta.competition,
    client=KAGGLE_CLIENT,
)