In [0]:
# 99_bootstrap_raw_claims.ipynb
# Perform one-time setup for Claims data.
# Creates the raw input folder and copies in the initial test file.

# Prerequisite: manually upload the test file `claims_part_1.avro` to DBFS
# (under dbfs:/FileStore/tables/) before running this notebook.

# DBFS locations: the directory the manually uploaded file is expected in,
# and the raw claims folder this bootstrap populates.
UPLOADS_DIR = "dbfs:/FileStore/tables/"
RAW_CLAIMS_DIR = "dbfs:/kardia/raw/claims/"
INITIAL_TEST_FILE = "claims_part_1.avro"

src = UPLOADS_DIR + INITIAL_TEST_FILE
dst = RAW_CLAIMS_DIR + INITIAL_TEST_FILE


def _list_names(path):
    """Return the names of the entries directly under `path`.

    A directory that does not exist yet is reported as empty instead of
    aborting the notebook; any other listing failure is re-raised unchanged.
    """
    try:
        return [f.name for f in dbutils.fs.ls(path)]
    except Exception as e:
        # dbutils surfaces a missing path as a wrapped JVM error whose message
        # names java.io.FileNotFoundException; there is no dedicated Python
        # exception class to catch, so the message is inspected instead.
        if "FileNotFoundException" in str(e):
            return []
        raise


# Step 1 – Create raw folder if needed
dbutils.fs.mkdirs(RAW_CLAIMS_DIR)

# Step 2 – Check if file exists in destination already
existing = _list_names(RAW_CLAIMS_DIR)
already_exists = INITIAL_TEST_FILE in existing

# Step 3 – Check if file exists in uploads directory
# (a missing uploads directory simply means "nothing available to copy")
uploads = _list_names(UPLOADS_DIR)
available_to_copy = INITIAL_TEST_FILE in uploads

# Step 4 – Conditionally copy file
if already_exists:
    # Re-running the bootstrap never overwrites a file that is already in place.
    print(f"Skipped (already exists): {dst}")
elif not available_to_copy:
    print(f"Skipped (not found in uploads): {src}")
else:
    try:
        dbutils.fs.cp(src, dst)
    except Exception as e:
        # Best-effort: report the failure without raising from the cell.
        print(f"Failed to copy: {e}")
    else:
        print(f"Bootstrapped: {INITIAL_TEST_FILE} copied to {dst}")