
## Snippet to download all the files from the "NHANES I" study.


In [None]:
import os
import requests

#
# NHANES I datasets
#
# Maps a dataset folder name to the list of ``(url, filename)`` pairs that
# belong to it.  All files are served from the same NHANES I directory, so
# each entry below only lists the file names (whitespace separated, in
# download order) and the URL is derived by prefixing the common base address.
# Entries with three names instead of four simply have one file fewer listed.
datasets = {
    folder_name: [
        ("https://wwwn.cdc.gov/nchs/data/nhanes1/" + file_name, file_name)
        for file_name in file_names.split()
    ]
    for folder_name, file_names in (
        (
            "Anthropometry_Goniometry_Skeletal_Age_Bone_Density_and_Cortical_Thickness_4111",
            "DU4111.txt DU4111.sas DU4111_F.sas 4111.pdf",
        ),
        ("Arthritis_Data_4121", "DU4121.txt DU4121.sas DU4121_F.sas 4121.pdf"),
        ("Audiometric_4241", "DU4241.txt DU4241.sas DU4241_F.sas 4241.pdf"),
        (
            "Biochemistry_Serology_Hematology_4800",
            "DU4800.txt DU4800.sas DU4800_F.sas 4800.pdf",
        ),
        (
            "Chest_XRay_Pulmonary_Diffusion_4251",
            "DU4251.txt DU4251.sas DU4251_F.sas 4251.pdf",
        ),
        ("Computer_ECG_4140", "DU4140.txt DU4140.sas DU4140_F.sas 4140.pdf"),
        ("Dental_4235", "DU4235.txt DU4235.sas DU4235_F.sas 4235.pdf"),
        ("Dermatology_4151", "DU4151.txt DU4151.sas DU4151_F.sas 4151.pdf"),
        ("Dietary_Frequency_4701", "DU4701.txt DU4701.sas DU4701_F.sas 4701.pdf"),
        (
            "General_WellBeing_Depression_Scale_4171",
            "DU4171.txt DU4171.sas DU4171_F.sas 4171.pdf",
        ),
        (
            "Health_Care_Needs_Respiratory_CV_Supplement_4091",
            "DU4091.txt DU4091.sas DU4091_F.sas 4091.pdf",
        ),
        ("Medical_History_1to11_4067", "DU4067.txt DU4067.sas DU4067_F.sas 4067.pdf"),
        ("Medical_History_12to74_4081", "DU4081.txt DU4081.sas DU4081_F.sas 4081.pdf"),
        ("Medical_Examination_4233", "DU4233.txt DU4233.sas DU4233_F.sas 4233.pdf"),
        ("Model_Gram_4702", "DU4702.txt DU4702.sas 4702_3.pdf"),
        (
            "Near_and_Distant_Vision_4163",
            "DU4163.txt DU4163.sas DU4163_F.sas 4163.pdf",
        ),
        ("Nutrient_Composition_4703", "DU4703.txt DU4703.sas 4702_3.pdf"),
        ("Ophthalmology_4161", "DU4161.txt DU4161.sas DU4161_F.sas 4161.pdf"),
        ("Spirometry_4250", "DU4250.txt DU4250.sas DU4250_F.sas 4250.pdf"),
        ("Food_Consumption_4704", "DU4704.txt DU4704.sas DU4704_F.sas 4704.pdf"),
    )
}



#
# The following NHANES I datasets are not downloaded or used by this snippet:
#
# Growth Charts (November, 2012)
#
# "Electrocardiogram": [
#     ("https://wwwn.cdc.gov/nchs/data/nhanes1/nh1ecg.dat", "nh1ecg.dat"),
#     ("https://wwwn.cdc.gov/nchs/data/nhanes1/nh1ecg.sas", "nh1ecg.sas"),
#     ("https://wwwn.cdc.gov/nchs/data/nhanes1/nh1ecg.pdf", "nh1ecg.pdf"),
# ],




def download_file(url, path, timeout=60):
    """Download ``url`` and store the response body at ``path``.

    The body is streamed in 8 KiB chunks, so it is never held in memory as a
    whole.  Data is first written to ``<path>.part`` and only moved to
    ``path`` once the transfer has finished, so an interrupted download never
    leaves a truncated file under the final name.

    Args:
        url: Address of the file to fetch.
        path: Destination file path; an existing file is replaced.
        timeout: Seconds to wait for the connection and for each read from
            the server before giving up (forwarded to ``requests.get``).
            This is not a limit on the total download time.

    Raises:
        requests.HTTPError: The server answered with a 4xx/5xx status; the
            destination is left untouched in that case.
        requests.RequestException: Any other request failure, including a
            timeout.
        OSError: The destination could not be written.
    """
    target = os.fspath(path)
    # Keep the suffix type in line with the path type (str or bytes).
    partial = target + (b".part" if isinstance(target, bytes) else ".part")
    try:
        # Using the response as a context manager releases the connection
        # even when writing fails part-way through a streamed body.
        with requests.get(url, stream=True, timeout=timeout) as r:
            r.raise_for_status()
            with open(partial, 'wb') as f:
                for chunk in r.iter_content(chunk_size=8192):
                    f.write(chunk)
        # Publish the finished file under its final name in one step.
        os.replace(partial, target)
    except BaseException:
        # Best-effort cleanup of the incomplete file; the original error is
        # what the caller needs to see, so a failed cleanup is ignored.
        try:
            os.remove(partial)
        except OSError:
            pass
        raise

# Fetch every dataset into a directory of its own, named after its key in
# ``datasets`` and created relative to the current working directory.
for dataset_name in datasets:
    # An already existing directory is reused, so the cell can be re-run.
    os.makedirs(dataset_name, exist_ok=True)
    for source_url, target_name in datasets[dataset_name]:
        print(f"Downloading {target_name} into {dataset_name}...")
        download_file(source_url, os.path.join(dataset_name, target_name))


Downloading DU4111.txt into Anthropometry_Goniometry_Skeletal_Age_Bone_Density_and_Cortical_Thickness_4111...
Downloading DU4111.sas into Anthropometry_Goniometry_Skeletal_Age_Bone_Density_and_Cortical_Thickness_4111...
Downloading DU4111_F.sas into Anthropometry_Goniometry_Skeletal_Age_Bone_Density_and_Cortical_Thickness_4111...
Downloading 4111.pdf into Anthropometry_Goniometry_Skeletal_Age_Bone_Density_and_Cortical_Thickness_4111...
Downloading DU4121.txt into Arthritis_Data_4121...
Downloading DU4121.sas into Arthritis_Data_4121...
Downloading DU4121_F.sas into Arthritis_Data_4121...
Downloading 4121.pdf into Arthritis_Data_4121...
Downloading DU4241.txt into Audiometric_4241...
Downloading DU4241.sas into Audiometric_4241...
Downloading DU4241_F.sas into Audiometric_4241...
Downloading 4241.pdf into Audiometric_4241...
Downloading DU4800.txt into Biochemistry_Serology_Hematology_4800...
Downloading DU4800.sas into Biochemistry_Serology_Hematology_4800...
Downloading DU4800_F.sas i