In [1]:
# step 1: bring in pathlib and point at the folder that holds the unzipped raw data
from pathlib import Path

unzipped = Path(r"C:\Users\venus\OneDrive\Documents\GitHub\Climate-Malnutrition-EastAfrica\data_raw\unzipped")
print("unzipped folder:", unzipped)

# show the name of every sub-folder in there (plain files are left out)
list(entry.name for entry in unzipped.iterdir() if entry.is_dir())


unzipped folder: C:\Users\venus\OneDrive\Documents\GitHub\Climate-Malnutrition-EastAfrica\data_raw\unzipped


['ETKR41DT',
 'ETKR51DT',
 'ETKR61DT',
 'ETKR71DT',
 'ETKR81DT',
 'KEKR01DT',
 'KEKR31DT',
 'KEKR3ADT',
 'KEKR42DT',
 'KEKR52DT',
 'KEKR72DT',
 'KEKR8CDT',
 'TZKR21DT',
 'TZKR3ADT',
 'TZKR41DT',
 'TZKR4IDT',
 'TZKR63DT',
 'TZKR7BDT',
 'TZKR82DT',
 'UGKR01DT',
 'UGKR33DT',
 'UGKR41DT',
 'UGKR52DT',
 'UGKR61DT',
 'UGKR7BDT']

In [3]:
# this cell goes inside each folder listed above and renames the raw .dta files to
# <Country>_<FileType>_<Year>.dta. with the two maps below that gives, for example,
# ETKR41FL.DTA → Ethiopia_KR_2005.dta and KEKR52FL.DTA → Kenya_KR_2010.dta.
#
# the cell is safe to re-run: only files whose stem still looks like a raw name
# (2-letter country + 2-letter file type + 2-character phase + "FL") are touched,
# so an already renamed file such as Ethiopia_KR_2005.dta is left alone.

import os
import re
from pathlib import Path

# my main unzipped folder
unzipped = Path(r"C:\Users\venus\OneDrive\Documents\GitHub\Climate-Malnutrition-EastAfrica\data_raw\unzipped")

# this dictionary helps me turn country code → name
country_map = {
    "ET": "Ethiopia",
    "KE": "Kenya",
    "TZ": "Tanzania",
    "UG": "Uganda"
}

# and this one turns phase → approximate survey year
# NOTE(review): the lookup uses the phase code alone, so one code gets the same year
# for every country, and codes that are missing here (e.g. "51", "72") end up in the
# file name unchanged. The original note on this cell gave ETKR41 → 2000 and
# KEKR52 → 2008, which disagrees with the values below — TODO confirm every year
# against the data provider's survey list before relying on the file names.
year_map = {
    "01": "1988",
    "17": "1992",
    "21": "1996",
    "31": "1998",
    "3A": "1999",
    "33": "2000",
    "41": "2005",
    "4I": "2007",
    "42": "2008",
    "52": "2010",
    "61": "2011",
    "63": "2013",
    "71": "2016",
    "7B": "2018",
    "8C": "2022",
    "81": "2021",
    "82": "2023"
}

# raw stems look like ETKR41FL: country (2 letters), file type (2 letters),
# phase (2 letters/digits), then the literal "FL"
_RAW_STEM = re.compile(r"([A-Z]{2})([A-Z]{2})([0-9A-Z]{2})FL")


def rename_survey_files(root, dry_run=False):
    """Rename the raw .dta files found in every sub-folder of `root`.

    Parameters
    ----------
    root : Path
        Folder whose sub-folders each hold the survey files.
    dry_run : bool, default False
        When True nothing is renamed; the planned renames are only printed.

    Returns
    -------
    list of (old_name, new_name) tuples
        One entry per file that was renamed (or would be, in a dry run).

    Files that do not match the raw naming pattern, and files whose target name
    already exists, are skipped. Country codes or phase codes that are missing from
    `country_map` / `year_map` are kept as-is in the new name (a warning is printed
    for an unmapped phase).
    """
    renamed = []

    # sorted() gives a stable order and takes a snapshot of each listing, so the
    # loop never walks a directory while it is being changed
    for folder in sorted(root.iterdir()):
        if not folder.is_dir():
            continue

        for file in sorted(folder.iterdir()):
            # compare the extension without regard to case: the raw files end in
            # ".DTA", and glob("*.dta") only finds those on case-insensitive
            # file systems
            if not file.is_file() or file.suffix.lower() != ".dta":
                continue

            parts = _RAW_STEM.fullmatch(file.stem.upper())
            if parts is None:
                # already renamed, or not one of the raw files: slicing such a
                # stem would produce a garbage name, so leave the file alone
                continue

            cc, file_type, phase = parts.groups()   # e.g. ET, KR, 41
            country = country_map.get(cc, cc)
            year = year_map.get(phase, phase)

            new_name = f"{country}_{file_type}_{year}.dta"
            new_path = file.with_name(new_name)

            if phase not in year_map:
                print("warning: no year mapped for phase", phase, "- using the code itself in", new_name)

            # os.rename replaces an existing target on POSIX and raises on Windows;
            # never clobber a file that is already there
            if new_path.exists():
                print("skipped:", file.name, "→", new_name, "(target already exists)")
                continue

            if not dry_run:
                os.rename(file, new_path)
            print("would rename:" if dry_run else "renamed:", file.name, "→", new_name)
            renamed.append((file.name, new_name))

    return renamed


# loop through every folder
if unzipped.is_dir():
    renamed_files = rename_survey_files(unzipped)
else:
    print("folder not found, nothing renamed:", unzipped)


renamed: ETKR41FL.DTA → Ethiopia_KR_2005.dta
renamed: ETKR51FL.DTA → Ethiopia_KR_51.dta
renamed: ETKR61FL.DTA → Ethiopia_KR_2011.dta
renamed: ETKR71FL.DTA → Ethiopia_KR_2016.dta
renamed: ETKR81FL.DTA → Ethiopia_KR_2021.dta
renamed: KEKR01FL.DTA → Kenya_KR_1988.dta
renamed: KEKR31FL.DTA → Kenya_KR_1998.dta
renamed: KEKR3AFL.DTA → Kenya_KR_1999.dta
renamed: KEKR42FL.DTA → Kenya_KR_2008.dta
renamed: KEKR52FL.DTA → Kenya_KR_2010.dta
renamed: KEKR72FL.DTA → Kenya_KR_72.dta
renamed: KEKR8CFL.DTA → Kenya_KR_2022.dta
renamed: TZKR21FL.DTA → Tanzania_KR_1996.dta
renamed: TZKR3AFL.DTA → Tanzania_KR_1999.dta
renamed: TZKR41FL.DTA → Tanzania_KR_2005.dta
renamed: TZKR4IFL.DTA → Tanzania_KR_2007.dta
renamed: TZKR63FL.DTA → Tanzania_KR_2013.dta
renamed: TZKR7BFL.DTA → Tanzania_KR_2018.dta
renamed: TZKR82FL.DTA → Tanzania_KR_2023.dta
renamed: UGKR01FL.DTA → Uganda_KR_1988.dta
renamed: UGKR33FL.DTA → Uganda_KR_2000.dta
renamed: UGKR41FL.DTA → Uganda_KR_2005.dta
renamed: UGKR52FL.DTA → Uganda_KR_2010.dta
renamed: UGKR61FL.DTA → Uganda_KR_2011.dta
renamed: UGKR7BFL.DTA → Uganda_KR_2018.dta

In [5]:
# sanity check: for each entry under `unzipped`, list the .dta files it now holds
# (entries without any .dta file print nothing)
for survey_dir in unzipped.iterdir():
    found_names = [path.name for path in survey_dir.glob("*.dta")]
    if len(found_names) > 0:
        print(survey_dir.name, "→", found_names)


ETKR41DT → ['Ethiopia_KR_2005.dta']
ETKR51DT → ['Ethiopia_KR_51.dta']
ETKR61DT → ['Ethiopia_KR_2011.dta']
ETKR71DT → ['Ethiopia_KR_2016.dta']
ETKR81DT → ['Ethiopia_KR_2021.dta']
KEKR01DT → ['Kenya_KR_1988.dta']
KEKR31DT → ['Kenya_KR_1998.dta']
KEKR3ADT → ['Kenya_KR_1999.dta']
KEKR42DT → ['Kenya_KR_2008.dta']
KEKR52DT → ['Kenya_KR_2010.dta']
KEKR72DT → ['Kenya_KR_72.dta']
KEKR8CDT → ['Kenya_KR_2022.dta']
TZKR21DT → ['Tanzania_KR_1996.dta']
TZKR3ADT → ['Tanzania_KR_1999.dta']
TZKR41DT → ['Tanzania_KR_2005.dta']
TZKR4IDT → ['Tanzania_KR_2007.dta']
TZKR63DT → ['Tanzania_KR_2013.dta']
TZKR7BDT → ['Tanzania_KR_2018.dta']
TZKR82DT → ['Tanzania_KR_2023.dta']
UGKR01DT → ['Uganda_KR_1988.dta']
UGKR33DT → ['Uganda_KR_2000.dta']
UGKR41DT → ['Uganda_KR_2005.dta']
UGKR52DT → ['Uganda_KR_2010.dta']
UGKR61DT → ['Uganda_KR_2011.dta']
UGKR7BDT → ['Uganda_KR_2018.dta']
