# In [None]:
import pandas as pd
import numpy as np

# Find the records of a REDCap CSV export that have at least one 'data_return'
# field filled in, and write those records to their own CSV file.

# Separator used in this export's checkbox option columns ('<field>___<code>').
CHECKBOX_SEP = '___'

#list of all possible data_return fields matching the export
expected_fields = [
    'dr_status', 'dr_type', 'dr_loc', 'dr_url', 'genie_id',
    'gel_eligibility', 'gel_consent', 'gel_blood', 'dr_other'
]


def select_data_return_fields(columns, fields):
    """Return the export columns that belong to the wanted fields.

    A column is kept when its name is one of ``fields``, or when it is a
    checkbox option column (``<field>___<code>``) whose base name, i.e. the
    text before the first ``___``, is one of ``fields``. Matching on the exact
    name only would silently drop every checkbox column.

    Args:
        columns: Iterable of column names (strings) from the export.
        fields: Iterable of base field names to look for.

    Returns:
        List of matching column names, in the order they appear in ``columns``.
    """
    wanted = set(fields)
    return [
        col for col in columns
        # partition() returns the whole name as the base when there is no
        # separator, so plain and checkbox columns share one test.
        if col.partition(CHECKBOX_SEP)[0] in wanted
    ]


# Run the I/O only when executed directly (script or notebook cell), not on
# import. No function scope is introduced, so df, has_data_return, etc. remain
# module-level names.
if __name__ == "__main__":
    #load data return table and interpret correctly
    df = pd.read_csv("redcap_export.csv", encoding='utf-8')

    #replace 0s in checkbox fields with NaN (to treat as missing)
    # NOTE(review): this rewrites df itself, so unchecked boxes in *every*
    # checkbox column are also blank in the exported CSV below - confirm
    # that this is wanted.
    checkbox_fields = [col for col in df.columns if CHECKBOX_SEP in col]
    df[checkbox_fields] = df[checkbox_fields].replace([0, '0'], np.nan)

    #only include fields that i want (plain columns and checkbox option columns)
    data_return_fields = select_data_return_fields(df.columns, expected_fields)
    if not data_return_fields:
        # With no columns to inspect, every row counts as empty and the
        # result is 0 records; say so rather than failing silently.
        print("Warning: none of the expected data_return fields were found in the export.")

    #identify rows where ALL data_return fields are empty
    empty_data_return = df[data_return_fields].isnull().all(axis=1)

    #invert to find rows where at least one field has data
    has_data_return = df[~empty_data_return]

    #check for results
    print(f"Found {len(has_data_return)} records with at least one field filled in 'data_return'.")

    #export to CSV
    has_data_return.to_csv("records_with_data_return.csv", index=False, encoding='utf-8')

