In [2]:
from scipy.stats import ttest_ind
import pandas as pd

# Build a per-measure EXP-vs-HC summary table (mean, std, Welch t-test p-value)
# from the participant demographic/clinical CSV.
file_path = '/home/changbae/fmri_project/MDMR/notebook/data/participant_demo_clinical.csv'
data = pd.read_csv(file_path)

# Columns to exclude (these look like participant/bookkeeping identifiers —
# TODO confirm with the data dictionary).
exclude_columns = ['HAID ID', 'Exp No.', 'fmri_code', 'Screening #', 'Enrollment #']

# Keep every other column; GROUP stays because it drives the split below.
columns_to_include = [col for col in data.columns if col not in exclude_columns]
filtered_data = data[columns_to_include]

# Split data into EXP and HC groups
exp_group = filtered_data[filtered_data['GROUP'] == 'EXP']
hc_group = filtered_data[filtered_data['GROUP'] == 'HC']

# Columns that are actually compared between the groups.
# 'Unnamed: ...' columns are what pandas calls header-less columns, i.e. a row
# index that was written out by an earlier to_csv; they are row numbers, not
# measures, so they must not be t-tested or reported.
# NOTE(review): a t-test is applied to every remaining column, including ones
# that look categorical (e.g. '1. SEX') — confirm that is intended.
measure_columns = [
    col for col in columns_to_include
    if col != 'GROUP' and not str(col).startswith('Unnamed:')
]

# One record per measure; collected in a list and converted once at the end.
results = []

for column in measure_columns:
    # Missing values are dropped per group and per column, so the sample size
    # can differ from measure to measure.
    exp_values = exp_group[column].dropna().astype(float)
    hc_values = hc_group[column].dropna().astype(float)

    # equal_var=False selects Welch's t-test (no equal-variance assumption).
    t_stat, p_value = ttest_ind(exp_values, hc_values, equal_var=False)

    results.append({
        'Measure': column,
        'Mean_EXP': exp_values.mean(),
        'STD_EXP': exp_values.std(),
        'Mean_HC': hc_values.mean(),
        'STD_HC': hc_values.std(),
        'P_value': p_value
    })

# Convert results to DataFrame; the explicit column list keeps the schema
# stable even if no measure column was found.
results_df = pd.DataFrame(
    results,
    columns=['Measure', 'Mean_EXP', 'STD_EXP', 'Mean_HC', 'STD_HC', 'P_value'],
)

In [4]:
# Persist the per-measure summary table. index=False keeps the meaningless
# 0..n-1 row index out of the file, so reading it back does not introduce an
# extra 'Unnamed: 0' column.
results_df.to_csv("/home/changbae/fmri_project/MDMR/notebook/data/clinical_measure_summary.csv", index=False)

In [6]:
# Display the HC subset (rows of filtered_data where GROUP == 'HC') for a
# visual sanity check of the loaded columns and values.
hc_group

Unnamed: 0.1,Unnamed: 0,GROUP,1. SEX,2.AGE,3-2. YR_EDU,STAI-X-1,STAI-X-2,HADS_anxiety,HADS_depression,SWLS,...,lsas,MOCI,checking,cleaning,doubting,slowness,BFNE,PSWQ,Handedness(true),FCV-19S
3,3,HC,1,25,15.0,35.0,27.0,14.0,9.0,24.0,...,18.0,24.0,7.0,11.0,3.0,7.0,31.0,48.0,47.0,3.0
5,5,HC,1,29,18.0,22.0,17.0,15.0,8.0,24.0,...,6.0,26.0,7.0,11.0,5.0,7.0,14.0,19.0,41.0,1.0
6,6,HC,2,23,17.0,32.0,27.0,15.0,7.0,29.0,...,28.0,22.0,7.0,8.0,5.0,5.0,28.0,32.0,48.0,3.0
8,8,HC,2,22,16.0,34.0,34.0,16.0,7.0,8.0,...,14.0,27.0,8.0,10.0,6.0,6.0,40.0,46.0,39.0,5.0
10,10,HC,2,25,18.0,35.0,28.0,15.0,6.0,20.0,...,38.0,14.0,6.0,4.0,3.0,5.0,33.0,45.0,44.0,12.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
114,114,HC,1,29,15.0,30.0,31.0,2.0,3.0,19.0,...,13.0,2.0,2.0,0.0,0.0,0.0,29.0,40.0,43.0,7.0
115,115,HC,1,29,16.0,43.0,36.0,3.0,7.0,23.0,...,19.0,8.0,2.0,1.0,4.0,1.0,40.0,37.0,40.0,9.0
116,116,HC,2,28,12.0,32.0,28.0,0.0,4.0,13.0,...,45.0,8.0,3.0,0.0,3.0,2.0,43.0,32.0,42.0,9.0
117,117,HC,2,25,12.0,32.0,34.0,1.0,4.0,18.0,...,8.0,5.0,1.0,0.0,4.0,0.0,38.0,44.0,41.0,11.0
