In [41]:
import pandas as pd
from scipy import stats

# Load the spreadsheet into a DataFrame.
data = pd.read_excel('BIOCARD_ICM_random200.xlsx')

# Remove leading/trailing single quotes from the column labels only;
# the cell values themselves are left exactly as read.
unquoted_labels = data.columns.str.strip("'")
data.columns = unquoted_labels

# Plain-text preview of the first rows.
print(data.head())

    Subject_ID Gender   Age Diagnosis  ACR_R  AGWM_R   AG_R  ALIC_R  Amyg_R  \
0  'Subject_1'    'F'  56.8  'NORMAL'  14270    3694  12859    2294    2310   
1  'Subject_2'    'F'  53.2  'NORMAL'  12964    3275  12063    2367    1697   
2  'Subject_3'    'F'  81.0  'NORMAL'   9742    3386  10980    1586    1400   
3  'Subject_4'    'M'  69.6  'NORMAL'  10960    3709  12992    2301    2150   
4  'Subject_5'    'M'  55.3  'NORMAL'  13137    2757  13342    2275    2166   

   AnteriorBasalForebrain_R  ...  TempSul_L  Thalamus_L  dorsalWM_ACC_L  \
0                       338  ...       1175        6638            1523   
1                       243  ...        858        5100            1419   
2                       175  ...       1437        4546             795   
3                       301  ...       1350        5400            1829   
4                       278  ...       1713        5770            1421   

   dorsal_ACC_L  rostralWM_ACC_L  rostral_ACC_L  subcallosalWM_ACC_L  \
0 

In [42]:

# Control and disease/disorder groups.
# The raw sheet stores diagnosis labels wrapped in literal single quotes
# (e.g. 'NORMAL'). Normalise the labels (surrounding whitespace and quotes
# removed) before comparing, so the split keeps working whether or not the
# values have been cleaned, instead of silently producing empty groups.
diagnosis_labels = data['Diagnosis'].astype(str).str.strip().str.strip("'")
control_group = data[diagnosis_labels == 'NORMAL']
disease_group = data[diagnosis_labels == 'AD/MCI']

# Columns for the limbic system brain regions (right/left pair per region).
brain_region_columns = ['Amyg_R', 'Amyg_L', 'Fimbria_R', 'Fimbria_L', 'Hippo_R', 'Hippo_L', 'Mammillary_R', 'Mammillary_L']

# Maps a brain-region column name to its test statistics; filled in later.
results = {}

In [43]:
# Set your significance level (alpha)
alpha = 0.05

# Start from an empty mapping every time this cell runs. Otherwise a region
# that now falls into the "Not enough data" branch would keep the entry
# written by a previous run and still be reported downstream.
results = {}

# Perform an independent two-sample t-test for each brain region.
# NOTE(review): scipy's ttest_ind defaults to equal_var=True (Student's
# t-test, two-sided). If the two groups differ in size or variance,
# consider equal_var=False (Welch's t-test) -- confirm with the analysis plan.
for column in brain_region_columns:
    # Missing measurements are dropped per group, per region.
    control_values = control_group[column].dropna()
    disease_values = disease_group[column].dropna()

    # Skip regions where either group has fewer than two observations.
    if len(control_values) < 2 or len(disease_values) < 2:
        print(f"Not enough data for {column}")
        continue

    t_statistic, p_value = stats.ttest_ind(control_values, disease_values)

    results[column] = {
        't_statistic': t_statistic,
        'p_value': p_value,
    }

In [44]:
# Print each region's test statistics followed by the decision at level alpha.
for column, result in results.items():
    print(f"Brain Region: {column}")
    print(f"  t-statistic: {result['t_statistic']}")
    print(f"  p-value: {result['p_value']}")

    # The null hypothesis is rejected when the p-value does not exceed alpha.
    is_significant = result['p_value'] <= alpha
    print(
        "  Null hypothesis rejected: There is a significant difference."
        if is_significant
        else "  Null hypothesis not rejected: No significant difference."
    )

Brain Region: Amyg_R
  t-statistic: 0.5380404845001473
  p-value: 0.591153371178904
  Null hypothesis not rejected: No significant difference.
Brain Region: Amyg_L
  t-statistic: 1.7635053385308637
  p-value: 0.07935767887889372
  Null hypothesis not rejected: No significant difference.
Brain Region: Fimbria_R
  t-statistic: 3.2764383126638683
  p-value: 0.001241262260055997
  Null hypothesis rejected: There is a significant difference.
Brain Region: Fimbria_L
  t-statistic: 1.380000034037533
  p-value: 0.16914286194712758
  Null hypothesis not rejected: No significant difference.
Brain Region: Hippo_R
  t-statistic: -1.0490133350400956
  p-value: 0.29545072386155785
  Null hypothesis not rejected: No significant difference.
Brain Region: Hippo_L
  t-statistic: -1.237492350721392
  p-value: 0.21736986747035617
  Null hypothesis not rejected: No significant difference.
Brain Region: Mammillary_R
  t-statistic: -1.1903519132937355
  p-value: 0.23533332123207135
  Null hypothesis not reje