# Anatomical Abnormalities Associated with Schizophrenia—An Observational Study

In [None]:
# standard library imports
import warnings

# 3rd party library imports
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import pingouin as pg
import scipy.stats
import seaborn as sns

# keep FutureWarning messages out of the cell outputs
warnings.simplefilter('ignore', category=FutureWarning)

# show floats with three digits after the decimal point
pd.set_option('display.float_format', "{:.3f}".format)

# enable TeX on figure labels
plt.rcParams.update({'text.usetex': True})

# apply the seaborn default theme to matplotlib figures
sns.set()

# load the data set used by the rest of the notebook
df = pd.read_csv('case0202.csv')

# Robustness of Assumptions

In [None]:
# summary statistics for each numeric column of the loaded data
df.describe()

In [None]:
# Wrangle the data into long form: one row per measurement, with the
# original column label in 'Treatment' and the measured value in 'Volume'.

# stack() moves the column labels into an inner index level ...
stacked = df.stack()

# ... and reset_index(level=1) turns that level back into a column, which
# pandas names 'level_1'; the stacked values land in a column named 0
long_columns = {'level_1': 'Treatment', 0: 'Volume'}
dflong = stacked.reset_index(level=1).rename(columns=long_columns)

dflong.head()

In [None]:
# Compare the two groups side by side: box plots on the left, kernel density
# estimates on the right, both drawn from the long-form frame.
fig, axes = plt.subplots(ncols=2, figsize=[12, 6.4])
ax_box, ax_kde = axes

# shared axis label so both panels report the same units
volume_label = r'Volume ($cm^3$)'

sns.boxplot(data=dflong, x='Treatment', y='Volume', ax=ax_box)
ax_box.set(ylabel=volume_label, title='Hippocampus Volumes for Schizophrenia Study')

# label the density panel as well, so each panel can be read on its own
sns.kdeplot(data=dflong, x='Volume', hue='Treatment', ax=ax_kde)
ax_kde.set(xlabel=volume_label, title='Distribution of Hippocampus Volumes');

There is weak evidence against both normality and equal variance.

$H_0: \mu_{affected} = \mu_{unaffected}$
<br>
$H_a: \mu_{affected} \ne \mu_{unaffected}$

In [None]:
# Paired t-test on the Affected and Unaffected columns (Affected is passed
# first, so the test is on Affected minus Unaffected).
res = pg.ttest(df['Affected'], df['Unaffected'], paired=True)

# display the result as the cell's last expression (rich output), matching
# how the other cells in this notebook show their tables
res

There is strong evidence that the mean difference in left hippocampus volumes between schizophrenic individuals and their nonschizophrenic twins is non-zero (two-sided $p$-value = 0.006, $t_{14}$ = -3.229). The mean left hippocampus volume is estimated to be between 0.07 and 0.33 $cm^3$ smaller for the schizophrenic individuals (95% confidence interval).