# Check sex chromosomes for caudate nucleus

In [None]:
suppressMessages({library(dplyr)
                  library(ggpubr)})

## Get and annotate sex from genotypes

In [None]:
# Read the genotype sex-check table and the phenotype table, join them on
# FID == BrNum, keep the columns needed for the check, drop duplicate rows
# and turn every character column into a factor.
sexcheck_file <- paste0('../../../input/genotypes/check_sex/_m/',
                        'LIBD_Brain_TopMed.sexcheck')
pheno_file <- '../../..//input/phenotypes/_m/phenotypes.csv'

dt <- data.table::fread(sexcheck_file) %>%
    inner_join(data.table::fread(pheno_file), by=c("FID"="BrNum")) %>%
    select(c("FID", "Dx", "Sex", "Age", "F", "SNPSEX")) %>%
    distinct() %>% mutate_if(is.character, as.factor)

# `levels<-` relabels strictly by position and also accepts more labels than
# there are existing levels, so with a single sex present every donor would
# silently become 'Woman'. Fail loudly unless there are exactly two levels.
# NOTE(review): assumes the first level (alphabetical order from as.factor)
# is the female code and the second the male code -- confirm against the
# coding used in phenotypes.csv.
stopifnot(is.factor(dt$Sex), nlevels(dt$Sex) == 2L)
levels(dt$Sex) <- c('Woman', 'Man')
dt %>% head(2)

## Plot F estimate

In [None]:
# Box plot of the F estimate grouped by reported gender, with the individual
# samples overlaid as semi-transparent jittered points and bold axis titles.
# The legend is suppressed because the fill colour duplicates the x axis;
# "none" (lower case) is the spelling documented by ggpubr for `legend`.
fig <- ggboxplot(dt, x = "Sex", y = "F", fill='Sex', width=0.65, palette='npg',
                 xlab='Reported Gender', ylab='F estimate\n(Genotype Sex)',
                 ggtheme=theme_pubr(base_size=20), add="jitter",
                 add.params=list(alpha=0.5), legend="none") +
    font("xy.title", face='bold')
fig

In [None]:
# Save the box plot as PNG, PDF and SVG. The plot object is passed explicitly
# so the files do not depend on whichever plot happened to be displayed last
# (ggsave() otherwise falls back to last_plot()).
for (ext in c("png", "pdf", "svg")) {
    ggsave(paste0("sex_check.", ext), plot = fig)
}

In [None]:
# Mean and maximum F estimate within each reported gender, ignoring missing
# values. `.data$F` makes it explicit that the column F is meant, not the
# built-in alias of FALSE.
dt %>%
  group_by(Sex) %>%
  summarize(mean_F = mean(.data$F, na.rm = TRUE),
            max_F = max(.data$F, na.rm = TRUE))

## Check that reported gender matches genotype sex

In [None]:
# Donors reported as "Man": total count, then the number of them whose
# genotype call is SNPSEX == 1 (the code this check pairs with "Man").
with(dt, sum(Sex == "Man"))
with(dt, sum(SNPSEX == 1 & Sex == "Man"))

In [None]:
# Donors reported as "Woman": total count, then the number of them whose
# genotype call is SNPSEX == 2 (the code this check pairs with "Woman").
with(dt, sum(Sex == "Woman"))
with(dt, sum(SNPSEX == 2 & Sex == "Woman"))

### Examine number of X chromosomes

In [None]:
# Frequency of each genotype-derived sex code.
table(dt[["SNPSEX"]])

In [None]:
# Frequency of each reported gender label.
table(dt[["Sex"]])

#### Summary: All samples have reported gender matching genotype sex

## Reproducibility Information

In [None]:
# Widen the console first so the session report below is not wrapped.
options(width = 120)
# Timestamp of this run and the CPU/elapsed time used by the R process.
Sys.time()
proc.time()
# R version, platform and the versions of all attached/loaded packages.
sessioninfo::session_info()