## Supplementary Table 1. Baseline characteristics of the ARIC cohort (N=10,871)

In [1]:
library(data.table)
library(ggplot2)
library(ggpubr)
library(cowplot)
theme_set(theme_cowplot())
library(dplyr)
library(tidyr)


Attaching package: 'cowplot'


The following object is masked from 'package:ggpubr':

    get_legend



Attaching package: 'dplyr'


The following objects are masked from 'package:data.table':

    between, first, last


The following objects are masked from 'package:stats':

    filter, lag


The following objects are masked from 'package:base':

    intersect, setdiff, setequal, union




In [2]:
# set working directory
setwd("/medpop/esp2/mesbah/projects/ch_progression/aric/pheno/")

In [3]:
# Baseline pop
aric_baseline_full <- fread("aric_baseline_N10881.pheno_ch_status.23Mar2023.csv", header=T)

# Samples with Follow-up
aric_baseline_n_v05_noPrevHeme <- fread("aric_baseline_n_v05_N4187.pheno_ch_status.noHemeCA.9May2023.csv", header=T)


In [4]:
## SBP and DBP
bp_baseline <- fread("aric_baseline_bp_20230508.csv", header=T)
# summary(bp_baseline)
table(bp_baseline$aricid %in% aric_baseline_full$aricid, exclude=NULL)
aric_baseline_full <- merge(aric_baseline_full, 
                             bp_baseline[,c(3,5,6)], 
                             by = "aricid")
summary(aric_baseline_full$dbp_base)
summary(aric_baseline_full$sbp_base)

## Heme CA
hemeCA_baseline <- fread("aric_hem_cancer_20230507.csv", header=T)
# summary(hemeCA_baseline)
table(hemeCA_baseline$aricid %in% aric_baseline_full$aricid, exclude=NULL)

aric_baseline_full <- merge(aric_baseline_full, 
                             hemeCA_baseline[,c(1,17,18,19,20,21)], 
                             by = "aricid")

table(aric_baseline_full$hem_can_inc_base, exclude = NULL)
table(aric_baseline_full$hem_can_base, exclude = NULL)
aric_baseline_full[which(aric_baseline_full$hem_can_base==1),c(1,2)]


 TRUE 
10881 

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
   18.0    66.0    72.0    72.6    79.0   133.0       2 

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
   62.0   109.0   120.0   122.4   133.0   242.0       2 


FALSE  TRUE 
 4911 10881 


   0    1 <NA> 
9871  305  705 


    0     1  <NA> 
10176    10   695 

aricid,gwasid
<chr>,<chr>
F104165,A15404
F159114,A02532
F317722,A07633
J145941,A02524
J224295,A12238
M156005,A16338
M204906,A16420
M311260,A15977
W180449,A14702
W241017,A04745


In [5]:
## exclude prev. heme CA
aric_baseline_full_noPrevHeme <- subset(aric_baseline_full, aric_baseline_full$hem_can_base==0 | is.na(aric_baseline_full$hem_can_base) )
nrow(aric_baseline_full_noPrevHeme)

In [6]:
table(aric_baseline_full_noPrevHeme$aricid %in% aric_baseline_n_v05_noPrevHeme$ARIC_ID)


FALSE  TRUE 
 6684  4187 

In [7]:
aric_baseline_full_noPrevHeme$followUp <- ifelse(aric_baseline_full_noPrevHeme$aricid %in% aric_baseline_n_v05_noPrevHeme$ARIC_ID, 1,0)
table(aric_baseline_full_noPrevHeme$followUp)


   0    1 
6684 4187 

In [14]:
# fwrite(aric_baseline_full, "aric_baseline_N10881.pheno_ch_status_bp_heme.10May2023.csv", 
  #  row.names = F, col.names = T, sep=",")

# fwrite(aric_baseline_full_noPrevHeme, "aric_baseline_N10881.pheno_ch_status_bp_heme.noHemeCA.10May2023.csv", 
  #   row.names = F, col.names = T, sep=",")

In [8]:
aric_baseline_full_noPrevHeme <-  fread("aric_baseline_N10881.pheno_ch_status_bp_heme.noHemeCA.10May2023.csv", 
                                        header=T)

In [9]:
table(aric_baseline_full_noPrevHeme$followUp)


   0    1 
6684 4187 

In [5]:
round(summary(aric_baseline_full_noPrevHeme$age_base[aric_baseline_full_noPrevHeme$followUp==0]),1)
round(summary(aric_baseline_full_noPrevHeme$age_base[aric_baseline_full_noPrevHeme$followUp==1]),1)

t.test(aric_baseline_full_noPrevHeme$age_base[aric_baseline_full_noPrevHeme$followUp==0], 
       aric_baseline_full_noPrevHeme$age_base[aric_baseline_full_noPrevHeme$followUp==1])

formatC(t.test(aric_baseline_full_noPrevHeme$age_base[aric_baseline_full_noPrevHeme$followUp==0], 
       aric_baseline_full_noPrevHeme$age_base[aric_baseline_full_noPrevHeme$followUp==1])$p.value, 
        digit=1,format="E")

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
   44.0    54.0    59.0    58.5    64.0    84.0 

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
   45.0    51.0    55.0    55.5    59.0    83.0 


	Welch Two Sample t-test

data:  aric_baseline_full_noPrevHeme$age_base[aric_baseline_full_noPrevHeme$followUp == 0] and aric_baseline_full_noPrevHeme$age_base[aric_baseline_full_noPrevHeme$followUp == 1]
t = 26.489, df = 9522.6, p-value < 2.2e-16
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 2.779387 3.223609
sample estimates:
mean of x mean of y 
 58.47606  55.47456 


In [25]:
# Sex
table(aric_baseline_full_noPrevHeme$Sex[aric_baseline_full_noPrevHeme$followUp==0])
round(prop.table(table(aric_baseline_full_noPrevHeme$Sex[aric_baseline_full_noPrevHeme$followUp==0]))*100,1)

table(aric_baseline_full_noPrevHeme$Sex[aric_baseline_full_noPrevHeme$followUp==1])
round(prop.table(table(aric_baseline_full_noPrevHeme$Sex[aric_baseline_full_noPrevHeme$followUp==1]))*100,1)

# Race
table(aric_baseline_full_noPrevHeme$race_BW[aric_baseline_full_noPrevHeme$followUp==0])
round(prop.table(table(aric_baseline_full_noPrevHeme$race_BW[aric_baseline_full_noPrevHeme$followUp==0]))*100,1)

table(aric_baseline_full_noPrevHeme$race_BW[aric_baseline_full_noPrevHeme$followUp==1])
round(prop.table(table(aric_baseline_full_noPrevHeme$race_BW[aric_baseline_full_noPrevHeme$followUp==1]))*100,1)



   F    M 
3664 3020 


   F    M 
54.8 45.2 


   F    M 
2478 1709 


   F    M 
59.2 40.8 


   B    W 
2171 4513 


   B    W 
32.5 67.5 


   B    W 
 951 3236 


   B    W 
22.7 77.3 

In [11]:
cat("Sex")
chisq.test(table(aric_baseline_full_noPrevHeme$Sex,
           aric_baseline_full_noPrevHeme$followUp) )

cat("Race")
chisq.test(table(aric_baseline_full_noPrevHeme$race_BW,
           aric_baseline_full_noPrevHeme$followUp) )

chisq.test(table(aric_baseline_full_noPrevHeme$race_BW,
           aric_baseline_full_noPrevHeme$followUp) )$p.value

Sex


	Pearson's Chi-squared test with Yates' continuity correction

data:  table(aric_baseline_full_noPrevHeme$Sex, aric_baseline_full_noPrevHeme$followUp)
X-squared = 19.786, df = 1, p-value = 8.66e-06


Race


	Pearson's Chi-squared test with Yates' continuity correction

data:  table(aric_baseline_full_noPrevHeme$race_BW, aric_baseline_full_noPrevHeme$followUp)
X-squared = 119.5, df = 1, p-value < 2.2e-16


In [7]:
# smoking
table(aric_baseline_full_noPrevHeme$ever_smoke[aric_baseline_full_noPrevHeme$followUp==0])
round(prop.table(table(aric_baseline_full_noPrevHeme$ever_smoke[aric_baseline_full_noPrevHeme$followUp==0]))*100,1)

table(aric_baseline_full_noPrevHeme$ever_smoke[aric_baseline_full_noPrevHeme$followUp==1])
round(prop.table(table(aric_baseline_full_noPrevHeme$ever_smoke[aric_baseline_full_noPrevHeme$followUp==1]))*100,1)

t.test(aric_baseline_full_noPrevHeme$ever_smoke[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$ever_smoke[aric_baseline_full_noPrevHeme$followUp==1])

formatC(t.test(aric_baseline_full_noPrevHeme$ever_smoke[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$ever_smoke[aric_baseline_full_noPrevHeme$followUp==1])$p.value, digit=1, format="E")


   0    1 
2448 4212 


   0    1 
36.8 63.2 


   0    1 
1908 2269 


   0    1 
45.7 54.3 


	Welch Two Sample t-test

data:  aric_baseline_full_noPrevHeme$ever_smoke[aric_baseline_full_noPrevHeme$followUp == 0] and aric_baseline_full_noPrevHeme$ever_smoke[aric_baseline_full_noPrevHeme$followUp == 1]
t = 9.1863, df = 8651.6, p-value < 2.2e-16
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 0.07018124 0.10825796
sample estimates:
mean of x mean of y 
0.6324324 0.5432128 


In [8]:
## BMI
round(summary(aric_baseline_full_noPrevHeme$bmi_base[aric_baseline_full_noPrevHeme$followUp==0]),1)
round((sd(aric_baseline_full_noPrevHeme$bmi_base[aric_baseline_full_noPrevHeme$followUp==0], na.rm = T)),1)

round(summary(aric_baseline_full_noPrevHeme$bmi_base[aric_baseline_full_noPrevHeme$followUp==1]),1)
round((sd(aric_baseline_full_noPrevHeme$bmi_base[aric_baseline_full_noPrevHeme$followUp==1], na.rm = T)),1)

t.test(aric_baseline_full_noPrevHeme$bmi_base[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$bmi_base[aric_baseline_full_noPrevHeme$followUp==1])

formatC(t.test(aric_baseline_full_noPrevHeme$bmi_base[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$bmi_base[aric_baseline_full_noPrevHeme$followUp==1])$p.value, 
        digit=1, format="E")


   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
   14.0    24.6    27.6    28.5    31.4    67.3      15 

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
   15.9    24.2    27.0    27.8    30.4    55.0       4 


	Welch Two Sample t-test

data:  aric_baseline_full_noPrevHeme$bmi_base[aric_baseline_full_noPrevHeme$followUp == 0] and aric_baseline_full_noPrevHeme$bmi_base[aric_baseline_full_noPrevHeme$followUp == 1]
t = 6.821, df = 9730, p-value = 9.581e-12
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 0.5182605 0.9362599
sample estimates:
mean of x mean of y 
 28.50137  27.77411 


In [9]:
## sBP
round(summary(aric_baseline_full_noPrevHeme$sbp_base[aric_baseline_full_noPrevHeme$followUp==0]),1)
round((sd(aric_baseline_full_noPrevHeme$sbp_base[aric_baseline_full_noPrevHeme$followUp==0], na.rm = T)),1)

round(summary(aric_baseline_full_noPrevHeme$sbp_base[aric_baseline_full_noPrevHeme$followUp==1]),1)
round((sd(aric_baseline_full_noPrevHeme$sbp_base[aric_baseline_full_noPrevHeme$followUp==1], na.rm = T)),1)

t.test(aric_baseline_full_noPrevHeme$sbp_base[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$sbp_base[aric_baseline_full_noPrevHeme$followUp==1])

formatC(t.test(aric_baseline_full_noPrevHeme$sbp_base[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$sbp_base[aric_baseline_full_noPrevHeme$followUp==1])$p.value, 
        digit=1, format="E")

## dBP
round(summary(aric_baseline_full_noPrevHeme$dbp_base[aric_baseline_full_noPrevHeme$followUp==0]),1)
round((sd(aric_baseline_full_noPrevHeme$dbp_base[aric_baseline_full_noPrevHeme$followUp==0], na.rm = T)),1)

round(summary(aric_baseline_full_noPrevHeme$dbp_base[aric_baseline_full_noPrevHeme$followUp==1]),1)
round((sd(aric_baseline_full_noPrevHeme$dbp_base[aric_baseline_full_noPrevHeme$followUp==1], na.rm = T)),1)

t.test(aric_baseline_full_noPrevHeme$dbp_base[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$dbp_base[aric_baseline_full_noPrevHeme$followUp==1])

formatC(t.test(aric_baseline_full_noPrevHeme$dbp_base[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$dbp_base[aric_baseline_full_noPrevHeme$followUp==1])$p.value, 
        digit=1, format="E")

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
   74.0   111.0   122.0   124.8   136.0   242.0 

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
   62.0   107.0   117.0   118.4   127.0   220.0       2 


	Welch Two Sample t-test

data:  aric_baseline_full_noPrevHeme$sbp_base[aric_baseline_full_noPrevHeme$followUp == 0] and aric_baseline_full_noPrevHeme$sbp_base[aric_baseline_full_noPrevHeme$followUp == 1]
t = 18.394, df = 9994, p-value < 2.2e-16
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 5.705755 7.066927
sample estimates:
mean of x mean of y 
 124.8204  118.4341 


   Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
   18.0    65.0    72.0    72.7    79.0   133.0 

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
   39.0    66.0    72.0    72.4    79.0   124.0       2 


	Welch Two Sample t-test

data:  aric_baseline_full_noPrevHeme$dbp_base[aric_baseline_full_noPrevHeme$followUp == 0] and aric_baseline_full_noPrevHeme$dbp_base[aric_baseline_full_noPrevHeme$followUp == 1]
t = 1.5135, df = 9531.3, p-value = 0.1302
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 -0.08958267  0.69665437
sample estimates:
mean of x mean of y 
 72.71781  72.41427 


In [10]:
# Chol medication
table(aric_baseline_full_noPrevHeme$chol_med_base[aric_baseline_full_noPrevHeme$followUp==0])
round(prop.table(table(aric_baseline_full_noPrevHeme$chol_med_base[aric_baseline_full_noPrevHeme$followUp==0]))*100,1)

table(aric_baseline_full_noPrevHeme$chol_med_base[aric_baseline_full_noPrevHeme$followUp==1])
round(prop.table(table(aric_baseline_full_noPrevHeme$chol_med_base[aric_baseline_full_noPrevHeme$followUp==1]))*100,1)

t.test(aric_baseline_full_noPrevHeme$chol_med_base[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$chol_med_base[aric_baseline_full_noPrevHeme$followUp==1])

formatC(t.test(aric_baseline_full_noPrevHeme$chol_med_base[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$chol_med_base[aric_baseline_full_noPrevHeme$followUp==1])$p.value, digit=1, format="E")


   0    1 
6169  470 


   0    1 
92.9  7.1 


   0    1 
3948  231 


   0    1 
94.5  5.5 


	Welch Two Sample t-test

data:  aric_baseline_full_noPrevHeme$chol_med_base[aric_baseline_full_noPrevHeme$followUp == 0] and aric_baseline_full_noPrevHeme$chol_med_base[aric_baseline_full_noPrevHeme$followUp == 1]
t = 3.278, df = 9622.3, p-value = 0.001049
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 0.006238152 0.024796673
sample estimates:
 mean of x  mean of y 
0.07079379 0.05527638 


In [11]:
# Hypertension
table(aric_baseline_full_noPrevHeme$htn_5_base[aric_baseline_full_noPrevHeme$followUp==0])
round(prop.table(table(aric_baseline_full_noPrevHeme$htn_5_base[aric_baseline_full_noPrevHeme$followUp==0]))*100,1)

table(aric_baseline_full_noPrevHeme$htn_5_base[aric_baseline_full_noPrevHeme$followUp==1])
round(prop.table(table(aric_baseline_full_noPrevHeme$htn_5_base[aric_baseline_full_noPrevHeme$followUp==1]))*100,1)

t.test(aric_baseline_full_noPrevHeme$htn_5_base[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$htn_5_base[aric_baseline_full_noPrevHeme$followUp==1])

formatC(t.test(aric_baseline_full_noPrevHeme$htn_5_base[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$htn_5_base[aric_baseline_full_noPrevHeme$followUp==1])$p.value, digit=1, format="E")


   0    1 
3774 2879 


   0    1 
56.7 43.3 


   0    1 
2985 1194 


   0    1 
71.4 28.6 


	Welch Two Sample t-test

data:  aric_baseline_full_noPrevHeme$htn_5_base[aric_baseline_full_noPrevHeme$followUp == 0] and aric_baseline_full_noPrevHeme$htn_5_base[aric_baseline_full_noPrevHeme$followUp == 1]
t = 15.877, df = 9477.8, p-value < 2.2e-16
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 0.1288711 0.1651746
sample estimates:
mean of x mean of y 
0.4327371 0.2857143 


In [12]:
# T2D
table(aric_baseline_full_noPrevHeme$dm_126_base[aric_baseline_full_noPrevHeme$followUp==0])
round(prop.table(table(aric_baseline_full_noPrevHeme$dm_126_base[aric_baseline_full_noPrevHeme$followUp==0]))*100,1)

table(aric_baseline_full_noPrevHeme$dm_126_base[aric_baseline_full_noPrevHeme$followUp==1])
round(prop.table(table(aric_baseline_full_noPrevHeme$dm_126_base[aric_baseline_full_noPrevHeme$followUp==1]))*100,1)

t.test(aric_baseline_full_noPrevHeme$dm_126_base[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$dm_126_base[aric_baseline_full_noPrevHeme$followUp==1])

formatC(t.test(aric_baseline_full_noPrevHeme$dm_126_base[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$dm_126_base[aric_baseline_full_noPrevHeme$followUp==1])$p.value, digit=1, format="E")


   0    1 
5341 1309 


   0    1 
80.3 19.7 


   0    1 
3823  349 


   0    1 
91.6  8.4 


	Welch Two Sample t-test

data:  aric_baseline_full_noPrevHeme$dm_126_base[aric_baseline_full_noPrevHeme$followUp == 0] and aric_baseline_full_noPrevHeme$dm_126_base[aric_baseline_full_noPrevHeme$followUp == 1]
t = 17.433, df = 10705, p-value < 2.2e-16
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 0.1004622 0.1259161
sample estimates:
 mean of x  mean of y 
0.19684211 0.08365292 


In [15]:
# CHD
table(aric_baseline_full_noPrevHeme$chd_base[aric_baseline_full_noPrevHeme$followUp==0])
round(prop.table(table(aric_baseline_full_noPrevHeme$chd_base[aric_baseline_full_noPrevHeme$followUp==0]))*100,1)

table(aric_baseline_full_noPrevHeme$chd_base[aric_baseline_full_noPrevHeme$followUp==1])
round(prop.table(table(aric_baseline_full_noPrevHeme$chd_base[aric_baseline_full_noPrevHeme$followUp==1]))*100,2)

t.test(aric_baseline_full_noPrevHeme$chd_base[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$chd_base[aric_baseline_full_noPrevHeme$followUp==1])

formatC(t.test(aric_baseline_full_noPrevHeme$chd_base[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$chd_base[aric_baseline_full_noPrevHeme$followUp==1])$p.value, digit=1, format="E")


   0    1 
6140  544 


   0    1 
91.9  8.1 


   0    1 
4060  127 


    0     1 
96.97  3.03 


	Welch Two Sample t-test

data:  aric_baseline_full_noPrevHeme$chd_base[aric_baseline_full_noPrevHeme$followUp == 0] and aric_baseline_full_noPrevHeme$chd_base[aric_baseline_full_noPrevHeme$followUp == 1]
t = 11.963, df = 10869, p-value < 2.2e-16
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 0.04269088 0.05942194
sample estimates:
 mean of x  mean of y 
0.08138839 0.03033198 


In [16]:
# Stroke
table(aric_baseline_full_noPrevHeme$is_base[aric_baseline_full_noPrevHeme$followUp==0])
round(prop.table(table(aric_baseline_full_noPrevHeme$is_base[aric_baseline_full_noPrevHeme$followUp==0]))*100,1)

table(aric_baseline_full_noPrevHeme$is_base[aric_baseline_full_noPrevHeme$followUp==1])
round(prop.table(table(aric_baseline_full_noPrevHeme$is_base[aric_baseline_full_noPrevHeme$followUp==1]))*100,2)

t.test(aric_baseline_full_noPrevHeme$is_base[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$is_base[aric_baseline_full_noPrevHeme$followUp==1])

formatC(t.test(aric_baseline_full_noPrevHeme$is_base[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$is_base[aric_baseline_full_noPrevHeme$followUp==1])$p.value, digit=1, format="E")


   0    1 
6306  215 


   0    1 
96.7  3.3 


   0    1 
4048   42 


    0     1 
98.97  1.03 


	Welch Two Sample t-test

data:  aric_baseline_full_noPrevHeme$is_base[aric_baseline_full_noPrevHeme$followUp == 0] and aric_baseline_full_noPrevHeme$is_base[aric_baseline_full_noPrevHeme$followUp == 1]
t = 8.359, df = 10505, p-value < 2.2e-16
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 0.01737794 0.02802497
sample estimates:
 mean of x  mean of y 
0.03297040 0.01026895 


In [17]:
# HF
table(aric_baseline_full_noPrevHeme$hf_base[aric_baseline_full_noPrevHeme$followUp==0])
round(prop.table(table(aric_baseline_full_noPrevHeme$hf_base[aric_baseline_full_noPrevHeme$followUp==0]))*100,1)

table(aric_baseline_full_noPrevHeme$hf_base[aric_baseline_full_noPrevHeme$followUp==1])
round(prop.table(table(aric_baseline_full_noPrevHeme$hf_base[aric_baseline_full_noPrevHeme$followUp==1]))*100,1)

t.test(aric_baseline_full_noPrevHeme$hf_base[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$hf_base[aric_baseline_full_noPrevHeme$followUp==1])

formatC(t.test(aric_baseline_full_noPrevHeme$hf_base[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$hf_base[aric_baseline_full_noPrevHeme$followUp==1])$p.value, digit=1, format="E")


   0    1 
6136  438 


   0    1 
93.3  6.7 


   0    1 
4011  113 


   0    1 
97.3  2.7 


	Welch Two Sample t-test

data:  aric_baseline_full_noPrevHeme$hf_base[aric_baseline_full_noPrevHeme$followUp == 0] and aric_baseline_full_noPrevHeme$hf_base[aric_baseline_full_noPrevHeme$followUp == 1]
t = 9.8295, df = 10677, p-value < 2.2e-16
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 0.03140325 0.04704779
sample estimates:
 mean of x  mean of y 
0.06662610 0.02740058 


In [18]:
## corrected lipid values
lipids_base <- fread("aric_baseline_vanilla_02082023.csv", header=T, sep="\t")
#str(lipids_base)
summary(lipids_base[,c(10,12,14,16:19)])
# zero value to "NA"
lipids_base$ldl_base[lipids_base$ldl_base==0] <- NA
summary(lipids_base[,c(10,12,14,16:19)])
table(lipids_base$aricid %in% aric_baseline_full$aricid)

aric_baseline_full_noPrevHeme <-  fread("aric_baseline_N10881.pheno_ch_status_bp_heme.noHemeCA.10May2023.csv", 
                                        header=T)

aric_baseline_full_noPrevHeme.v2 <- merge(aric_baseline_full_noPrevHeme, lipids_base, by="aricid")

str(aric_baseline_full_noPrevHeme.v2)

# fwrite(aric_baseline_full_noPrevHeme.v2, "aric_baseline_N10871.pheno_ch_status.noHemeCA.correct_lipids.31May2023.csv", 
  #   row.names = F, col.names = T, sep=",")



    age_base        bmi_base       gluc_base        chol_base  
 Min.   :44.00   Min.   :13.98   Min.   : 18.98   Min.   : 85  
 1st Qu.:52.00   1st Qu.:24.41   1st Qu.: 95.92   1st Qu.:183  
 Median :57.00   Median :27.36   Median :102.92   Median :207  
 Mean   :57.32   Mean   :28.22   Mean   :113.68   Mean   :210  
 3rd Qu.:62.00   3rd Qu.:31.01   3rd Qu.:112.66   3rd Qu.:232  
 Max.   :84.00   Max.   :67.26   Max.   :590.52   Max.   :558  
                 NA's   :20      NA's   :1685     NA's   :15   
    hdl_base         ldl_base        tg_base      
 Min.   :  5.00   Min.   :  0.0   Min.   :  11.0  
 1st Qu.: 38.72   1st Qu.:108.5   1st Qu.:  82.0  
 Median : 48.00   Median :130.4   Median : 113.0  
 Mean   : 50.62   Mean   :132.7   Mean   : 135.3  
 3rd Qu.: 60.00   3rd Qu.:154.4   3rd Qu.: 160.0  
 Max.   :202.00   Max.   :467.4   Max.   :2375.9  
 NA's   :43       NA's   :210     NA's   :14      

    age_base        bmi_base       gluc_base        chol_base  
 Min.   :44.00   Min.   :13.98   Min.   : 18.98   Min.   : 85  
 1st Qu.:52.00   1st Qu.:24.41   1st Qu.: 95.92   1st Qu.:183  
 Median :57.00   Median :27.36   Median :102.92   Median :207  
 Mean   :57.32   Mean   :28.22   Mean   :113.68   Mean   :210  
 3rd Qu.:62.00   3rd Qu.:31.01   3rd Qu.:112.66   3rd Qu.:232  
 Max.   :84.00   Max.   :67.26   Max.   :590.52   Max.   :558  
                 NA's   :20      NA's   :1685     NA's   :15   
    hdl_base         ldl_base        tg_base      
 Min.   :  5.00   Min.   :  9.8   Min.   :  11.0  
 1st Qu.: 38.72   1st Qu.:108.6   1st Qu.:  82.0  
 Median : 48.00   Median :130.4   Median : 113.0  
 Mean   : 50.62   Mean   :132.7   Mean   : 135.3  
 3rd Qu.: 60.00   3rd Qu.:154.4   3rd Qu.: 160.0  
 Max.   :202.00   Max.   :467.4   Max.   :2375.9  
 NA's   :43       NA's   :211     NA's   :14      


 TRUE 
10881 

Classes 'data.table' and 'data.frame':	10871 obs. of  95 variables:
 $ aricid              : chr  "F100146" "F100152" "F100358" "F100361" ...
 $ gwasid.x            : chr  "A11401" "A10391" "A07753" "A12357" ...
 $ hg38_CRAM_ID.x      : chr  "A11401" "A10391" "A07753" "A12357" ...
 $ Visit.x             : chr  "V03" "V02" "V02" "V02" ...
 $ sex                 : chr  "M" "F" "M" "F" ...
 $ race                : chr  "W" "B" "W" "W" ...
 $ center              : chr  "F" "F" "F" "F" ...
 $ dob                 : IDate, format: "1923-11-30" "1939-04-18" ...
 $ date_base.x         : IDate, format: "1993-04-02" "1990-02-15" ...
 $ age_base.x          : int  69 50 58 58 65 56 64 61 62 60 ...
 $ fast_8_base.x       : int  1 1 1 1 1 1 1 1 1 1 ...
 $ bmi_base.x          : num  26.7 25.8 26.3 27.1 29.1 ...
 $ dm_126_base.x       : int  0 0 0 0 0 0 0 0 1 0 ...
 $ gluc_base.x         : num  NA 4.77 6.38 4.88 6.83 ...
 $ htn_5_base.x        : int  0 0 0 1 1 0 0 0 0 0 ...
 $ chol_base.x         : num

In [19]:
# updated: Total Chol. 
round(summary(aric_baseline_full_noPrevHeme.v2$chol_base.y[aric_baseline_full_noPrevHeme.v2$followUp==0]),1)
round(sd(aric_baseline_full_noPrevHeme.v2$chol_base.y[aric_baseline_full_noPrevHeme.v2$followUp==0], na.rm = T),1)

round(summary(aric_baseline_full_noPrevHeme.v2$chol_base.y[aric_baseline_full_noPrevHeme.v2$followUp==1]),1)
round(sd(aric_baseline_full_noPrevHeme.v2$chol_base.y[aric_baseline_full_noPrevHeme.v2$followUp==1], na.rm = T),1)

t.test(aric_baseline_full_noPrevHeme.v2$chol_base.y[aric_baseline_full_noPrevHeme.v2$followUp==0],
      aric_baseline_full_noPrevHeme.v2$chol_base.y[aric_baseline_full_noPrevHeme.v2$followUp==1])

formatC(t.test(aric_baseline_full_noPrevHeme.v2$chol_base.y[aric_baseline_full_noPrevHeme.v2$followUp==0],
      aric_baseline_full_noPrevHeme.v2$chol_base.y[aric_baseline_full_noPrevHeme.v2$followUp==1])$p.value, digit=1, format="E")



   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
   85.0   183.0   208.0   211.1   234.0   558.0      10 

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
  101.0   183.0   205.0   208.1   230.0   461.0       5 


	Welch Two Sample t-test

data:  aric_baseline_full_noPrevHeme.v2$chol_base.y[aric_baseline_full_noPrevHeme.v2$followUp == 0] and aric_baseline_full_noPrevHeme.v2$chol_base.y[aric_baseline_full_noPrevHeme.v2$followUp == 1]
t = 4.0695, df = 9537, p-value = 4.749e-05
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 1.582590 4.524034
sample estimates:
mean of x mean of y 
 211.1412  208.0879 


In [20]:
## LDL
#
round(summary(aric_baseline_full_noPrevHeme.v2$ldl_base.y[aric_baseline_full_noPrevHeme.v2$followUp==0]),1)
round(sd(aric_baseline_full_noPrevHeme.v2$ldl_base.y[aric_baseline_full_noPrevHeme.v2$followUp==0], na.rm = T),1)

round(summary(aric_baseline_full_noPrevHeme.v2$ldl_base.y[aric_baseline_full_noPrevHeme.v2$followUp==1]),1)
round(sd(aric_baseline_full_noPrevHeme.v2$ldl_base.y[aric_baseline_full_noPrevHeme.v2$followUp==1], na.rm = T),1)

t.test(aric_baseline_full_noPrevHeme.v2$ldl_base.y[aric_baseline_full_noPrevHeme.v2$followUp==0],
      aric_baseline_full_noPrevHeme.v2$ldl_base.y[aric_baseline_full_noPrevHeme.v2$followUp==1])

formatC(t.test(aric_baseline_full_noPrevHeme.v2$ldl_base.y[aric_baseline_full_noPrevHeme.v2$followUp==0],
      aric_baseline_full_noPrevHeme.v2$ldl_base.y[aric_baseline_full_noPrevHeme.v2$followUp==1])$p.value, digit=1, format="E")



   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
   21.4   108.9   131.6   134.0   156.8   467.4     137 

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
    9.8   107.8   128.4   130.6   151.0   396.8      74 


	Welch Two Sample t-test

data:  aric_baseline_full_noPrevHeme.v2$ldl_base.y[aric_baseline_full_noPrevHeme.v2$followUp == 0] and aric_baseline_full_noPrevHeme.v2$ldl_base.y[aric_baseline_full_noPrevHeme.v2$followUp == 1]
t = 4.8326, df = 9165.1, p-value = 1.369e-06
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 2.021242 4.779957
sample estimates:
mean of x mean of y 
 134.0339  130.6333 


In [22]:
## HDL
round(summary(aric_baseline_full_noPrevHeme.v2$hdl_base.y[aric_baseline_full_noPrevHeme.v2$followUp==0]),1)
round(sd(aric_baseline_full_noPrevHeme.v2$hdl_base.y[aric_baseline_full_noPrevHeme.v2$followUp==0], na.rm = T),2)

round(summary(aric_baseline_full_noPrevHeme.v2$hdl_base.y[aric_baseline_full_noPrevHeme.v2$followUp==1]),1)
round(sd(aric_baseline_full_noPrevHeme.v2$hdl_base.y[aric_baseline_full_noPrevHeme.v2$followUp==1], na.rm = T),2)

t.test(aric_baseline_full_noPrevHeme.v2$hdl_base.y[aric_baseline_full_noPrevHeme.v2$followUp==0],
      aric_baseline_full_noPrevHeme.v2$hdl_base.y[aric_baseline_full_noPrevHeme.v2$followUp==1])

formatC(t.test(aric_baseline_full_noPrevHeme.v2$hdl_base.y[aric_baseline_full_noPrevHeme.v2$followUp==0],
      aric_baseline_full_noPrevHeme.v2$hdl_base.y[aric_baseline_full_noPrevHeme.v2$followUp==1])$p.value, digit=1, format="E")



   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
   11.0    37.0    47.0    49.8    59.0   202.0      28 

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
      5      40      50      52      62     141      15 


	Welch Two Sample t-test

data:  aric_baseline_full_noPrevHeme.v2$hdl_base.y[aric_baseline_full_noPrevHeme.v2$followUp == 0] and aric_baseline_full_noPrevHeme.v2$hdl_base.y[aric_baseline_full_noPrevHeme.v2$followUp == 1]
t = -6.6647, df = 8871.8, p-value = 2.81e-11
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 -2.892585 -1.577761
sample estimates:
mean of x mean of y 
 49.75919  51.99437 


In [23]:
## TG

round(summary(aric_baseline_full_noPrevHeme.v2$tg_base.y[aric_baseline_full_noPrevHeme.v2$followUp==0]),1)
round(sd(aric_baseline_full_noPrevHeme.v2$tg_base.y[aric_baseline_full_noPrevHeme.v2$followUp==0], na.rm = T),1)

round(summary(aric_baseline_full_noPrevHeme.v2$tg_base.y[aric_baseline_full_noPrevHeme.v2$followUp==1]),1)
round(sd(aric_baseline_full_noPrevHeme.v2$tg_base.y[aric_baseline_full_noPrevHeme.v2$followUp==1], na.rm = T),1)

t.test(aric_baseline_full_noPrevHeme.v2$tg_base.y[aric_baseline_full_noPrevHeme.v2$followUp==0],
      aric_baseline_full_noPrevHeme.v2$tg_base.y[aric_baseline_full_noPrevHeme.v2$followUp==1])

formatC(t.test(aric_baseline_full_noPrevHeme.v2$tg_base.y[aric_baseline_full_noPrevHeme.v2$followUp==0],
      aric_baseline_full_noPrevHeme.v2$tg_base.y[aric_baseline_full_noPrevHeme.v2$followUp==1])$p.value, digit=1, format="E")




   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
   11.0    83.0   116.0   138.9   167.0  2375.9       9 

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
   29.0    80.0   110.0   129.4   154.0  1634.9       5 


	Welch Two Sample t-test

data:  aric_baseline_full_noPrevHeme.v2$tg_base.y[aric_baseline_full_noPrevHeme.v2$followUp == 0] and aric_baseline_full_noPrevHeme.v2$tg_base.y[aric_baseline_full_noPrevHeme.v2$followUp == 1]
t = 5.3385, df = 9943, p-value = 9.579e-08
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
  6.013384 12.991741
sample estimates:
mean of x mean of y 
 138.8947  129.3922 


In [18]:
# Total Chol. 
round(summary(aric_baseline_full_noPrevHeme$chol_base[aric_baseline_full_noPrevHeme$followUp==0]),1)
round(sd(aric_baseline_full_noPrevHeme$chol_base[aric_baseline_full_noPrevHeme$followUp==0], na.rm = T),1)

round(summary(aric_baseline_full_noPrevHeme$chol_base[aric_baseline_full_noPrevHeme$followUp==1]),1)
round(sd(aric_baseline_full_noPrevHeme$chol_base[aric_baseline_full_noPrevHeme$followUp==1], na.rm = T),1)

t.test(aric_baseline_full_noPrevHeme$chol_base[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$chol_base[aric_baseline_full_noPrevHeme$followUp==1])

formatC(t.test(aric_baseline_full_noPrevHeme$chol_base[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$chol_base[aric_baseline_full_noPrevHeme$followUp==1])$p.value, digit=1, format="E")

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
    2.2     4.8     5.4     8.9     6.1   337.0      10 

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
    2.6     4.7     5.3     8.1     6.0   255.3       5 


	Welch Two Sample t-test

data:  aric_baseline_full_noPrevHeme$chol_base[aric_baseline_full_noPrevHeme$followUp == 0] and aric_baseline_full_noPrevHeme$chol_base[aric_baseline_full_noPrevHeme$followUp == 1]
t = 1.586, df = 9541.3, p-value = 0.1128
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 -0.1788008  1.6943685
sample estimates:
mean of x mean of y 
 8.860470  8.102686 


In [19]:
# LDL 
round(summary(aric_baseline_full_noPrevHeme$ldl_base[aric_baseline_full_noPrevHeme$followUp==0]),1)
round(sd(aric_baseline_full_noPrevHeme$ldl_base[aric_baseline_full_noPrevHeme$followUp==0], na.rm = T),1)

round(summary(aric_baseline_full_noPrevHeme$ldl_base[aric_baseline_full_noPrevHeme$followUp==1]),1)
round(sd(aric_baseline_full_noPrevHeme$ldl_base[aric_baseline_full_noPrevHeme$followUp==1], na.rm = T),1)

t.test(aric_baseline_full_noPrevHeme$ldl_base[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$ldl_base[aric_baseline_full_noPrevHeme$followUp==1])

formatC(t.test(aric_baseline_full_noPrevHeme$ldl_base[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$ldl_base[aric_baseline_full_noPrevHeme$followUp==1])$p.value, digit=1, format="E")

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
    0.0     2.8     3.4     5.6     4.1   238.6     136 

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
    0.3     2.8     3.3     5.1     3.9   180.0      74 


	Welch Two Sample t-test

data:  aric_baseline_full_noPrevHeme$ldl_base[aric_baseline_full_noPrevHeme$followUp == 0] and aric_baseline_full_noPrevHeme$ldl_base[aric_baseline_full_noPrevHeme$followUp == 1]
t = 1.3408, df = 9137.4, p-value = 0.18
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 -0.1903355  1.0143510
sample estimates:
mean of x mean of y 
 5.553565  5.141557 


In [20]:
# HDL 
round(summary(aric_baseline_full_noPrevHeme$hdl_base[aric_baseline_full_noPrevHeme$followUp==0]),1)
round(sd(aric_baseline_full_noPrevHeme$hdl_base[aric_baseline_full_noPrevHeme$followUp==0], na.rm = T),1)

round(summary(aric_baseline_full_noPrevHeme$hdl_base[aric_baseline_full_noPrevHeme$followUp==1]),1)
round(sd(aric_baseline_full_noPrevHeme$hdl_base[aric_baseline_full_noPrevHeme$followUp==1], na.rm = T),1)

t.test(aric_baseline_full_noPrevHeme$hdl_base[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$hdl_base[aric_baseline_full_noPrevHeme$followUp==1])

formatC(t.test(aric_baseline_full_noPrevHeme$hdl_base[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$hdl_base[aric_baseline_full_noPrevHeme$followUp==1])$p.value, 
        digit=1, format="E")

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
    0.3     1.0     1.2     2.2     1.5    94.0      28 

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
    0.1     1.0     1.3     2.0     1.6   102.0      15 


	Welch Two Sample t-test

data:  aric_baseline_full_noPrevHeme$hdl_base[aric_baseline_full_noPrevHeme$followUp == 0] and aric_baseline_full_noPrevHeme$hdl_base[aric_baseline_full_noPrevHeme$followUp == 1]
t = 1.5479, df = 10074, p-value = 0.1217
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 -0.04967175  0.42260724
sample estimates:
mean of x mean of y 
 2.164578  1.978110 


In [21]:
# TG 
round(summary(aric_baseline_full_noPrevHeme$tg_base[aric_baseline_full_noPrevHeme$followUp==0]),1)
round(sd(aric_baseline_full_noPrevHeme$tg_base[aric_baseline_full_noPrevHeme$followUp==0], na.rm = T),1)

round(summary(aric_baseline_full_noPrevHeme$tg_base[aric_baseline_full_noPrevHeme$followUp==1]),1)
round(sd(aric_baseline_full_noPrevHeme$tg_base[aric_baseline_full_noPrevHeme$followUp==1], na.rm = T),1)

t.test(aric_baseline_full_noPrevHeme$tg_base[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$tg_base[aric_baseline_full_noPrevHeme$followUp==1])

formatC(t.test(aric_baseline_full_noPrevHeme$tg_base[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$tg_base[aric_baseline_full_noPrevHeme$followUp==1])$p.value, digit=1, format="E")

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
    0.1     0.9     1.3     3.9     1.9   542.0       9 

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
    0.3     0.9     1.3     3.3     1.8   352.5       5 


	Welch Two Sample t-test

data:  aric_baseline_full_noPrevHeme$tg_base[aric_baseline_full_noPrevHeme$followUp == 0] and aric_baseline_full_noPrevHeme$tg_base[aric_baseline_full_noPrevHeme$followUp == 1]
t = 1.5824, df = 9811.4, p-value = 0.1136
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 -0.1389726  1.3029578
sample estimates:
mean of x mean of y 
 3.897101  3.315108 


In [22]:
## CHIP >=2%
(table(aric_baseline_full_noPrevHeme$CH_baseline[aric_baseline_full_noPrevHeme$followUp==0]))
round(prop.table(table(aric_baseline_full_noPrevHeme$CH_baseline[aric_baseline_full_noPrevHeme$followUp==0]))*100,1)

(table(aric_baseline_full_noPrevHeme$CH_baseline[aric_baseline_full_noPrevHeme$followUp==1]))
round(prop.table(table(aric_baseline_full_noPrevHeme$CH_baseline[aric_baseline_full_noPrevHeme$followUp==1]))*100,1)

t.test(aric_baseline_full_noPrevHeme$CH_baseline[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$CH_baseline[aric_baseline_full_noPrevHeme$followUp==1])

formatC(t.test(aric_baseline_full_noPrevHeme$CH_baseline[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$CH_baseline[aric_baseline_full_noPrevHeme$followUp==1])$p.value, digit=1, format="E")


   0    1 
6049  635 


   0    1 
90.5  9.5 


   0    1 
3730  457 


   0    1 
89.1 10.9 


	Welch Two Sample t-test

data:  aric_baseline_full_noPrevHeme$CH_baseline[aric_baseline_full_noPrevHeme$followUp == 0] and aric_baseline_full_noPrevHeme$CH_baseline[aric_baseline_full_noPrevHeme$followUp == 1]
t = -2.3543, df = 8478, p-value = 0.01858
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 -0.025921100 -0.002367638
sample estimates:
 mean of x  mean of y 
0.09500299 0.10914736 


In [24]:
## CHIP >=10%
(table(aric_baseline_full_noPrevHeme$CHvaf10_baseline[aric_baseline_full_noPrevHeme$followUp==0]))
round(prop.table(table(aric_baseline_full_noPrevHeme$CHvaf10_baseline[aric_baseline_full_noPrevHeme$followUp==0]))*100,1)

(table(aric_baseline_full_noPrevHeme$CHvaf10_baseline[aric_baseline_full_noPrevHeme$followUp==1]))
round(prop.table(table(aric_baseline_full_noPrevHeme$CHvaf10_baseline[aric_baseline_full_noPrevHeme$followUp==1]))*100,1)

t.test(aric_baseline_full_noPrevHeme$CHvaf10_baseline[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$CHvaf10_baseline[aric_baseline_full_noPrevHeme$followUp==1])

formatC(t.test(aric_baseline_full_noPrevHeme$CHvaf10_baseline[aric_baseline_full_noPrevHeme$followUp==0],
      aric_baseline_full_noPrevHeme$CHvaf10_baseline[aric_baseline_full_noPrevHeme$followUp==1])$p.value, digit=1, format="E")


   0    1 
6397  287 


   0    1 
95.7  4.3 


   0    1 
4026  161 


   0    1 
96.2  3.8 


	Welch Two Sample t-test

data:  aric_baseline_full_noPrevHeme$CHvaf10_baseline[aric_baseline_full_noPrevHeme$followUp == 0] and aric_baseline_full_noPrevHeme$CHvaf10_baseline[aric_baseline_full_noPrevHeme$followUp == 1]
t = 1.159, df = 9238.6, p-value = 0.2465
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 -0.003101301  0.012073317
sample estimates:
 mean of x  mean of y 
0.04293836 0.03845235 


##### END ###


In [14]:
## CH status
cat("CHvaf02_baseline: M")
table(aric_baseline_full$CH_baseline[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"])

round(prop.table(table(aric_baseline_full$CH_baseline[aric_baseline_full$race=="B" & 
                                                aric_baseline_full$Sex=="M"]))*100,1)

table(aric_baseline_full$CH_baseline[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])
round(prop.table(table(aric_baseline_full$CH_baseline[aric_baseline_full$race=="W" & 
                                                      aric_baseline_full$Sex=="M"]))*100,1)

formatC(t.test(aric_baseline_full$CH_baseline[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"], 
       aric_baseline_full$CH_baseline[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])$p.value,
        digits = 1,format = "E")

cat("CHvaf02_baseline: F")
table(aric_baseline_full$CH_baseline[aric_baseline_full$race=="B" & 
                                       aric_baseline_full$Sex=="F"])
round(prop.table(table(aric_baseline_full$CH_baseline[aric_baseline_full$race=="B" & 
                                       aric_baseline_full$Sex=="F"]))*100,1)

table(aric_baseline_full$CH_baseline[aric_baseline_full$race=="W" & 
                                       aric_baseline_full$Sex=="F"])
round(prop.table(table(aric_baseline_full$CH_baseline[aric_baseline_full$race=="W" & 
                                       aric_baseline_full$Sex=="F"]))*100,1)


formatC(x =t.test(aric_baseline_full$CH_baseline[aric_baseline_full$race=="B" & 
                                             aric_baseline_full$Sex=="F"], 
            aric_baseline_full$CH_baseline[aric_baseline_full$race=="W" & 
                                             aric_baseline_full$Sex=="F"])$p.value, 
        digits = 1,format = "E")


CHvaf02_baseline: M


   0    1 
1052  102 


   0    1 
91.2  8.8 


   0    1 
3182  396 


   0    1 
88.9 11.1 

CHvaf02_baseline: F


   0    1 
1799  172 


   0    1 
91.3  8.7 


   0    1 
3754  424 


   0    1 
89.9 10.1 

In [15]:
## CH status
cat("CHvaf10_baseline: M")
table(aric_baseline_full$CHvaf10_baseline[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"])

round(prop.table(table(aric_baseline_full$CHvaf10_baseline[aric_baseline_full$race=="B" & 
                                                aric_baseline_full$Sex=="M"]))*100,1)

table(aric_baseline_full$CHvaf10_baseline[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])
round(prop.table(table(aric_baseline_full$CHvaf10_baseline[aric_baseline_full$race=="W" & 
                                                      aric_baseline_full$Sex=="M"]))*100,1)

formatC(t.test(aric_baseline_full$CHvaf10_baseline[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"], 
       aric_baseline_full$CHvaf10_baseline[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])$p.value,
        digits = 1,format = "E")

cat("CHvaf10_baseline: F")
table(aric_baseline_full$CHvaf10_baseline[aric_baseline_full$race=="B" & 
                                       aric_baseline_full$Sex=="F"])
round(prop.table(table(aric_baseline_full$CHvaf10_baseline[aric_baseline_full$race=="B" & 
                                       aric_baseline_full$Sex=="F"]))*100,1)

table(aric_baseline_full$CHvaf10_baseline[aric_baseline_full$race=="W" & 
                                       aric_baseline_full$Sex=="F"])
round(prop.table(table(aric_baseline_full$CHvaf10_baseline[aric_baseline_full$race=="W" & 
                                       aric_baseline_full$Sex=="F"]))*100,1)


formatC(x =t.test(aric_baseline_full$CHvaf10_baseline[aric_baseline_full$race=="B" & 
                                             aric_baseline_full$Sex=="F"], 
            aric_baseline_full$CHvaf10_baseline[aric_baseline_full$race=="W" & 
                                             aric_baseline_full$Sex=="F"])$p.value, 
        digits = 1,format = "E")


CHvaf10_baseline: M


   0    1 
1102   52 


   0    1 
95.5  4.5 


   0    1 
3410  168 


   0    1 
95.3  4.7 

CHvaf10_baseline: F


   0    1 
1905   66 


   0    1 
96.7  3.3 


   0    1 
4016  162 


   0    1 
96.1  3.9 

In [8]:
names(aric_baseline_full)

In [7]:
# Age
summary(aric_baseline_full$age_base)

table(aric_baseline_full$race, aric_baseline_full$Sex)

table(aric_baseline_full$Sex)
round(prop.table(table( aric_baseline_full$Sex))*100,1)

table(aric_baseline_full$race)
round(prop.table(table( aric_baseline_full$race))*100,1)

table(aric_baseline_full$ever_smoke)
round(prop.table(table( aric_baseline_full$ever_smoke))*100,1)

## 
cat("age_base: M")
round(summary(aric_baseline_full$age_base[aric_baseline_full$race=="B" & 
                                             aric_baseline_full$Sex=="M"]),1)

round(summary(aric_baseline_full$age_base[aric_baseline_full$race=="W" & 
                                             aric_baseline_full$Sex=="M"]),1)

wilcox.test(aric_baseline_full$age_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"],
            aric_baseline_full$age_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])
t.test(aric_baseline_full$age_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"],
       aric_baseline_full$age_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])

cat("age_base: F")
round(summary(aric_baseline_full$age_base[aric_baseline_full$race=="B" & 
                                             aric_baseline_full$Sex=="F"]),1)

round(summary(aric_baseline_full$age_base[aric_baseline_full$race=="W" & 
                                             aric_baseline_full$Sex=="F"]),1)

wilcox.test(aric_baseline_full$age_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="F"],
            aric_baseline_full$age_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="F"])

t.test(aric_baseline_full$age_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="F"],
       aric_baseline_full$age_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="F"])

## 


   Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
  44.00   52.00   57.00   57.32   62.00   84.00 

   
       F    M
  B 1971 1154
  W 4178 3578


   F    M 
6149 4732 


   F    M 
56.5 43.5 


   B    W 
3125 7756 


   B    W 
28.7 71.3 


   0    1 
4358 6488 


   0    1 
40.2 59.8 

age_base: M

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
   44.0    51.0    56.0    56.7    61.0    83.0 

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
   45.0    53.0    58.0    58.3    63.0    84.0 


	Wilcoxon rank sum test with continuity correction

data:  aric_baseline_full$age_base[aric_baseline_full$race == "B" & aric_baseline_full$Sex == "M"] and aric_baseline_full$age_base[aric_baseline_full$race == "W" & aric_baseline_full$Sex == "M"]
W = 1744401, p-value = 2.011e-15
alternative hypothesis: true location shift is not equal to 0



	Welch Two Sample t-test

data:  aric_baseline_full$age_base[aric_baseline_full$race == "B" & aric_baseline_full$Sex == "M"] and aric_baseline_full$age_base[aric_baseline_full$race == "W" & aric_baseline_full$Sex == "M"]
t = -7.4715, df = 1861.2, p-value = 1.213e-13
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 -2.015475 -1.177365
sample estimates:
mean of x mean of y 
 56.68111  58.27753 


age_base: F

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
   44.0    51.0    55.0    56.1    61.0    78.0 

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
   44.0    52.0    57.0    57.2    62.0    79.0 


	Wilcoxon rank sum test with continuity correction

data:  aric_baseline_full$age_base[aric_baseline_full$race == "B" & aric_baseline_full$Sex == "F"] and aric_baseline_full$age_base[aric_baseline_full$race == "W" & aric_baseline_full$Sex == "F"]
W = 3674936, p-value = 9.157e-12
alternative hypothesis: true location shift is not equal to 0



	Welch Two Sample t-test

data:  aric_baseline_full$age_base[aric_baseline_full$race == "B" & aric_baseline_full$Sex == "F"] and aric_baseline_full$age_base[aric_baseline_full$race == "W" & aric_baseline_full$Sex == "F"]
t = -6.6894, df = 3769.4, p-value = 2.572e-11
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 -1.4125556 -0.7722194
sample estimates:
mean of x mean of y 
 56.14409  57.23648 


In [9]:
cat("smoked: M")
table(aric_baseline_full$ever_smoke[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"])
round(prop.table(table(aric_baseline_full$ever_smoke[aric_baseline_full$race=="B" & 
                                                        aric_baseline_full$Sex=="M"]))*100,1)

table(aric_baseline_full$ever_smoke[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])
round(prop.table(table(aric_baseline_full$ever_smoke[aric_baseline_full$race=="W" & 
                                                        aric_baseline_full$Sex=="M"]))*100,1)

# wilcox.test(aric_baseline_full$ever_smoke[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"], aric_baseline_full$ever_smoke[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])
t.test(aric_baseline_full$ever_smoke[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"], aric_baseline_full$ever_smoke[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])

cat("smoked: F")
table(aric_baseline_full$ever_smoke[aric_baseline_full$race=="B" & 
                                       aric_baseline_full$Sex=="F"])
round(prop.table(table(aric_baseline_full$ever_smoke[aric_baseline_full$race=="B" & 
                                                        aric_baseline_full$Sex=="F"]))*100,1)

table(aric_baseline_full$ever_smoke[aric_baseline_full$race=="W" & 
                                       aric_baseline_full$Sex=="F"])
round(prop.table(table(aric_baseline_full$ever_smoke[aric_baseline_full$race=="W" & 
                                                        aric_baseline_full$Sex=="F"]))*100,1)

# wilcox.test(aric_baseline_full$ever_smoke[aric_baseline_full$race=="B" & 
#                                              aric_baseline_full$Sex=="F"], 
#             aric_baseline_full$ever_smoke[aric_baseline_full$race=="W" & 
#                                              aric_baseline_full$Sex=="F"])

t.test(aric_baseline_full$ever_smoke[aric_baseline_full$race=="B" & 
                                        aric_baseline_full$Sex=="F"], 
       aric_baseline_full$ever_smoke[aric_baseline_full$race=="W" & 
                                        aric_baseline_full$Sex=="F"])

## 
# BMI
cat("bmi")
round(summary(aric_baseline_full$bmi_base[aric_baseline_full$race=="B" & 
                                             aric_baseline_full$Sex=="M"]),1)
cat("bmi AA M sd=",round(sd(aric_baseline_full$bmi_base[aric_baseline_full$race=="B" & 
                                                       aric_baseline_full$Sex=="M"], na.rm = T),1))

round(summary(aric_baseline_full$bmi_base[aric_baseline_full$race=="W" & 
                                             aric_baseline_full$Sex=="M"]),1)
cat("bmi EA M sd=",round(sd(aric_baseline_full$bmi_base[aric_baseline_full$race=="W" & 
                                                       aric_baseline_full$Sex=="M"], na.rm = T),1) )

t.test(aric_baseline_full$bmi_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"],
       aric_baseline_full$bmi_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])

# Female
round(summary(aric_baseline_full$bmi_base[aric_baseline_full$race=="B" & 
                                             aric_baseline_full$Sex=="F"]),1)
cat("bmi AA F sd=",round(sd(aric_baseline_full$bmi_base[aric_baseline_full$race=="B" & 
                                                       aric_baseline_full$Sex=="F"], na.rm = T),1) )

round(summary(aric_baseline_full$bmi_base[aric_baseline_full$race=="W" & 
                                             aric_baseline_full$Sex=="F"]),1)

cat("bmi EA F sd=",round(sd(aric_baseline_full$bmi_base[aric_baseline_full$race=="W" & 
                                                       aric_baseline_full$Sex=="F"], na.rm = T),1) )

# wilcox.test(aric_baseline_full$bmi_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="F"],
#             aric_baseline_full$bmi_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="F"])

t.test(aric_baseline_full$bmi_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="F"],
       aric_baseline_full$bmi_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="F"])

formatC(x=t.test(aric_baseline_full$bmi_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="F"],
                 aric_baseline_full$bmi_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="F"])$p.value, 
        digit=1, format="E")



smoked: M


  0   1 
303 836 


   0    1 
26.6 73.4 


   0    1 
 941 2635 


   0    1 
26.3 73.7 


	Welch Two Sample t-test

data:  aric_baseline_full$ever_smoke[aric_baseline_full$race == "B" & aric_baseline_full$Sex == "M"] and aric_baseline_full$ever_smoke[aric_baseline_full$race == "W" & aric_baseline_full$Sex == "M"]
t = -0.19163, df = 1910.4, p-value = 0.8481
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 -0.03235095  0.02659165
sample estimates:
mean of x mean of y 
0.7339772 0.7368568 


smoked: F


   0    1 
1106  848 


   0    1 
56.6 43.4 


   0    1 
2008 2169 


   0    1 
48.1 51.9 


	Welch Two Sample t-test

data:  aric_baseline_full$ever_smoke[aric_baseline_full$race == "B" & aric_baseline_full$Sex == "F"] and aric_baseline_full$ever_smoke[aric_baseline_full$race == "W" & aric_baseline_full$Sex == "F"]
t = -6.2613, df = 3844.4, p-value = 4.237e-10
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 -0.11199728 -0.05858398
sample estimates:
mean of x mean of y 
0.4339816 0.5192722 


bmi

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
   14.0    24.6    27.5    28.0    30.8    57.9       7 

bmi AA M sd= 5.1

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
   14.5    25.0    27.3    27.8    30.1    59.1       4 

bmi EA M sd= 4.2


	Welch Two Sample t-test

data:  aric_baseline_full$bmi_base[aric_baseline_full$race == "B" & aric_baseline_full$Sex == "M"] and aric_baseline_full$bmi_base[aric_baseline_full$race == "W" & aric_baseline_full$Sex == "M"]
t = 0.99062, df = 1675.7, p-value = 0.322
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 -0.1625655  0.4943444
sample estimates:
mean of x mean of y 
 27.99844  27.83255 


   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
   14.2    26.7    30.5    31.4    34.7    67.3       6 

bmi AA F sd= 6.7

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
   14.4    23.1    26.1    27.1    30.0    53.0       3 

bmi EA F sd= 5.6


	Welch Two Sample t-test

data:  aric_baseline_full$bmi_base[aric_baseline_full$race == "B" & aric_baseline_full$Sex == "F"] and aric_baseline_full$bmi_base[aric_baseline_full$race == "W" & aric_baseline_full$Sex == "F"]
t = 24.39, df = 3295.6, p-value < 2.2e-16
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 3.907118 4.590210
sample estimates:
mean of x mean of y 
 31.37550  27.12684 


In [11]:
##
cat("chol_med_base: M")
table(aric_baseline_full$chol_med_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"])
round(prop.table(table(aric_baseline_full$chol_med_base[aric_baseline_full$race=="B" & 
                                                           aric_baseline_full$Sex=="M"]))*100,1)

table(aric_baseline_full$chol_med_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])
round(prop.table(table(aric_baseline_full$chol_med_base[aric_baseline_full$race=="W" & 
                                                           aric_baseline_full$Sex=="M"]))*100,1)

# wilcox.test(aric_baseline_full$chol_med_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"], aric_baseline_full$ever_smoke[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])

formatC(t.test(aric_baseline_full$chol_med_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"], 
               aric_baseline_full$chol_med_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])$p.value,
        digits = 1,format = "E")

cat("chol_med_base: F")
table(aric_baseline_full$chol_med_base[aric_baseline_full$race=="B" & 
                                          aric_baseline_full$Sex=="F"])
round(prop.table(table(aric_baseline_full$chol_med_base[aric_baseline_full$race=="B" & 
                                                           aric_baseline_full$Sex=="F"]))*100,1)

table(aric_baseline_full$chol_med_base[aric_baseline_full$race=="W" & 
                                          aric_baseline_full$Sex=="F"])
round(prop.table(table(aric_baseline_full$chol_med_base[aric_baseline_full$race=="W" & 
                                                           aric_baseline_full$Sex=="F"]))*100,1)

# wilcox.test(aric_baseline_full$chol_med_base[aric_baseline_full$race=="B" & 
#                                                 aric_baseline_full$Sex=="F"], 
#             aric_baseline_full$chol_med_base[aric_baseline_full$race=="W" & 
#                                                 aric_baseline_full$Sex=="F"])

formatC(x =t.test(aric_baseline_full$chol_med_base[aric_baseline_full$race=="B" & 
                                                      aric_baseline_full$Sex=="F"], 
                  aric_baseline_full$chol_med_base[aric_baseline_full$race=="W" & 
                                                      aric_baseline_full$Sex=="F"])$p.value, 
        digits = 1,format = "E")


##
# Clinical traits
# htn_5_base,  hf_base, is_base, hs_base, 
cat("htn_5_base: M")
table(aric_baseline_full$htn_5_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"])
round(prop.table(table(aric_baseline_full$htn_5_base[aric_baseline_full$race=="B" & 
                                                        aric_baseline_full$Sex=="M"]))*100,1)

table(aric_baseline_full$htn_5_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])
round(prop.table(table(aric_baseline_full$htn_5_base[aric_baseline_full$race=="W" & 
                                                        aric_baseline_full$Sex=="M"]))*100,1)

formatC(t.test(aric_baseline_full$htn_5_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"], 
               aric_baseline_full$htn_5_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])$p.value,
        digits = 1,format = "E")

cat("htn_5_base: F")
table(aric_baseline_full$htn_5_base[aric_baseline_full$race=="B" & 
                                       aric_baseline_full$Sex=="F"])
round(prop.table(table(aric_baseline_full$htn_5_base[aric_baseline_full$race=="B" & 
                                                        aric_baseline_full$Sex=="F"]))*100,1)

table(aric_baseline_full$htn_5_base[aric_baseline_full$race=="W" & 
                                       aric_baseline_full$Sex=="F"])
round(prop.table(table(aric_baseline_full$htn_5_base[aric_baseline_full$race=="W" & 
                                                        aric_baseline_full$Sex=="F"]))*100,1)


formatC(x =t.test(aric_baseline_full$htn_5_base[aric_baseline_full$race=="B" & 
                                                   aric_baseline_full$Sex=="F"], 
                  aric_baseline_full$htn_5_base[aric_baseline_full$race=="W" & 
                                                   aric_baseline_full$Sex=="F"])$p.value, 
        digits = 1,format = "E")


##
cat("dm_126_base: M")
table(aric_baseline_full$dm_126_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"])
round(prop.table(table(aric_baseline_full$dm_126_base[aric_baseline_full$race=="B" & 
                                                         aric_baseline_full$Sex=="M"]))*100,1)

table(aric_baseline_full$dm_126_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])
round(prop.table(table(aric_baseline_full$dm_126_base[aric_baseline_full$race=="W" & 
                                                         aric_baseline_full$Sex=="M"]))*100,1)

formatC(t.test(aric_baseline_full$dm_126_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"], 
               aric_baseline_full$dm_126_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])$p.value,
        digits = 1,format = "E")

cat("dm_126_base: F")
table(aric_baseline_full$dm_126_base[aric_baseline_full$race=="B" & 
                                        aric_baseline_full$Sex=="F"])
round(prop.table(table(aric_baseline_full$dm_126_base[aric_baseline_full$race=="B" & 
                                                         aric_baseline_full$Sex=="F"]))*100,1)

table(aric_baseline_full$dm_126_base[aric_baseline_full$race=="W" & 
                                        aric_baseline_full$Sex=="F"])
round(prop.table(table(aric_baseline_full$dm_126_base[aric_baseline_full$race=="W" & 
                                                         aric_baseline_full$Sex=="F"]))*100,1)


formatC(x =t.test(aric_baseline_full$dm_126_base[aric_baseline_full$race=="B" & 
                                                    aric_baseline_full$Sex=="F"], 
                  aric_baseline_full$dm_126_base[aric_baseline_full$race=="W" & 
                                                    aric_baseline_full$Sex=="F"])$p.value
        ,digits = 1,format = "E")




chol_med_base: M


   0    1 
1084   36 


   0    1 
96.8  3.2 


   0    1 
3251  323 


 0  1 
91  9 

chol_med_base: F


   0    1 
1895   61 


   0    1 
96.9  3.1 


   0    1 
3897  281 


   0    1 
93.3  6.7 

htn_5_base: M


  0   1 
529 618 


   0    1 
46.1 53.9 


   0    1 
2399 1167 


   0    1 
67.3 32.7 

htn_5_base: F


   0    1 
 825 1132 


   0    1 
42.2 57.8 


   0    1 
3015 1157 


   0    1 
72.3 27.7 

dm_126_base: M


  0   1 
864 272 


   0    1 
76.1 23.9 


   0    1 
3057  514 


   0    1 
85.6 14.4 

dm_126_base: F


   0    1 
1461  489 


   0    1 
74.9 25.1 


   0    1 
3791  383 


   0    1 
90.8  9.2 

In [12]:
### 
# Clinical traits
# dm_126_base, htn_5_base,  chol_med_base, hf_base, chd_base, is_base, hs_base, 
cat("chd_base: M")
table(aric_baseline_full$chd_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"])
round(prop.table(table(aric_baseline_full$chd_base[aric_baseline_full$race=="B" & 
                                                      aric_baseline_full$Sex=="M"]))*100,1)

table(aric_baseline_full$chd_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])
round(prop.table(table(aric_baseline_full$chd_base[aric_baseline_full$race=="W" & 
                                                      aric_baseline_full$Sex=="M"]))*100,1)

wilcox.test(aric_baseline_full$chd_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"], aric_baseline_full$ever_smoke[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])
t.test(aric_baseline_full$chd_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"], 
       aric_baseline_full$chd_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])$p.value

cat("chd_base: F")
table(aric_baseline_full$chd_base[aric_baseline_full$race=="B" & 
                                     aric_baseline_full$Sex=="F"])
round(prop.table(table(aric_baseline_full$chd_base[aric_baseline_full$race=="B" & 
                                                      aric_baseline_full$Sex=="F"]))*100,1)

table(aric_baseline_full$chd_base[aric_baseline_full$race=="W" & 
                                     aric_baseline_full$Sex=="F"])
round(prop.table(table(aric_baseline_full$chd_base[aric_baseline_full$race=="W" & 
                                                      aric_baseline_full$Sex=="F"]))*100,1)

# wilcox.test(aric_baseline_full$chd_base[aric_baseline_full$race=="B" & 
#                                            aric_baseline_full$Sex=="F"], 
#             aric_baseline_full$chd_base[aric_baseline_full$race=="W" & 
#                                            aric_baseline_full$Sex=="F"])

t.test(aric_baseline_full$chd_base[aric_baseline_full$race=="B" & 
                                      aric_baseline_full$Sex=="F"], 
       aric_baseline_full$chd_base[aric_baseline_full$race=="W" & 
                                      aric_baseline_full$Sex=="F"])$p.value

##
# Clinical traits
#  is_base, 

cat("is_base: M")
table(aric_baseline_full$is_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"])
round(prop.table(table(aric_baseline_full$is_base[aric_baseline_full$race=="B" & 
                                                     aric_baseline_full$Sex=="M"]))*100,1)

table(aric_baseline_full$is_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])
round(prop.table(table(aric_baseline_full$is_base[aric_baseline_full$race=="W" & 
                                                     aric_baseline_full$Sex=="M"]))*100,1)

formatC(t.test(aric_baseline_full$is_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"], 
               aric_baseline_full$is_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])$p.value,
        digits = 1,format = "E")

cat("is_base: F")
table(aric_baseline_full$is_base[aric_baseline_full$race=="B" & 
                                    aric_baseline_full$Sex=="F"])
round(prop.table(table(aric_baseline_full$is_base[aric_baseline_full$race=="B" & 
                                                     aric_baseline_full$Sex=="F"]))*100,1)

table(aric_baseline_full$is_base[aric_baseline_full$race=="W" & 
                                    aric_baseline_full$Sex=="F"])
round(prop.table(table(aric_baseline_full$is_base[aric_baseline_full$race=="W" & 
                                                     aric_baseline_full$Sex=="F"]))*100,1)


formatC(x =t.test(aric_baseline_full$is_base[aric_baseline_full$race=="B" & 
                                                aric_baseline_full$Sex=="F"], 
                  aric_baseline_full$is_base[aric_baseline_full$race=="W" & 
                                                aric_baseline_full$Sex=="F"])$p.value,
        digits = 1,format = "E")

# Clinical traits
# hf_base, is_base, 
cat("hf_base: M")
table(aric_baseline_full$hf_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"])
round(prop.table(table(aric_baseline_full$hf_base[aric_baseline_full$race=="B" & 
                                                     aric_baseline_full$Sex=="M"]))*100,1)

table(aric_baseline_full$hf_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])
round(prop.table(table(aric_baseline_full$hf_base[aric_baseline_full$race=="W" & 
                                                     aric_baseline_full$Sex=="M"]))*100,1)

formatC(t.test(aric_baseline_full$hf_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"], 
               aric_baseline_full$hf_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])$p.value,
        digits = 1,format = "E")

cat("hf_base: F")
table(aric_baseline_full$hf_base[aric_baseline_full$race=="B" & 
                                    aric_baseline_full$Sex=="F"])
round(prop.table(table(aric_baseline_full$hf_base[aric_baseline_full$race=="B" & 
                                                     aric_baseline_full$Sex=="F"]))*100,1)

table(aric_baseline_full$hf_base[aric_baseline_full$race=="W" & 
                                    aric_baseline_full$Sex=="F"])
round(prop.table(table(aric_baseline_full$hf_base[aric_baseline_full$race=="W" & 
                                                     aric_baseline_full$Sex=="F"]))*100,1)


formatC(x =t.test(aric_baseline_full$hf_base[aric_baseline_full$race=="B" & 
                                                aric_baseline_full$Sex=="F"], 
                  aric_baseline_full$hf_base[aric_baseline_full$race=="W" & 
                                                aric_baseline_full$Sex=="F"])$p.value,
        digits = 1,format = "E")




chd_base: M


   0    1 
1071   83 


   0    1 
92.8  7.2 


   0    1 
3156  422 


   0    1 
88.2 11.8 


	Wilcoxon rank sum test with continuity correction

data:  aric_baseline_full$chd_base[aric_baseline_full$race == "B" & aric_baseline_full$Sex == "M"] and aric_baseline_full$ever_smoke[aric_baseline_full$race == "W" & aric_baseline_full$Sex == "M"]
W = 691361, p-value < 2.2e-16
alternative hypothesis: true location shift is not equal to 0


chd_base: F


   0    1 
1907   64 


   0    1 
96.8  3.2 


   0    1 
4075  103 


   0    1 
97.5  2.5 

is_base: M


   0    1 
1096   45 


   0    1 
96.1  3.9 


   0    1 
3379   96 


   0    1 
97.2  2.8 

is_base: F


   0    1 
1909   44 


   0    1 
97.7  2.3 


   0    1 
3980   72 


   0    1 
98.2  1.8 

hf_base: M


   0    1 
1081   51 


   0    1 
95.5  4.5 


   0    1 
3364  133 


   0    1 
96.2  3.8 

hf_base: F


   0    1 
1773  173 


   0    1 
91.1  8.9 


   0    1 
3937  196 


   0    1 
95.3  4.7 

In [13]:
# lipids
# chol_base
round(summary(aric_baseline_full$chol_base
              [aric_baseline_full$race=="B" & 
                  aric_baseline_full$Sex=="M"]),1)

cat("M AA chol_base mad=",round(mad(aric_baseline_full$chol_base[aric_baseline_full$race=="B" & 
                                                                    aric_baseline_full$Sex=="M"], na.rm = T),1))
cat("M AA chol_base sd=",round(sd(aric_baseline_full$chol_base[aric_baseline_full$race=="B" & 
                                                                  aric_baseline_full$Sex=="M"], na.rm = T),1))

round(summary(aric_baseline_full$chol_base[aric_baseline_full$race=="W" & 
                                              aric_baseline_full$Sex=="M"]),1)
cat("M EA chol_base mad=",round(mad(aric_baseline_full$chol_base[aric_baseline_full$race=="W" & 
                                                                    aric_baseline_full$Sex=="M"], na.rm = T),1) )
cat("M EA chol_base sd=",round(sd(aric_baseline_full$chol_base[aric_baseline_full$race=="W" & 
                                                                  aric_baseline_full$Sex=="M"], na.rm = T),1) )

wilcox.test(aric_baseline_full$chol_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"],
            aric_baseline_full$chol_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])

t.test(aric_baseline_full$chol_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"],
       aric_baseline_full$chol_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])

# 
round(summary(aric_baseline_full$chol_base[aric_baseline_full$race=="B" & 
                                              aric_baseline_full$Sex=="F"]),1)

cat("F AA chol_base mad=",round(mad(aric_baseline_full$chol_base[aric_baseline_full$race=="B" & 
                                                                    aric_baseline_full$Sex=="F"], na.rm = T),1))
cat("F AA chol_base sd=",round(sd(aric_baseline_full$chol_base[aric_baseline_full$race=="B" & 
                                                                  aric_baseline_full$Sex=="F"], na.rm = T),1))

round(summary(aric_baseline_full$chol_base[aric_baseline_full$race=="W" & 
                                              aric_baseline_full$Sex=="F"]),1)
cat("F EA chol_base mad=",round(mad(aric_baseline_full$chol_base[aric_baseline_full$race=="W" & 
                                                                    aric_baseline_full$Sex=="F"], na.rm = T),1) )
cat("F EA chol_base sd=",round(sd(aric_baseline_full$chol_base[aric_baseline_full$race=="W" & 
                                                                  aric_baseline_full$Sex=="F"], na.rm = T),1) )


wilcox.test(aric_baseline_full$chol_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="F"],
            aric_baseline_full$chol_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="F"])

t.test(aric_baseline_full$chol_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="F"],
       aric_baseline_full$chol_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="F"])

# ldl_base
round(summary(aric_baseline_full$ldl_base[aric_baseline_full$race=="B" & 
                                             aric_baseline_full$Sex=="M"]),1)

cat("M AA ldl_base mad=",round(mad(aric_baseline_full$ldl_base[aric_baseline_full$race=="B" & 
                                                                  aric_baseline_full$Sex=="M"], na.rm = T),1))

cat("M AA ldl_base sd=",round(sd(aric_baseline_full$ldl_base[aric_baseline_full$race=="B" & 
                                                                aric_baseline_full$Sex=="M"], na.rm = T),1))


round(summary(aric_baseline_full$ldl_base[aric_baseline_full$race=="W" & 
                                             aric_baseline_full$Sex=="M"]),1)
cat("M EA ldl_base mad=",round(mad(aric_baseline_full$ldl_base[aric_baseline_full$race=="W" & 
                                                                  aric_baseline_full$Sex=="M"], na.rm = T),1) )
cat("M EA ldl_base sd=",round(sd(aric_baseline_full$ldl_base[aric_baseline_full$race=="W" & 
                                                                aric_baseline_full$Sex=="M"], na.rm = T),1) )

wilcox.test(aric_baseline_full$ldl_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"],
            aric_baseline_full$ldl_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])

t.test(aric_baseline_full$ldl_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"],
       aric_baseline_full$ldl_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])

#
round(summary(aric_baseline_full$ldl_base[aric_baseline_full$race=="B" & 
                                             aric_baseline_full$Sex=="F"]),1)

cat("F AA ldl_base mad=",round(mad(aric_baseline_full$ldl_base[aric_baseline_full$race=="B" & 
                                                                  aric_baseline_full$Sex=="F"], na.rm = T),1))
cat("F AA ldl_base sd=",round(sd(aric_baseline_full$ldl_base[aric_baseline_full$race=="B" & 
                                                                aric_baseline_full$Sex=="F"], na.rm = T),1))


round(summary(aric_baseline_full$ldl_base[aric_baseline_full$race=="W" & 
                                             aric_baseline_full$Sex=="F"]),1)
cat("F EA ldl_base mad=",round(mad(aric_baseline_full$ldl_base[aric_baseline_full$race=="W" & 
                                                                  aric_baseline_full$Sex=="F"], na.rm = T),1) )
cat("F EA ldl_base sd=",round(sd(aric_baseline_full$ldl_base[aric_baseline_full$race=="W" & 
                                                                aric_baseline_full$Sex=="F"], na.rm = T),1) )

wilcox.test(aric_baseline_full$ldl_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="F"],
            aric_baseline_full$ldl_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="F"])
t.test(aric_baseline_full$ldl_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="F"],
       aric_baseline_full$ldl_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="F"])


# hdl_base
round(summary(aric_baseline_full$hdl_base[aric_baseline_full$race=="B" & 
                                             aric_baseline_full$Sex=="M"]),1)

cat("AA hdl_base mad=",round(mad(aric_baseline_full$hdl_base[aric_baseline_full$race=="B" & 
                                                                aric_baseline_full$Sex=="M"], na.rm = T),1))
cat("AA hdl_base sd=",round(sd(aric_baseline_full$hdl_base[aric_baseline_full$race=="B" & 
                                                              aric_baseline_full$Sex=="M"], na.rm = T),1))

round(summary(aric_baseline_full$hdl_base[aric_baseline_full$race=="W" & 
                                             aric_baseline_full$Sex=="M"]),1)
cat("EA hdl_base mad=",round(mad(aric_baseline_full$hdl_base[aric_baseline_full$race=="W" & 
                                                                aric_baseline_full$Sex=="M"], na.rm = T),1) )
cat("EA hdl_base sd=",round(sd(aric_baseline_full$hdl_base[aric_baseline_full$race=="W" & 
                                                              aric_baseline_full$Sex=="M"], na.rm = T),1) )

wilcox.test(aric_baseline_full$hdl_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"],
            aric_baseline_full$hdl_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])

t.test(aric_baseline_full$hdl_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"],
       aric_baseline_full$hdl_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])

#
round(summary(aric_baseline_full$hdl_base[aric_baseline_full$race=="B" & 
                                             aric_baseline_full$Sex=="F"]),1)

cat("F AA hdl_base mad=",round(mad(aric_baseline_full$hdl_base[aric_baseline_full$race=="B" & 
                                                                  aric_baseline_full$Sex=="F"], na.rm = T),1))
cat("F AA hdl_base sd=",round(sd(aric_baseline_full$hdl_base[aric_baseline_full$race=="B" & 
                                                                aric_baseline_full$Sex=="F"], na.rm = T),1))

round(summary(aric_baseline_full$hdl_base[aric_baseline_full$race=="W" & 
                                             aric_baseline_full$Sex=="F"]),1)
cat("F EA hdl_base mad=",round(mad(aric_baseline_full$hdl_base[aric_baseline_full$race=="W" & 
                                                                  aric_baseline_full$Sex=="F"], na.rm = T),1) )
cat("F EA hdl_base sd=",round(sd(aric_baseline_full$hdl_base[aric_baseline_full$race=="W" & 
                                                                aric_baseline_full$Sex=="F"], na.rm = T),1) )

wilcox.test(aric_baseline_full$hdl_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="F"],
            aric_baseline_full$hdl_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="F"])
t.test(aric_baseline_full$hdl_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="F"],
       aric_baseline_full$hdl_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="F"])
# tg_base
round(summary(aric_baseline_full$tg_base[aric_baseline_full$race=="B" & 
                                            aric_baseline_full$Sex=="M"]),1)

cat("AA tg_base mad=",round(mad(aric_baseline_full$tg_base[aric_baseline_full$race=="B" & 
                                                              aric_baseline_full$Sex=="M"], na.rm = T),1))
cat("AA tg_base sd=",round(sd(aric_baseline_full$tg_base[aric_baseline_full$race=="B" & 
                                                            aric_baseline_full$Sex=="M"], na.rm = T),1))

round(summary(aric_baseline_full$tg_base[aric_baseline_full$race=="W" & 
                                            aric_baseline_full$Sex=="M"]),1)
cat("EA tg_base mad=",round(mad(aric_baseline_full$tg_base[aric_baseline_full$race=="W" & 
                                                              aric_baseline_full$Sex=="M"], na.rm = T),1) )
cat("EA tg_base sd=",round(sd(aric_baseline_full$tg_base[aric_baseline_full$race=="W" & 
                                                            aric_baseline_full$Sex=="M"], na.rm = T),1) )

wilcox.test(aric_baseline_full$tg_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"],
            aric_baseline_full$tg_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])
t.test(aric_baseline_full$tg_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="M"],
       aric_baseline_full$tg_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="M"])

#
round(summary(aric_baseline_full$tg_base[aric_baseline_full$race=="B" & 
                                            aric_baseline_full$Sex=="F"]),1)

cat("F AA tg_base mad=",round(mad(aric_baseline_full$tg_base[aric_baseline_full$race=="B" & 
                                                                aric_baseline_full$Sex=="F"], na.rm = T),1))
cat("F AA tg_base sd=",round(sd(aric_baseline_full$tg_base[aric_baseline_full$race=="B" & 
                                                              aric_baseline_full$Sex=="F"], na.rm = T),1))

round(summary(aric_baseline_full$tg_base[aric_baseline_full$race=="W" & 
                                            aric_baseline_full$Sex=="F"]),1)
cat("F EA tg_base mad=",round(mad(aric_baseline_full$tg_base[aric_baseline_full$race=="W" & 
                                                                aric_baseline_full$Sex=="F"], na.rm = T),1) )
cat("F EA tg_base sd=",round(sd(aric_baseline_full$tg_base[aric_baseline_full$race=="W" & 
                                                              aric_baseline_full$Sex=="F"], na.rm = T),1) )

wilcox.test(aric_baseline_full$tg_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="F"],
            aric_baseline_full$tg_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="F"])

t.test(aric_baseline_full$tg_base[aric_baseline_full$race=="B" & aric_baseline_full$Sex=="F"],
       aric_baseline_full$tg_base[aric_baseline_full$race=="W" & aric_baseline_full$Sex=="F"])

#


   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
    2.9     4.6     5.2    11.2     6.0   286.0       4 

M AA chol_base mad= 1M AA chol_base sd= 33

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
    2.2     4.7     5.2     8.1     5.9   263.0 

M EA chol_base mad= 0.9M EA chol_base sd= 23.4


	Wilcoxon rank sum test with continuity correction

data:  aric_baseline_full$chol_base[aric_baseline_full$race == "B" & aric_baseline_full$Sex == "M"] and aric_baseline_full$chol_base[aric_baseline_full$race == "W" & aric_baseline_full$Sex == "M"]
W = 2052019, p-value = 0.8947
alternative hypothesis: true location shift is not equal to 0



	Welch Two Sample t-test

data:  aric_baseline_full$chol_base[aric_baseline_full$race == "B" & aric_baseline_full$Sex == "M"] and aric_baseline_full$chol_base[aric_baseline_full$race == "W" & aric_baseline_full$Sex == "M"]
t = 2.8929, df = 1540.1, p-value = 0.00387
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 0.9758825 5.0861005
sample estimates:
mean of x mean of y 
11.179466  8.148474 


   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
    2.6     4.8     5.5    10.2     6.2   337.0      11 

F AA chol_base mad= 1.1F AA chol_base sd= 30.5

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
    2.2     4.9     5.5     7.5     6.2   272.0 

F EA chol_base mad= 0.9F EA chol_base sd= 20


	Wilcoxon rank sum test with continuity correction

data:  aric_baseline_full$chol_base[aric_baseline_full$race == "B" & aric_baseline_full$Sex == "F"] and aric_baseline_full$chol_base[aric_baseline_full$race == "W" & aric_baseline_full$Sex == "F"]
W = 4051068, p-value = 0.5028
alternative hypothesis: true location shift is not equal to 0



	Welch Two Sample t-test

data:  aric_baseline_full$chol_base[aric_baseline_full$race == "B" & aric_baseline_full$Sex == "F"] and aric_baseline_full$chol_base[aric_baseline_full$race == "W" & aric_baseline_full$Sex == "F"]
t = 3.5352, df = 2774.6, p-value = 0.0004142
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 1.188634 4.149440
sample estimates:
mean of x mean of y 
10.170855  7.501818 


   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
    0.0     2.8     3.4     7.2     4.1   210.0      22 

M AA ldl_base mad= 1M AA ldl_base sd= 21.5

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
    0.8     2.9     3.4     5.3     4.0   175.2      89 

M EA ldl_base mad= 0.8M EA ldl_base sd= 14.8


	Wilcoxon rank sum test with continuity correction

data:  aric_baseline_full$ldl_base[aric_baseline_full$race == "B" & aric_baseline_full$Sex == "M"] and aric_baseline_full$ldl_base[aric_baseline_full$race == "W" & aric_baseline_full$Sex == "M"]
W = 1909520, p-value = 0.09432
alternative hypothesis: true location shift is not equal to 0



	Welch Two Sample t-test

data:  aric_baseline_full$ldl_base[aric_baseline_full$race == "B" & aric_baseline_full$Sex == "M"] and aric_baseline_full$ldl_base[aric_baseline_full$race == "W" & aric_baseline_full$Sex == "M"]
t = 2.8206, df = 1495.9, p-value = 0.004856
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 0.5902805 3.2859190
sample estimates:
mean of x mean of y 
 7.197095  5.258995 


   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
    0.4     2.8     3.5     6.3     4.2   238.6      22 

F AA ldl_base mad= 1F AA ldl_base sd= 19

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
    0.3     2.8     3.3     4.6     4.0   196.8      77 

F EA ldl_base mad= 0.9F EA ldl_base sd= 12.4


	Wilcoxon rank sum test with continuity correction

data:  aric_baseline_full$ldl_base[aric_baseline_full$race == "B" & aric_baseline_full$Sex == "F"] and aric_baseline_full$ldl_base[aric_baseline_full$race == "W" & aric_baseline_full$Sex == "F"]
W = 4237022, p-value = 0.0001508
alternative hypothesis: true location shift is not equal to 0



	Welch Two Sample t-test

data:  aric_baseline_full$ldl_base[aric_baseline_full$race == "B" & aric_baseline_full$Sex == "F"] and aric_baseline_full$ldl_base[aric_baseline_full$race == "W" & aric_baseline_full$Sex == "F"]
t = 3.7186, df = 2756.9, p-value = 0.0002043
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 0.8304963 2.6833789
sample estimates:
mean of x mean of y 
 6.345782  4.588845 


   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
    0.3     1.0     1.2     2.8     1.5    94.0       8 

AA hdl_base mad= 0.4AA hdl_base sd= 8.8

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
    0.3     0.9     1.0     1.7     1.2    83.0       1 

EA hdl_base mad= 0.3EA hdl_base sd= 5.1


	Wilcoxon rank sum test with continuity correction

data:  aric_baseline_full$hdl_base[aric_baseline_full$race == "B" & aric_baseline_full$Sex == "M"] and aric_baseline_full$hdl_base[aric_baseline_full$race == "W" & aric_baseline_full$Sex == "M"]
W = 2633895, p-value < 2.2e-16
alternative hypothesis: true location shift is not equal to 0



	Welch Two Sample t-test

data:  aric_baseline_full$hdl_base[aric_baseline_full$race == "B" & aric_baseline_full$Sex == "M"] and aric_baseline_full$hdl_base[aric_baseline_full$race == "W" & aric_baseline_full$Sex == "M"]
t = 4.091, df = 1401.6, p-value = 4.54e-05
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 0.5845707 1.6616562
sample estimates:
mean of x mean of y 
 2.815680  1.692566 


   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
    0.3     1.2     1.4     2.7     1.7   102.0      14 

F AA hdl_base mad= 0.4F AA hdl_base sd= 8.4

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
    0.1     1.1     1.4     2.0     1.7    92.0      20 

F EA hdl_base mad= 0.4F EA hdl_base sd= 5.4


	Wilcoxon rank sum test with continuity correction

data:  aric_baseline_full$hdl_base[aric_baseline_full$race == "B" & aric_baseline_full$Sex == "F"] and aric_baseline_full$hdl_base[aric_baseline_full$race == "W" & aric_baseline_full$Sex == "F"]
W = 4175910, p-value = 0.0956
alternative hypothesis: true location shift is not equal to 0



	Welch Two Sample t-test

data:  aric_baseline_full$hdl_base[aric_baseline_full$race == "B" & aric_baseline_full$Sex == "F"] and aric_baseline_full$hdl_base[aric_baseline_full$race == "W" & aric_baseline_full$Sex == "F"]
t = 3.6685, df = 2742.4, p-value = 0.0002486
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 0.3533823 1.1649137
sample estimates:
mean of x mean of y 
 2.714748  1.955600 


   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
    0.3     0.8     1.1     4.5     1.7   249.0       4 

AA tg_base mad= 0.6AA tg_base sd= 18.9

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
    0.3     1.0     1.4     4.1     2.1   542.0 

EA tg_base mad= 0.7EA tg_base sd= 22.5


	Wilcoxon rank sum test with continuity correction

data:  aric_baseline_full$tg_base[aric_baseline_full$race == "B" & aric_baseline_full$Sex == "M"] and aric_baseline_full$tg_base[aric_baseline_full$race == "W" & aric_baseline_full$Sex == "M"]
W = 1607784, p-value < 2.2e-16
alternative hypothesis: true location shift is not equal to 0



	Welch Two Sample t-test

data:  aric_baseline_full$tg_base[aric_baseline_full$race == "B" & aric_baseline_full$Sex == "M"] and aric_baseline_full$tg_base[aric_baseline_full$race == "W" & aric_baseline_full$Sex == "M"]
t = 0.65502, df = 2285.1, p-value = 0.5125
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 -0.876829  1.756389
sample estimates:
mean of x mean of y 
 4.533431  4.093651 


   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
    0.1     0.8     1.1     4.1     1.5   331.0      10 

F AA tg_base mad= 0.5F AA tg_base sd= 20.7

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
    0.4     1.0     1.3     2.9     1.9   350.0 

F EA tg_base mad= 0.6F EA tg_base sd= 15.4


	Wilcoxon rank sum test with continuity correction

data:  aric_baseline_full$tg_base[aric_baseline_full$race == "B" & aric_baseline_full$Sex == "F"] and aric_baseline_full$tg_base[aric_baseline_full$race == "W" & aric_baseline_full$Sex == "F"]
W = 3269785, p-value < 2.2e-16
alternative hypothesis: true location shift is not equal to 0



	Welch Two Sample t-test

data:  aric_baseline_full$tg_base[aric_baseline_full$race == "B" & aric_baseline_full$Sex == "F"] and aric_baseline_full$tg_base[aric_baseline_full$race == "W" & aric_baseline_full$Sex == "F"]
t = 2.1784, df = 3009.5, p-value = 0.02945
alternative hypothesis: true difference in means is not equal to 0
95 percent confidence interval:
 0.1142695 2.1731574
sample estimates:
mean of x mean of y 
 4.062461  2.918748 


Follow-up: M

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
     NA      NA      NA     NaN      NA      NA    1154 

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max.    NA's 
     NA      NA      NA     NaN      NA      NA    3578 

ERROR: Error in wilcox.test.default(aric_baseline_full$dAge[aric_baseline_full$race == : not enough (non-missing) 'x' observations
