
This script analyzes the PE_3 pooled sequencing data using the package poolfstat



In [4]:
# Work from the PE3 analysis directory: the relative "./PoPoolation/..." paths
# used when reading the sync files later in this script resolve against it.
setwd("~/Dropbox/U Chicago/Projects/France/DataAnalysis_Figures/PE3_DataAnalysis/")

# poolfstat supplies the pool-seq import and Fst routines used in this script.
library(poolfstat)
# NOTE(review): corrplot, ggplot2 and reshape2 are not referenced in the
# visible part of this script - presumably used by plotting code elsewhere;
# confirm before removing.
library(corrplot)
library(ggplot2)
library(reshape2)

In [None]:
## Sync file with all larval full-population samples (Sync_2.sync).
## These results were used in the generation of Figure 4b.

# Pool size for each pool, keyed by pool name. The order of this vector is the
# order in which names and sizes are handed to popsync2pooldata().
# NOTE(review): presumably this must match the pool order in the sync file -
# confirm against how Sync_2.sync was built.
all_fulldstbn_poolsizes <- c(
  Embryos          = 100000,
  D25Low_LB2       = 2500,
  D25High_LB10     = 2500,
  D25Low_LB3       = 2500,
  D25High_LB12     = 2500,
  D25High_LB5      = 2500,
  D25Low_LB8       = 2500,
  D6High_LB4       = 25000,
  D6Low_LB7        = 25000,
  SettledLow_LB2   = 250,
  SettledHigh_LB10 = 250,
  SettledLow_LB3   = 250,
  SettledHigh_LB5  = 250,
  SettledLow_LB8   = 250
)
all_fulldstbn_samples <- names(all_fulldstbn_poolsizes)

# Read the sync file into a pooldata object, applying read-count, coverage and
# MAF filters and discarding indels.
all_fulldstbn <- popsync2pooldata(
  "./PoPoolation/SyncFiles/Sync_2.sync",
  poolsizes = unname(all_fulldstbn_poolsizes),
  poolnames = all_fulldstbn_samples,
  min.rc = 2,
  min.cov.per.pool = 50,
  max.cov.per.pool = 400,
  min.maf = 0.05,
  noindel = TRUE,
  nlines.per.readblock = 1e+06
)

# Fst computed over all pools, with per-SNP values (Anova method).
all_fulldstbn_SNPFst <- computeFST(
  all_fulldstbn,
  method = "Anova",
  snp.index = NA
)

# Pairwise Fst between every pair of pools, using the same coverage and MAF
# thresholds as the import step above; per-SNP values are not kept.
all_fulldstbn_Fst <- computePairwiseFSTmatrix(
  all_fulldstbn,
  method = "Anova",
  min.cov.per.pool = 50,
  max.cov.per.pool = 400,
  min.maf = 0.05,
  output.snp.values = FALSE
)

# Plain matrix copy of the pairwise Fst estimates.
all_fulldstbn_PairwiseFSTMatrix <- as.matrix(
  as.data.frame(all_fulldstbn_Fst$PairwiseFSTmatrix)
)




In [None]:
# Fst between the samples collected on Day 6.
# The results were used for Figure S2.

# Pool size for each pool, keyed by pool name. The order of this vector is the
# order in which names and sizes are handed to popsync2pooldata().
# NOTE(review): presumably this must match the pool order in the sync file -
# confirm against how Sync_3.sync was built.
Embr_D6all_D25_poolsizes <- c(
  Embryos           = 100000,
  D25Low_LB2        = 2500,
  D25High_LB10      = 2500,
  D25Low_LB3        = 2500,
  D25High_LB12      = 2500,
  D25High_LB5       = 2500,
  D25Low_LB8        = 2500,
  D6High_Large_LB11 = 5250,
  D6Low_Large_LB9   = 4250,
  D6High_Large_LB6  = 5250,
  D6Low_Large_LB1   = 4250,
  D6High_Small_LB11 = 19750,
  D6Low_Small_LB9   = 20750,
  D6High_Small_LB6  = 19750,
  D6Low_Small_LB1   = 20750,
  D6High_LB4        = 25000,
  D6Low_LB7         = 25000
)
Embr_D6all_D25_samples <- names(Embr_D6all_D25_poolsizes)

# Note: this sync file was generated using an allele frequency matrix with
# more stringent MAF filtering.
Embr_D6all_D25_pooldata <- popsync2pooldata(
  "./PoPoolation/SyncFiles/Sync_3.sync",
  poolsizes = unname(Embr_D6all_D25_poolsizes),
  poolnames = Embr_D6all_D25_samples,
  min.rc = 2,
  min.cov.per.pool = 50,
  max.cov.per.pool = 400,
  min.maf = 0.05,
  noindel = TRUE,
  nlines.per.readblock = 1e+06
)

# Fst computed over all pools, with per-SNP values (Anova method).
Embr_D6All_D25_SNPFst <- computeFST(
  Embr_D6all_D25_pooldata,
  method = "Anova",
  snp.index = NA
)

# Pairwise Fst between every pair of pools, using the same coverage and MAF
# thresholds as the import step above; per-SNP values are not kept.
Embr_D6All_D25_Fst <- computePairwiseFSTmatrix(
  Embr_D6all_D25_pooldata,
  method = "Anova",
  min.cov.per.pool = 50,
  max.cov.per.pool = 400,
  min.maf = 0.05,
  output.snp.values = FALSE
)

# Plain matrix copy of the pairwise Fst estimates.
Embr_D6All_D25_PairwiseFSTMatrix <- as.matrix(
  as.data.frame(Embr_D6All_D25_Fst$PairwiseFSTmatrix)
)

# Keep only the Day 6 High (rows) versus Day 6 Low (columns) comparisons.
D6_high_pools <- c(
  "D6High_LB4",
  "D6High_Large_LB6",
  "D6High_Large_LB11",
  "D6High_Small_LB6",
  "D6High_Small_LB11"
)
D6_low_pools <- c(
  "D6Low_LB7",
  "D6Low_Large_LB1",
  "D6Low_Large_LB9",
  "D6Low_Small_LB1",
  "D6Low_Small_LB9"
)
D6_Fst <- Embr_D6All_D25_PairwiseFSTMatrix[D6_high_pools, D6_low_pools]

# Save the High-vs-Low Day 6 Fst table.
write.csv(D6_Fst, "~/Dropbox/D6_Fst.csv")