In [1]:
# Attach the packages this notebook uses directly. library() is used instead
# of require() so that a missing package stops the notebook here with a clear
# error, rather than returning FALSE and failing later at the first call.
library(Matrix)
library(tibble)
# Project helper functions used by the cells below (for example
# load_windowed_correlation_data and gen_contact_corr_summary).
# NOTE(review): the path is relative to the notebook's working directory.
utilities_path <- "../correlation_network_analysis_functions.r"
source(utilities_path)

Loading required package: Matrix
Loading required package: tibble
Loading required package: mgcv
Loading required package: nlme
This is mgcv 1.8-16. For overview type 'help("mgcv-package")'.
Loading required package: MASS
Loading required package: ggplot2
Loading required package: dplyr

Attaching package: ‘dplyr’

The following object is masked from ‘package:MASS’:

    select

The following object is masked from ‘package:nlme’:

    collapse

The following objects are masked from ‘package:stats’:

    filter, lag

The following objects are masked from ‘package:base’:

    intersect, setdiff, setequal, union

Loading required package: reshape2
Loading required package: RColorBrewer
Loading required package: colorRamps
Loading required package: tidyr

Attaching package: ‘tidyr’

The following object is masked from ‘package:reshape2’:

    smiths

The following object is masked from ‘package:Matrix’:

    expand

Loading required package: colorspace
Loading required package: igraph

Att

In [7]:
# ---- Run configuration ------------------------------------------------------
# Root directories handed to the data loader (both are the current directory).
basepath <- "./"
baseinfodir <- "./"
# Directory that receives the exported tables.
analysisDir <- paste(basepath, "analysis", sep = "/")

# File names passed to the loader.
datafilename <- "contact.corr"
contactmapname <- "contact.contact"
coordfilename <- "carma.average.pdb"
resinfofilename <- "resinfo.cpptraj.dat"
atominfofilename <- "atominfo.cpptraj.dat"

# Systems and window indices to load.
system_list <- c("wt", "R206H", "Q207E", "Q207D")
window_list <- 0:4

In [3]:
# Load the contact and correlation maps generated by carma for every system
# and window into one list of data frames, with residue naming information
# attached by the loader.
data_list <- load_windowed_correlation_data(
    basepath = basepath,
    baseinfodir = baseinfodir,
    datafilename = datafilename,
    contactmapname = contactmapname,
    resinfofilename = resinfofilename,
    atominfofilename = atominfofilename,
    coordfilename = coordfilename,
    system_list = system_list,
    window_list = window_list,
    skip_corr_header_rows = 1,
    datafiles_as_arrays = TRUE,
    contactfiles_as_arrays = TRUE
)

# Pull the individual tables out of the loader result by exact name.
windowed_corr_data <- data_list[["windowed_corr_data"]]
windowed_contact_map <- data_list[["windowed_contact_data"]]
resData <- data_list[["res_data"]]

# Combine the windowed correlation and contact tables into a per-system summary.
contact_corr <- gen_contact_corr_summary(
    windowed_corr_data,
    windowed_contact_map,
    verbose = TRUE
)

# Quick look at the summary and at the structure of the loaded data.
head(contact_corr)
glimpse(data_list)

[1] "loading data for wt"
[1] "-loading system structure data"
[1] "-loading windowed correlation and contact data:"
-     0  1  2  3  4
[1] "loading data for R206H"
[1] "-loading system structure data"
[1] "-loading windowed correlation and contact data:"
-     0  1  2  3  4
[1] "loading data for Q207E"
[1] "-loading system structure data"
[1] "-loading windowed correlation and contact data:"
-     0  1  2  3  4
[1] "loading data for Q207D"
[1] "-loading system structure data"
[1] "-loading windowed correlation and contact data:"
-     0  1  2  3  4
[1] "Done!"
[1] "melting windowed_corr_data"
[1] "melting windowed_contact_data"
[1] "joining melted data"
[1] "re-spreading melted data"
[1] "computing windowed_data summary"


SYSTEM,X,Y,X_RES,Y_RES,X_RESNAME,Y_RESNAME,X_Residue,Y_Residue,CONTACT,CORR,CONTACT_stdev
Q207D,1,3,172,174,THR,ASN,THR_172,ASN_174,0.349506,0.8737799,0.47858759
Q207D,2,4,173,175,THR,VAL,THR_173,VAL_175,0.608728,0.7641681,0.34391265
Q207D,3,1,174,172,ASN,THR,ASN_174,THR_172,0.349506,0.8737799,0.47858759
Q207D,3,5,174,176,ASN,GLY,ASN_174,GLY_176,0.655322,0.6626401,0.07742486
Q207D,4,2,175,173,VAL,THR,VAL_175,THR_173,0.608728,0.7641681,0.34391265
Q207D,4,6,175,177,VAL,ASP,VAL_175,ASP_177,0.336552,0.5694814,0.31303522


List of 3
 $ windowed_corr_data   :'data.frame':	3767120 obs. of  11 variables:
  ..$ SYSTEM   : chr [1:3767120] "wt" "wt" "wt" "wt" ...
  ..$ WINDOW   : int [1:3767120] 0 0 0 0 0 0 0 0 0 0 ...
  ..$ X        : int [1:3767120] 1 2 3 4 5 6 7 8 9 10 ...
  ..$ Y        : int [1:3767120] 1 1 1 1 1 1 1 1 1 1 ...
  ..$ X_RES    : int [1:3767120] 172 173 174 175 176 177 178 179 180 181 ...
  ..$ Y_RES    : int [1:3767120] 172 172 172 172 172 172 172 172 172 172 ...
  ..$ X_RESNAME: Factor w/ 20 levels "ALA","ARG","ASN",..: 17 17 3 20 8 4 16 17 11 1 ...
  ..$ Y_RESNAME: Factor w/ 20 levels "ALA","ARG","ASN",..: 17 17 17 17 17 17 17 17 17 17 ...
  ..$ X_Residue: chr [1:3767120] "THR_172" "THR_173" "ASN_174" "VAL_175" ...
  ..$ Y_Residue: chr [1:3767120] "THR_172" "THR_172" "THR_172" "THR_172" ...
  ..$ CORR     : num [1:3767120] 0 0 0.719 0 0 ...
 $ windowed_contact_data:'data.frame':	3784500 obs. of  11 variables:
  ..$ SYSTEM   : chr [1:3784500] "wt" "wt" "wt" "wt" ...
  ..$ WINDOW   : int [1

In [8]:
# Export the loaded tables as plain-text files (unquoted, no row names) so
# later cells can reload them without repeating the loading step.
# Create the output directory first: write.table() cannot open a file inside
# a directory that does not exist. This is a no-op when it is already there.
dir.create(analysisDir, showWarnings = FALSE, recursive = TRUE)

# Per-window correlation table. [[ ]] is used instead of $ so the element
# name is matched exactly rather than by prefix.
write.table(x = data_list[["windowed_corr_data"]],
            file = paste0(analysisDir, "/joint_windowed_correlation_data_table.dat"),
            quote = FALSE, row.names = FALSE)
# Contact/correlation summary produced by gen_contact_corr_summary().
write.table(x = contact_corr,
            file = paste0(analysisDir, "/joint_contact_averaged_correlation_data_table.dat"),
            quote = FALSE, row.names = FALSE)
# Residue information table.
write.table(x = data_list[["res_data"]],
            file = paste0(analysisDir, "/joint_res_data_table.dat"),
            quote = FALSE, row.names = FALSE)

In [12]:
# Reload the exported per-window correlation table, keep only windows after
# window 0, and add CONTACT: 1 where CORR is non-zero, 0 otherwise.
equil_windowed_corr_data <- mutate(
    filter(
        read.table(
            paste0(analysisDir, "/joint_windowed_correlation_data_table.dat"),
            header = TRUE
        ),
        WINDOW > 0
    ),
    CONTACT = as.numeric(abs(CORR) > 0)
)
head(equil_windowed_corr_data)

SYSTEM,WINDOW,X,Y,X_RES,Y_RES,X_RESNAME,Y_RESNAME,X_Residue,Y_Residue,CORR,CONTACT
wt,1,1,1,172,172,THR,THR,THR_172,THR_172,0.0,0
wt,1,2,1,173,172,THR,THR,THR_173,THR_172,0.0,0
wt,1,3,1,174,172,ASN,THR,ASN_174,THR_172,0.86239,1
wt,1,4,1,175,172,VAL,THR,VAL_175,THR_172,0.0,0
wt,1,5,1,176,172,GLY,THR,GLY_176,THR_172,0.0,0
wt,1,6,1,177,172,ASP,THR,ASP_177,THR_172,0.0,0
