### Subsetting HIPPIE interactions with human orthologs of yeast genetic interactors of Htt protein
#### Mason et al_2013

In [1]:
##################################################################
## HIPPIE dataset subset with Mason2013 - human orthologs      ###
##################################################################

# Purpose: keep every HIPPIE interaction (df1) in which at least one of the
# two interactors (ID.Interactor.A or ID.Interactor.B) carries an Entrez Gene
# ID listed in the query table (df2$entrezgene).
#   toy example: df1 <- data.frame(A = sample(1:10, 10), B = sample(1:10, 10))
#                df2 <- data.frame(C = 1:5)
#                df1[df1$A %in% df2$C | df1$B %in% df2$C, ]

# Input files are read relative to this folder; the (commented-out) export at
# the bottom of the cell would be written here as well.
path <- "C:/Users/Sonali/Box Sync/Huntington Interactome/MutantHTT_Interactors/Yeast/MutantHttSuppressors_green"
setwd(path)

# Read the HIPPIE dataset ----
df1 <- read.delim(file = "HIPPIE_lastupdated090514_cleaned.txt", header = TRUE, sep = "\t")

# A missing ID column would make `$` return NULL and the filter below would
# silently select nothing, so stop with an explicit message instead.
if (!all(c("ID.Interactor.A", "ID.Interactor.B") %in% names(df1))) {
  stop("HIPPIE table must contain columns 'ID.Interactor.A' and 'ID.Interactor.B'",
       call. = FALSE)
}

# Preview: up to 10 rows of the first 4 columns. head() never pads the
# preview with NA rows when the table is shorter than 10 rows.
head(df1[, 1:4], 10)

# Read the query table holding the Entrez Gene IDs of the human orthologs ----
df2 <- read.delim(file = "MasonHumanOrthologs.txt", header = TRUE, sep = "\t")

if (!("entrezgene" %in% names(df2))) {
  stop("Ortholog table must contain a column named 'entrezgene'", call. = FALSE)
}

dim(df1)
dim(df2)

# Row filter ----
# Logical vector with one entry per HIPPIE row: TRUE when interactor A OR
# interactor B is found among the query Entrez IDs. `[[` is used so that the
# column names are matched exactly (no partial matching as with `$`).
queryIds <- df2[["entrezgene"]]
selectedRows <- df1[["ID.Interactor.A"]] %in% queryIds |
  df1[["ID.Interactor.B"]] %in% queryIds

# Subset the full HIPPIE table, keeping all of its columns ----
dfReduced <- df1[selectedRows, ]
dim(dfReduced) # dimensions of the filtered table
head(dfReduced[, 1:4], 10) # up to 10 rows, first 4 columns

#dfReduced ## have a look at the result.
## class(dfReduced)

# write.table(dfReduced, file="Mason2013_Hip_Interactns.txt", sep="\t", col.names = NA) ### export file in text format to the folder.

sessionInfo()




ID.Interactor.A,ID.Interactor.B,Alt.IDs.Interactor.A,Alt.IDs.Interactor.B
216,216,AL1A1_HUMAN,AL1A1_HUMAN
3679,1134,ITA7_HUMAN,ACHA_HUMAN
55607,71,NEB1_HUMAN,ACTG_HUMAN
5552,960,SRGN_HUMAN,CD44_HUMAN
2886,2064,GRB7_HUMAN,ERBB2_HUMAN
5058,2064,PAK1_HUMAN,ERBB2_HUMAN
1742,2064,DLG4_HUMAN,ERBB2_HUMAN
5296,2064,P85B_HUMAN,ERBB2_HUMAN
26469,2064,PTN18_HUMAN,ERBB2_HUMAN
55914,2064,LAP2_HUMAN,ERBB2_HUMAN


Unnamed: 0,ID.Interactor.A,ID.Interactor.B,Alt.IDs.Interactor.A,Alt.IDs.Interactor.B
893,6517,3418,GTR4_HUMAN,IDHP_HUMAN
2236,56915,5315,EXOS5_HUMAN,KPYM_HUMAN
2469,11144,5888,DMC1_HUMAN,RAD51_HUMAN
2757,51194,6136,IPO11_HUMAN,RL12_HUMAN
3399,56897,5425,WRIP1_HUMAN,DPOD2_HUMAN
3404,56897,5424,WRIP1_HUMAN,DPOD1_HUMAN
3405,56897,57804,WRIP1_HUMAN,DPOD4_HUMAN
4484,112858,7157,PRPK_HUMAN,P53_HUMAN
4985,475,538,ATOX1_HUMAN,ATP7A_HUMAN
5105,6654,529,SOS1_HUMAN,VATE1_HUMAN


R version 3.3.1 (2016-06-21)
Platform: x86_64-w64-mingw32/x64 (64-bit)
Running under: Windows 10 x64 (build 14393)

locale:
[1] LC_COLLATE=English_United States.1252 
[2] LC_CTYPE=English_United States.1252   
[3] LC_MONETARY=English_United States.1252
[4] LC_NUMERIC=C                          
[5] LC_TIME=English_United States.1252    

attached base packages:
[1] stats     graphics  grDevices utils     datasets  methods   base     

loaded via a namespace (and not attached):
 [1] R6_2.2.0            magrittr_1.5        IRdisplay_0.4.4    
 [4] pbdZMQ_0.2-5        tools_3.3.1         crayon_1.3.2       
 [7] uuid_0.1-2          stringi_1.1.5       IRkernel_0.8.6.9000
[10] jsonlite_1.4        stringr_1.2.0       digest_0.6.12      
[13] repr_0.12.0         evaluate_0.10      

#### Giorgini et al_2005

In [2]:
##################################################################
## HIPPIE dataset subset with Giorgini2005 - human orthologs   ###
##################################################################

# Purpose: keep every HIPPIE interaction (df1) in which at least one of the
# two interactors (ID.Interactor.A or ID.Interactor.B) carries an Entrez Gene
# ID listed in the query table (df2$entrezgene).
#   toy example: df1 <- data.frame(A = sample(1:10, 10), B = sample(1:10, 10))
#                df2 <- data.frame(C = 1:5)
#                df1[df1$A %in% df2$C | df1$B %in% df2$C, ]

# Input files are read relative to this folder; the (commented-out) export at
# the bottom of the cell would be written here as well.
path <- "C:/Users/Sonali/Box Sync/Huntington Interactome/MutantHTT_Interactors/Yeast/MutantHttSuppressors_green"
setwd(path)

# Read the HIPPIE dataset ----
df1 <- read.delim(file = "HIPPIE_lastupdated090514_cleaned.txt", header = TRUE, sep = "\t")

# A missing ID column would make `$` return NULL and the filter below would
# silently select nothing, so stop with an explicit message instead.
if (!all(c("ID.Interactor.A", "ID.Interactor.B") %in% names(df1))) {
  stop("HIPPIE table must contain columns 'ID.Interactor.A' and 'ID.Interactor.B'",
       call. = FALSE)
}

# Preview: up to 10 rows of the first 4 columns. head() never pads the
# preview with NA rows when the table is shorter than 10 rows.
head(df1[, 1:4], 10)

# Read the query table holding the Entrez Gene IDs of the human orthologs ----
df2 <- read.delim(file = "GiorginiHumanOrthologs.txt", header = TRUE, sep = "\t")

if (!("entrezgene" %in% names(df2))) {
  stop("Ortholog table must contain a column named 'entrezgene'", call. = FALSE)
}

dim(df1)
dim(df2)

# Row filter ----
# Logical vector with one entry per HIPPIE row: TRUE when interactor A OR
# interactor B is found among the query Entrez IDs. `[[` is used so that the
# column names are matched exactly (no partial matching as with `$`).
queryIds <- df2[["entrezgene"]]
selectedRows <- df1[["ID.Interactor.A"]] %in% queryIds |
  df1[["ID.Interactor.B"]] %in% queryIds

# Subset the full HIPPIE table, keeping all of its columns ----
dfReduced <- df1[selectedRows, ]
dim(dfReduced) # dimensions of the filtered table
head(dfReduced[, 1:4], 10) # up to 10 rows, first 4 columns

#dfReduced ## have a look at the result.
## class(dfReduced)

#write.table(dfReduced, file="Giorgini2005_Hip_Interactns.txt", sep="\t", col.names = NA) ### export file in text format to the folder.

sessionInfo()




ID.Interactor.A,ID.Interactor.B,Alt.IDs.Interactor.A,Alt.IDs.Interactor.B
216,216,AL1A1_HUMAN,AL1A1_HUMAN
3679,1134,ITA7_HUMAN,ACHA_HUMAN
55607,71,NEB1_HUMAN,ACTG_HUMAN
5552,960,SRGN_HUMAN,CD44_HUMAN
2886,2064,GRB7_HUMAN,ERBB2_HUMAN
5058,2064,PAK1_HUMAN,ERBB2_HUMAN
1742,2064,DLG4_HUMAN,ERBB2_HUMAN
5296,2064,P85B_HUMAN,ERBB2_HUMAN
26469,2064,PTN18_HUMAN,ERBB2_HUMAN
55914,2064,LAP2_HUMAN,ERBB2_HUMAN


Unnamed: 0,ID.Interactor.A,ID.Interactor.B,Alt.IDs.Interactor.A,Alt.IDs.Interactor.B
502,1822,64599,ATN1_HUMAN,PERQ1_HUMAN
1901,5578,8721,KPCA_HUMAN,EDF1_HUMAN
2668,8721,6256,EDF1_HUMAN,RXRA_HUMAN
3108,8721,2516,EDF1_HUMAN,STF1_HUMAN
5780,8721,6872,EDF1_HUMAN,TAF1_HUMAN
6096,8721,6908,EDF1_HUMAN,TBP_HUMAN
8958,8721,5468,EDF1_HUMAN,PPARG_HUMAN
9003,64599,2887,PERQ1_HUMAN,GRB10_HUMAN
10923,8721,801,EDF1_HUMAN,CALM_HUMAN
13969,2494,8721,NR5A2_HUMAN,EDF1_HUMAN


R version 3.3.1 (2016-06-21)
Platform: x86_64-w64-mingw32/x64 (64-bit)
Running under: Windows 10 x64 (build 14393)

locale:
[1] LC_COLLATE=English_United States.1252 
[2] LC_CTYPE=English_United States.1252   
[3] LC_MONETARY=English_United States.1252
[4] LC_NUMERIC=C                          
[5] LC_TIME=English_United States.1252    

attached base packages:
[1] stats     graphics  grDevices utils     datasets  methods   base     

loaded via a namespace (and not attached):
 [1] R6_2.2.0            magrittr_1.5        IRdisplay_0.4.4    
 [4] pbdZMQ_0.2-5        tools_3.3.1         crayon_1.3.2       
 [7] uuid_0.1-2          stringi_1.1.5       IRkernel_0.8.6.9000
[10] jsonlite_1.4        stringr_1.2.0       digest_0.6.12      
[13] repr_0.12.0         evaluate_0.10      

#### Chatterjee et al_2013

In [3]:
##################################################################
## HIPPIE dataset subset with Chatterjee2013 - human orthologs ###
##################################################################

# Purpose: keep every HIPPIE interaction (df1) in which at least one of the
# two interactors (ID.Interactor.A or ID.Interactor.B) carries an Entrez Gene
# ID listed in the query table (df2$entrezgene).
#   toy example: df1 <- data.frame(A = sample(1:10, 10), B = sample(1:10, 10))
#                df2 <- data.frame(C = 1:5)
#                df1[df1$A %in% df2$C | df1$B %in% df2$C, ]

# Input files are read relative to this folder; the (commented-out) export at
# the bottom of the cell would be written here as well.
path <- "C:/Users/Sonali/Box Sync/Huntington Interactome/MutantHTT_Interactors/Yeast/MutantHttSuppressors_green"
setwd(path)

# Read the HIPPIE dataset ----
df1 <- read.delim(file = "HIPPIE_lastupdated090514_cleaned.txt", header = TRUE, sep = "\t")

# A missing ID column would make `$` return NULL and the filter below would
# silently select nothing, so stop with an explicit message instead.
if (!all(c("ID.Interactor.A", "ID.Interactor.B") %in% names(df1))) {
  stop("HIPPIE table must contain columns 'ID.Interactor.A' and 'ID.Interactor.B'",
       call. = FALSE)
}

# Preview: up to 10 rows of the first 4 columns. head() never pads the
# preview with NA rows when the table is shorter than 10 rows.
head(df1[, 1:4], 10)

# Read the query table holding the Entrez Gene IDs of the human orthologs ----
df2 <- read.delim(file = "ChatterjeeHumanOrthologs.txt", header = TRUE, sep = "\t")

if (!("entrezgene" %in% names(df2))) {
  stop("Ortholog table must contain a column named 'entrezgene'", call. = FALSE)
}

dim(df1)
dim(df2)

# Row filter ----
# Logical vector with one entry per HIPPIE row: TRUE when interactor A OR
# interactor B is found among the query Entrez IDs. `[[` is used so that the
# column names are matched exactly (no partial matching as with `$`).
queryIds <- df2[["entrezgene"]]
selectedRows <- df1[["ID.Interactor.A"]] %in% queryIds |
  df1[["ID.Interactor.B"]] %in% queryIds

# Subset the full HIPPIE table, keeping all of its columns ----
dfReduced <- df1[selectedRows, ]
dim(dfReduced) # dimensions of the filtered table
head(dfReduced[, 1:4], 10) # up to 10 rows, first 4 columns

#dfReduced ## have a look at the result.
## class(dfReduced)

#write.table(dfReduced, file="Chatterjee2013_Hip_Interactns.txt", sep="\t", col.names = NA) ### export file in text format to the folder.

sessionInfo()




ID.Interactor.A,ID.Interactor.B,Alt.IDs.Interactor.A,Alt.IDs.Interactor.B
216,216,AL1A1_HUMAN,AL1A1_HUMAN
3679,1134,ITA7_HUMAN,ACHA_HUMAN
55607,71,NEB1_HUMAN,ACTG_HUMAN
5552,960,SRGN_HUMAN,CD44_HUMAN
2886,2064,GRB7_HUMAN,ERBB2_HUMAN
5058,2064,PAK1_HUMAN,ERBB2_HUMAN
1742,2064,DLG4_HUMAN,ERBB2_HUMAN
5296,2064,P85B_HUMAN,ERBB2_HUMAN
26469,2064,PTN18_HUMAN,ERBB2_HUMAN
55914,2064,LAP2_HUMAN,ERBB2_HUMAN


Unnamed: 0,ID.Interactor.A,ID.Interactor.B,Alt.IDs.Interactor.A,Alt.IDs.Interactor.B
2731,6780,6194,STAU1_HUMAN,RS6_HUMAN
2732,5062,6194,PAK2_HUMAN,RS6_HUMAN
2733,6198,6194,KS6B1_HUMAN,RS6_HUMAN
2754,817,6222,KCC2D_HUMAN,RS18_HUMAN
2757,51194,6136,IPO11_HUMAN,RL12_HUMAN
2773,6780,6175,STAU1_HUMAN,RLA0_HUMAN
9901,6147,3843,RL23A_HUMAN,IPO5_HUMAN
9902,3843,6137,IPO5_HUMAN,RL13_HUMAN
11340,6147,3842,RL23A_HUMAN,TNPO1_HUMAN
12156,11033,6203,ADAP1_HUMAN,RS9_HUMAN


R version 3.3.1 (2016-06-21)
Platform: x86_64-w64-mingw32/x64 (64-bit)
Running under: Windows 10 x64 (build 14393)

locale:
[1] LC_COLLATE=English_United States.1252 
[2] LC_CTYPE=English_United States.1252   
[3] LC_MONETARY=English_United States.1252
[4] LC_NUMERIC=C                          
[5] LC_TIME=English_United States.1252    

attached base packages:
[1] stats     graphics  grDevices utils     datasets  methods   base     

loaded via a namespace (and not attached):
 [1] R6_2.2.0            magrittr_1.5        IRdisplay_0.4.4    
 [4] pbdZMQ_0.2-5        tools_3.3.1         crayon_1.3.2       
 [7] uuid_0.1-2          stringi_1.1.5       IRkernel_0.8.6.9000
[10] jsonlite_1.4        stringr_1.2.0       digest_0.6.12      
[13] repr_0.12.0         evaluate_0.10      

#### Willingham et al_2003
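Please note the working directory change: this cell reads its input files from the `MutantHttEnhancers_red` folder instead of `MutantHttSuppressors_green`.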

In [4]:
##################################################################
## HIPPIE dataset subset with Willingham2003 - human orthologs ###
##################################################################

# Purpose: keep every HIPPIE interaction (df1) in which at least one of the
# two interactors (ID.Interactor.A or ID.Interactor.B) carries an Entrez Gene
# ID listed in the query table (df2$entrezgene).
#   toy example: df1 <- data.frame(A = sample(1:10, 10), B = sample(1:10, 10))
#                df2 <- data.frame(C = 1:5)
#                df1[df1$A %in% df2$C | df1$B %in% df2$C, ]

# Input files are read relative to this folder; the (commented-out) export at
# the bottom of the cell would be written here as well.
path <- "C:/Users/Sonali/Box Sync/Huntington Interactome/MutantHTT_Interactors/Yeast/MutantHttEnhancers_red"
setwd(path)

# Read the HIPPIE dataset ----
df1 <- read.delim(file = "HIPPIE_lastupdated090514_cleaned.txt", header = TRUE, sep = "\t")

# A missing ID column would make `$` return NULL and the filter below would
# silently select nothing, so stop with an explicit message instead.
if (!all(c("ID.Interactor.A", "ID.Interactor.B") %in% names(df1))) {
  stop("HIPPIE table must contain columns 'ID.Interactor.A' and 'ID.Interactor.B'",
       call. = FALSE)
}

# Preview: up to 10 rows of the first 4 columns. head() never pads the
# preview with NA rows when the table is shorter than 10 rows.
head(df1[, 1:4], 10)

# Read the query table holding the Entrez Gene IDs of the human orthologs ----
df2 <- read.delim(file = "WillinghamHumanOrthologs.txt", header = TRUE, sep = "\t")

if (!("entrezgene" %in% names(df2))) {
  stop("Ortholog table must contain a column named 'entrezgene'", call. = FALSE)
}

dim(df1)
dim(df2)

# Row filter ----
# Logical vector with one entry per HIPPIE row: TRUE when interactor A OR
# interactor B is found among the query Entrez IDs. `[[` is used so that the
# column names are matched exactly (no partial matching as with `$`).
queryIds <- df2[["entrezgene"]]
selectedRows <- df1[["ID.Interactor.A"]] %in% queryIds |
  df1[["ID.Interactor.B"]] %in% queryIds

# Subset the full HIPPIE table, keeping all of its columns ----
dfReduced <- df1[selectedRows, ]
dim(dfReduced) # dimensions of the filtered table
head(dfReduced[, 1:4], 10) # up to 10 rows, first 4 columns

#dfReduced ## have a look at the result.
## class(dfReduced)

#write.table(dfReduced, file="Willingham2003_Hip_Interactns.txt", sep="\t", col.names = NA) ### export file in text format to the folder.

sessionInfo()



ID.Interactor.A,ID.Interactor.B,Alt.IDs.Interactor.A,Alt.IDs.Interactor.B
216,216,AL1A1_HUMAN,AL1A1_HUMAN
3679,1134,ITA7_HUMAN,ACHA_HUMAN
55607,71,NEB1_HUMAN,ACTG_HUMAN
5552,960,SRGN_HUMAN,CD44_HUMAN
2886,2064,GRB7_HUMAN,ERBB2_HUMAN
5058,2064,PAK1_HUMAN,ERBB2_HUMAN
1742,2064,DLG4_HUMAN,ERBB2_HUMAN
5296,2064,P85B_HUMAN,ERBB2_HUMAN
26469,2064,PTN18_HUMAN,ERBB2_HUMAN
55914,2064,LAP2_HUMAN,ERBB2_HUMAN


Unnamed: 0,ID.Interactor.A,ID.Interactor.B,Alt.IDs.Interactor.A,Alt.IDs.Interactor.B
19161,2937,2937,GSHB_HUMAN,GSHB_HUMAN
26002,2954,2937,MAAI_HUMAN,GSHB_HUMAN
59532,2597,2937,G3P_HUMAN,GSHB_HUMAN
60616,3661,2937,IRF3_HUMAN,GSHB_HUMAN
73670,27161,11136,AGO2_HUMAN,BAT1_HUMAN
77390,11136,7052,BAT1_HUMAN,TGM2_HUMAN
119413,8454,11136,CUL1_HUMAN,BAT1_HUMAN
119781,7013,2937,TERF1_HUMAN,GSHB_HUMAN
129361,2937,9601,GSHB_HUMAN,PDIA4_HUMAN
129394,2937,1155,GSHB_HUMAN,TBCB_HUMAN


R version 3.3.1 (2016-06-21)
Platform: x86_64-w64-mingw32/x64 (64-bit)
Running under: Windows 10 x64 (build 14393)

locale:
[1] LC_COLLATE=English_United States.1252 
[2] LC_CTYPE=English_United States.1252   
[3] LC_MONETARY=English_United States.1252
[4] LC_NUMERIC=C                          
[5] LC_TIME=English_United States.1252    

attached base packages:
[1] stats     graphics  grDevices utils     datasets  methods   base     

loaded via a namespace (and not attached):
 [1] R6_2.2.0            magrittr_1.5        IRdisplay_0.4.4    
 [4] pbdZMQ_0.2-5        tools_3.3.1         crayon_1.3.2       
 [7] uuid_0.1-2          stringi_1.1.5       IRkernel_0.8.6.9000
[10] jsonlite_1.4        stringr_1.2.0       digest_0.6.12      
[13] repr_0.12.0         evaluate_0.10      