In [1]:
# infercnv v1.14.0
library(infercnv)
library(phylogram)
library(pheatmap)
library(ggsci)
library(scales)
library(ggplot2)
library(RColorBrewer)

In [18]:
# Color palettes (hex strings) for the plots in this notebook.

# 20 colors from the ggsci D3 "category20" palette followed by 8 extra colors.
color <- c(
  pal_d3("category20")(20),
  "#B52D73", "#4347B5", "#4FED28", "#402727",
  "#48959C", "#FC6262", "#4A9EFF", "#9E969E"
)

# Tissue palette; previously tried: c("#33a02c", "#e31a1c") and "#1f78b4".
tissue_color <- c("#2CA02CFF", "#E377C2FF")

# Noted alternative: c(pal_nejm("default")(8)[c(2, 1)])
celltype1_color <- c("#0072B5FF", "#D62728FF")

# celltype3 reuses the five celltype2 colors and appends two more.
celltype2_color <- c(
  "#9467BDFF", "#FF95A8FF", "#8AA600", "#46732EFF", "#D62728FF"
)
celltype3_color <- c(celltype2_color, "#FD7446FF", "#8A9197FF")
celltype4_color <- c("#20854EFF", "#008EA0FF", "#FF6F00FF", "#C71000FF")

# 19 colors; one is assigned per patient when the annotation maps are built.
patient_color <- c(
  "#FED439FF", "#8A9197FF", "#8A4198FF", "#D5E4A2FF", "#197EC0FF",
  "#FD7446FF", "#46732EFF", "#71D0F5FF", "#E377C2FF", "#075149FF",
  "#e60000", "#91331FFF", "#1A9993FF", "#ff80aa", "#D2AF81FF",
  "#370335FF", "#cc99ff", "#ff8000", "#59b300"
)

In [14]:
# Read the tab-separated count table: the first column supplies the row names
# (genes) and the header line supplies the column names (cells).
# `TRUE` is spelled out because `T` is an ordinary, reassignable variable.
gene_cts <- read.table(
  file = "00_gene_counts_12291genes.txt",
  header = TRUE, row.names = 1, sep = "\t"
)

In [15]:
# Convert the count table to a matrix and peek at its top-left 2 x 2 corner.
gene_cts <- as.matrix(gene_cts)
gene_cts[seq_len(2), seq_len(2)]

Unnamed: 0,CRC01_L1_Barcode01,CRC01_L1_Barcode02
MTCO1P12,0,1
MTATP8P1,0,0


In [17]:
# Build the infercnv object from the count matrix, the tab-delimited cell
# annotation file and the gene ordering file. The "-NT" group of each patient
# (CRC01-CRC05 and CRC07-CRC10) is passed as a reference group.
# NOTE(review): infercnv logs a warning at this step recommending
# `options(scipen = 100)` before running with analysis_mode = "subclusters".
infercnv_obj <- CreateInfercnvObject(
  raw_counts_matrix = gene_cts,
  annotations_file = "00_anno_crc_patient_tissue.txt",
  gene_order_file = "00_gene_ordering_file.txt",
  delim = "\t",
  ref_group_names = sprintf("CRC%02d-NT", c(1:5, 7:10))
)

INFO [2023-01-12 12:57:47] Parsing gene order file: 00_gene_ordering_file.txt
INFO [2023-01-12 12:57:47] Parsing cell annotations file: 00_anno_crc_patient_tissue.txt
INFO [2023-01-12 12:57:47] ::order_reduce:Start.
INFO [2023-01-12 12:57:48] .order_reduce(): expr and order match.
INFO [2023-01-12 12:57:48] ::process_data:order_reduce:Reduction from positional data, new dimensions (r,c) = 12291,1395 Total=180376311.780204 Min=0 Max=183513.5.
INFO [2023-01-12 12:57:48] num genes removed taking into account provided gene ordering list: 408 = 3.3195020746888% removed.
INFO [2023-01-12 12:57:48] -filtering out cells < 100 or > Inf, removing 0 % of cells
WARN [2023-01-12 12:57:48] Please use "options(scipen = 100)" before running infercnv if you are using the analysis_mode="subclusters" option or you may encounter an error while the hclust is being generated.
INFO [2023-01-12 12:57:49] validating infercnv_obj


In [18]:
# Slow step: run the infercnv pipeline; results are written to "patient_tissue".
infercnv_obj <- infercnv::run(
  infercnv_obj,
  out_dir = "patient_tissue",
  # Author's rule of thumb: cutoff = 1 works well for Smart-seq2,
  # cutoff = 0.1 works well for 10x Genomics.
  cutoff = 1,
  HMM = TRUE,
  denoise = TRUE,
  cluster_by_groups = TRUE
)

INFO [2023-01-12 12:58:16] ::process_data:Start
INFO [2023-01-12 12:58:16] Creating output path patient_tissue
INFO [2023-01-12 12:58:16] Checking for saved results.
INFO [2023-01-12 12:58:16] 

	STEP 1: incoming data

INFO [2023-01-12 12:58:22] 

	STEP 02: Removing lowly expressed genes

INFO [2023-01-12 12:58:22] ::above_min_mean_expr_cutoff:Start
INFO [2023-01-12 12:58:22] Removing 3661 genes from matrix as below mean expr threshold: 1
INFO [2023-01-12 12:58:23] validating infercnv_obj
INFO [2023-01-12 12:58:23] There are 8222 genes and 1395 cells remaining in the expr matrix.
INFO [2023-01-12 12:58:23] no genes removed due to min cells/gene filter
INFO [2023-01-12 12:58:28] 

	STEP 03: normalization by sequencing depth

INFO [2023-01-12 12:58:28] normalizing counts matrix by depth
INFO [2023-01-12 12:58:28] Computed total sum normalization factor as median libsize: 75190.134140
INFO [2023-01-12 12:58:29] Adding h-spike
INFO [2023-01-12 12:58:29] -hspike modeling of CRC01-NT
INFO [2

Centering and scaling data matrix

PC_ 1 
Positive:  CCNG1, ATP10B, HMMR, MAT2B, PTTG1, SLU7, WWC1, FABP6, RARS1, PWWP2A 
	   TTC1, UBLCP1, PANK3, CLINT1, C5orf52, RPL10P9, CYFIP2, SPDL1, MED7, RANBP17 
	   MRPL22, NPM1, FBXW11, CNOT8, STK10, FAXDC2, UBTD2, LARP1, SH3PXD2B, DUSP1 
Negative:  PSMG3, ELFN1-AS1, GTF2IRD1, GTF2I, CLIP2, RFC2, MAD1L1, EIF4H, RCC1L, CCL24 
	   RHBDD2, MDH2, GTF2IRD2B, MRM2, STYXL1, POM121C, HSPB1, TMEM120A, NSUN5P1, ZP3 
	   NUDT1, DTX2, LRRC61, RARRES2, ACTR3C, EIF3B, REPIN1, ATP6V0E2, GIMAP2, ZNF212 
PC_ 2 
Positive:  RNF185, SELENOM, SMTN, TUG1, LIMK2, DUSP18, PIK3IP1, SLC35E4, PATZ1, TCN2 
	   DRG1, PES1, SFI1, MTFP1, PISD, YWHAH, TBC1D10A, RTCB, ASCC2, FBXO7 
	   UQCR10, TIMP3, NIPSNAP1, LARGE1, ISX, THOC5, AP1B1, HMGXB4, EWSR1, TOM1 
Negative:  LY6G6D, CSNK2B, ABHD16A, GPANK1, LY6G6C, C6orf47, DDAH2, APOM, BAG6, CLIC1 
	   PRRC2A, MSH5, TNF, SAPCD1, NFKBIL1, VARS1, LSM2, DDX39B, HSPA1A, HSPA1B 
	   HCP5, SNHG32, NEU1, EHMT2, MICA, C2, CFB, HLA-B, NELFE

INFO [2023-01-12 13:12:36] define_signif_tumor_subclusters(), tumor: CRC02-PT


Centering and scaling data matrix

PC_ 1 
Positive:  FARP1, SLC15A1, STK24, UBAC2, IPO5, TM9SF2, RAP2A, CLYBL, PCCA-DT, MBNL2 
	   PCCA, OXGR1, GGACT, UGGT2, TMTC4, DNAJC3, TPP2, DNAJC3-DT, TEX30, TGDS 
	   SPRY2, BIVM, NDFIP2, RBM26, ERCC5, OBI1, MYCBP2, EFNB2, FBXL3, ARGLU1 
Negative:  NAXE, CCT3, GPATCH4, CRABP2, GLMP, ISG20L2, NCLN, ZNF77, TLE2, NFIC 
	   TLE5, ZNF57, TMEM79, SMIM24, THOP1, METTL25B, DOHH, SGTA, MFSD12, SLC39A3 
	   HMG20B, SMG5, APBA3, HDGF, MRPL54, GADD45B, FAM98C, PSMD8, KCNK6, EIF3K 
PC_ 2 
Positive:  ZNF586, ZNF419, ZNF587, ZNF552, ZNF749, ZNF274, TRAPPC2B, ZNF544, ERVK3-1, RPS5 
	   ZNF584, AURKAIP1, CCNL2, CPTP, MRPL20, ATAD3B, MRPL20-AS1, ATAD3A, SSU72, ZNF324 
	   INTS11, PUSL1, MIB2, UBE2J2, C1QTNF12, ZNF446, SDF4, SLC35E2B, C1orf159, SLC27A5 
Negative:  FASTKD2, EEF1B2, KLF7, CREB1, INO80D-AS2, METTL21A, ABI2, FHL3, UTP11, FZD5 
	   CYP20A1, NOP58, FAM117B, WDR12, MYCBP, SUMO1, CAP1, NBEAL1, MFSD2A, MYCL 
	   TMEM237, IDH1, RHBDL2, TRIT1, STRADB, PPIE, P

INFO [2023-01-12 13:12:37] define_signif_tumor_subclusters(), tumor: CRC03-PT


Centering and scaling data matrix

PC_ 1 
Positive:  LRRC49, THAP10, UACA, MYO9A, TLE3, PKM, DRAIC, PARP6, RPLP1, HEXA 
	   ARIH1, GLCE, BBS4, ANP32A, ADPGK, NEO1, CLN6, CD276, CALML4, PML 
	   PIAS1, UBL7, MAP2K5, CLK3, SERF2, AAGAB, MFAP1, GOLM2, ELL3, EIF3J-DT 
Negative:  SPAG7, PFN1, ZNF232, RABEP1, RNF167, SLC25A11, NUP88, MINK1, RPAIN, COA7 
	   PSMB6, DERL2, RPS13P2, MIS12, ECHDC2, PIMREG, SCP2, TM4SF5, TXNDC17, SLC1A7 
	   CXCL16, MED31, C17orf100, CPT2, XAF1, MEA1, MED11, KLHDC3, PPP2R5D, CNPY3 
PC_ 2 
Positive:  EMC9, PSME2, DCAF11, RNF31, IRF9, IPO4, PCK2, TM9SF1, DHRS4L2, CHMP4A 
	   DHRS4, MDP1, DHRS4-AS1, NEDD8, GMPR2, AP1G2, TINF2, THTPA, RABGGTA, NGDN 
	   PABPN1, DHRS1, BCL2L2-PABPN1, ADCY4, BCL2L2, RIPK3, KHNYN, C14orf119, SDR39U1, ACIN1 
Negative:  RPS9, LENG8, TSEN34, MBOAT7, TMC4, CDC42EP5, LENG1, TFPT, NDUFA3, MYADM 
	   NLRP2, ZNF331, RDH13, EPS8L1, ZNF761, TNNI3, EPN1, ZNF581, ZNF580, ZNF444 
	   PTPRH, ZNF524, ZSCAN5A, ISOC2, UBE2S, PPP6R1, ZNF160, TRAPPC2B, RP

INFO [2023-01-12 13:12:37] define_signif_tumor_subclusters(), tumor: CRC04-PT


Centering and scaling data matrix

PC_ 1 
Positive:  NUP37, WASHC3, PARPBP, HSP90B1, GNPTAB, C12orf73, CHPT1, ARL1, TDG, NFYB 
	   TXNRD1, GAS2L3, RPL18AP3, NOPCHAP1, SCYL2, WASHC4, APPL2, C12orf75, ACTR6, RIC8B 
	   TMEM263, MTERF2, CRY1, SLC25A3, PWP1, PRDM4, SART3, ISCU, CORO1C, TMPO 
Negative:  MRPL20-AS1, CCNL2, AURKAIP1, MRPL20, CPTP, ATAD3B, ATAD3A, INTS11, SSU72, PUSL1 
	   UBE2J2, C1QTNF12, SDF4, MIB2, C1orf159, SLC35E2B, ISG15, NOC2L, LINC01128, CDK11A 
	   NADK, GNB1, TMEM52, PRKCZ, FAAP20, RER1, PEX10, PANK4, TNFRSF14-AS1, TNFRSF14 
PC_ 2 
Positive:  PLA2G4C, SELENOW, NOP53, NAPA, KPTN, DHX34, INAFM1, SAE1, TMEM160, AP2S1 
	   SLC1A5, STRN4, WDR83, DHPS, WDR83OS, FBXW9, PRKD2, TRIR, CALM3, GET3 
	   HOOK2, PPP5C, JUNB, FOXA3, SYMPK, DMPK, SNRPD2, EML2, VASP, FOSB 
Negative:  CAVIN3, FHIP1B, TRIM5, TRIM3, TRIM34, ARFIP2, TIMM10B, RRP8, TRIM68, ILK 
	   TPP1, TAF10, MRPL17, ZNF215, PPFIBP2, TRIM21, CYB5R2, EIF3F, RPL27A, DENND2B 
	   AKIP1, TMEM9B, DENND5A, TMEM41B, IPO7, ZNF

INFO [2023-01-12 13:12:38] define_signif_tumor_subclusters(), tumor: CRC05-PT


Centering and scaling data matrix

PC_ 1 
Positive:  NUP107, RAP1B, CPM, CPSF6, MDM1, DYRK2, LYZ, TMBIM4, YEATS4, CCT2 
	   LEMD3, RAB3IP, GNS, CNOT2, TBK1, XPOT, SRGAP1, KICS2, PTPRR, RXYLT1 
	   TSPAN8, RPL14P1, ZFC3H1, USP15, THAP2, TMEM19, LRIG3, TBC1D15, ATXN7L3B, ATP23 
Negative:  PAK4, PAF1, MED29, ZFP36, RPS16, SUPT5H, TIMM50, FBL, PSMC4, EPS15L1 
	   AP1M1, SCAPER, ETFA, RCN2, TSPAN3, IDH3A, HMG20A, DNAJA4, YJU2, CCNF 
	   FAM32A, RNPS1, WDR61, ECI1, IREB2, E4F1, PGP, SIRT6, HSH2D, PSMA4 
PC_ 2 
Positive:  RPL6P27, LINC00668, NDUFV2, ANKRD12, TWSG1, RALBP1, PPP4R1, VAPA, APCDD1, NAPG 
	   CHMP1B, MPPE1, IMPA2, DOP1B, CBR3-AS1, MORC3, CBR1, PIGP, SETD4, TTC3 
	   RCAN1, AFG3L2, VPS26C, ETS2, SLC5A3, PSMG1, PSMG2, MRPS6, BRWD1, ATP5PO 
Negative:  STK10, FBXW11, UBTD2, SH3PXD2B, DUSP1, NPM1, RANBP17, ERGIC1, SPDL1, RPL26L1 
	   RPL10P9, PANK3, ATP6V0E1, RARS1, CREBRF, WWC1, BNIP1, MAT2B, BOD1, MSX2 
	   SFXN1, HMMR, THOC3, SIMC1, CCNG1, KIAA1191, NOP16, ATP10B, HIGD2A, CLTB 
PC_ 

INFO [2023-01-12 13:12:38] define_signif_tumor_subclusters(), tumor: CRC07-PT


Centering and scaling data matrix

PC_ 1 
Positive:  PIWIL4, ANKRD49, PANX1, MED17, MRE11, C11orf54, FUT4, TAF1D, CEP57, ENDOD1 
	   MTMR2, SRSF8, CWC15, CCDC82, SMCO4, JRKL, BIRC3, BIRC2, CHORDC1, TMEM123 
	   CTSC, MMP7, PRSS23, MMP1, DCUN1D5, ME3, CASP4, HIKESHI, EED, CASP5 
Negative:  PPT1, CAP1, RLF, ZMPSTE24-DT, ZMPSTE24, MFSD2A, SMAP2, MYCL, EXO5, MET 
	   CAPZA2, TES, STMP1, MTPN, NFYC, SMIM30, TRIT1, NUP205, TMEM168, IFRD1 
	   ST7, CREB3L2, ZNF277, CTPS1, CNOT4, DNAJB9, HBP1, PNPLA8, NAMPT, PPIE 
PC_ 2 
Positive:  SKA3, SAP18, IFT88, CRYL1, GJB2, ZMYM2, ZMYM5, CDC42EP2, DPF2, YWHAQ 
	   ADAM17, TAF1B, FRMD8, IAH1, KLF11, RRM2, HPCAL1, ODC1, CPSF3, NEAT1 
	   NOL10, PDIA6, SLC66A3, MALAT1, ITGB1BP1, PCID2, ROCK2, SCYL1, NUBP2, F10 
Negative:  MYOF, CEP55, BTAF1, FFAR4, PCGF5, RPP30, KIF20B, FRA10AC1, PANK1, IFIT3 
	   NOC3L, LIPA, CYP2C18, FAS, PDLIM1, SORBS1, STAMBPL1, TCTN3, ENTPD1-AS1, ANKRD22 
	   ZNF518A, BLNK, PTEN, RPL13AP5, LCOR, ATAD1, FRAT2, MINPP1, PGAM1, LINC00863 

INFO [2023-01-12 13:12:39] define_signif_tumor_subclusters(), tumor: CRC08-PT


Centering and scaling data matrix

PC_ 1 
Positive:  SLC46A3, SLC7A1, POMP, UBL3, URAD, HMGB1, CDX2, USPL1, PDX1, HSPH1 
	   POLR1D, N4BP2L1, N4BP2L2, MTIF3, PDS5B, GTF3A, STARD13, RASL11A, RFC3, ALG5 
	   RPL21, EXOSC8, USP12, SUPT20H, CDK8, UFM1, NHLRC3, RNF6, COG6, NUP58 
Negative:  HEXA, ARIH1, PARP6, BBS4, PKM, ADPGK, MYO9A, THAP10, NEO1, LRRC49 
	   CD276, UACA, TLE3, PML, DRAIC, UBL7, RPLP1, CLK3, GLCE, EDC3 
	   CSK, ANP32A, ULK3, CLN6, SCAMP2, CALML4, MPI, PIAS1, MAP2K5, FAM219B 
PC_ 2 
Positive:  CGGBP1, C3orf38, CHMP2B, PROS1, GBE1, NSUN3, STX19, ZNF717, RIOX2, CLDND1 
	   LINC00960, CPOX, CMSS1, FAM86DP, TBC1D23, PPP4R2, NIT2, TFG, SHQ1, TRMT10C 
	   RYBP, PCNP, FOXP1, ARL6IP5, ZBTB11, UBA3, RPL24, TMF1, NFKBIZ, PSMC1P1 
Negative:  GFER, NPW, NOXO1, SLC9A3R2, TBL3, NTHL1, SNHG19, TSC2, PKD1-AS1, TRAF7 
	   SNHG9, MLST8, PGP, RPS2, E4F1, ECI1, NDUFB10, RNPS1, CCNF, MSRB1 
	   ATP6V0C, FAHD1, AMDHD2, HAGH, PDPK1, NUBP2, SPSB3, MRPS34, NME3, JPT2 
PC_ 3 
Positive:  RARS1, PANK

INFO [2023-01-12 13:12:40] define_signif_tumor_subclusters(), tumor: CRC09-PT


Centering and scaling data matrix

PC_ 1 
Positive:  ANGPTL4, RAB11B, RPS28, ZNF317, HNRNPM, NDUFA7, ZNF266, CD320, ZNF426, TIMM44 
	   ZNF562, SNAPC2, ZNF846, TRAPPC5, FBXL12, STXBP2, UBL5, PET100, XAB2, PIN1 
	   PNPLA6, MCOLN1, SHFL, PEX11G, ARHGEF18, PPAN, SH2D3A, TRIP10, GPR108, EIF3G 
Negative:  PCCB, CEP63, ANAPC13, STAG1, NCK1, DBR1, ARMC8, CEP70, FAIM, PIK3CB 
	   MRPS22, CNIH1, GMFB, CGRRF1, CDKN3, BMP4, GCH1, GNPNAT1, MAPK1IP1L, PSMC6 
	   COPB2, ERO1A, LGALS3, DLGAP5, RTRAF, FBXO34, TMX1, KTN1, TMEM260, RBP2 
PC_ 2 
Positive:  PARP10, GRINA, OPLAH, EXOSC4, GPAA1, CYC1, SHARPIN, MAF1, HGH1, MROH1 
	   BOP1, HSF1, PSMC4, FBL, TIMM50, SUPT5H, RPS16, ZFP36, MED29, PAF1 
	   PAK4, MRPS12, TECR, DNAJB1, NDUFB7, GIPC1, PKN1, SARS2, DDX39A, RAD23A 
Negative:  SMARCA5, ANAPC10, USP38, ABCE1, INPP4B, SMAD1, ZNF330, LSM6, ELMOD2, TMEM184C 
	   SCOC, PRMT9, MGST2, LRBA, NDUFC1, ELF2, C4orf33, SCLT1, RPS3A, PGRMC2 
	   LARP1B, SH3D19, ABHD18, GATB, MFSD8, SPRY1, ARFIP1, NUDT6, TRIM2, KI

INFO [2023-01-12 13:12:40] define_signif_tumor_subclusters(), tumor: CRC10-PT


Centering and scaling data matrix

PC_ 1 
Positive:  NAMPT, HBP1, COG5, SYPL1, DUS4L, ATXN7L1, BCAP29, RINT1, PUS7, CBLL1-AS1 
	   SRPK2, CBLL1, KMT2E-AS1, DLD, KMT2E, ORC5, RCC1L, GTF2IRD2B, NSUN5P1, GTF2I 
	   GTF2IRD1, PSMC2, LAMB1, POM121C, CCL24, DNAJC2, CLIP2, PNPLA8, RHBDD2, PMPCB 
Negative:  GAR1, PITX2, LARP7, CAMK2D, UGT8, SNHG8, METTL14, SEC24D, USP53, FABP2 
	   ANXA5, EXOSC9, CCNA2, BBS7, KIAA1109, NUDT6, SPRY1, MFSD8, ABHD18, LARP1B 
	   PGRMC2, SCLT1, C4orf33, ELF2, NDUFC1, MGST2, SCOC, ELMOD2, ZNF330, INPP4B 
PC_ 2 
Positive:  TRAM1, NCOA2, LACTB2, CPA6, ARFGEF1, TERF1, COPS5, CSPP1, SNHG6, RPL7 
	   SGK3, RDH10, C8orf44, STAU2, RRS1, UBE2W, PDE7A, ELOC, MTFR1, PPP2CB 
	   FUT10, UBXN8, RBPMS, MAK16, DCTN6, GSR, GTF2E2, LINC01605, TMEM70, ARMC1 
Negative:  CEACAM6, RPS19, ARHGEF1, CEACAM5, DMAC2, B3GNT8, RABAC1, CEACAM7, BCKDHA, EXOSC5 
	   B9D2, ZNF574, CCDC97, DEDD2, HNRNPUL1, PAFAH1B3, CNFN, CEACAM1, CD177, LYPD3 
	   ETHE1, XRCC1, ZNF576, PLAUR, KCNN4, ZNF224, ZNF23

INFO [2023-01-12 13:12:41] define_signif_tumor_subclusters(), tumor: CRC01-NT


Centering and scaling data matrix

PC_ 1 
Positive:  LPAR2, ZNF101, PBX4, ZNF506, NDUFA13, GATAD2A, ZNF253, ZNF430, ZNF429, ZNF91 
	   ZNF675, RPSAP58, ZNF254, ZNF83, ZNF701, ZNF880, LINC00662, LINC02987, UQCRFS1, POP4 
	   TRIM4, AZGP1, CYP3A5, ZKSCAN1, ZNF655, ZSCAN21, FAM200A, ZNF3, ZNF394, COPS6 
Negative:  PRELID2, YIPF5, SH3RF2, ARHGAP26, SPRY4, LARS1, NDFIP1, RBM27, GNPDA1, RNF14 
	   TCERG1, DELE1, PCDH1, SPINK1, FCHSD1, RELL2, FBXO38, HDAC3, DIAPH1, TAF7 
	   HARS1, ZMAT2, HARS2, WDR55, IK, PCYOX1L, TMCO6, NDUFA2, CD14, SLC35A4 
PC_ 2 
Positive:  HMGB1P5, RPL15, NR1D2, SGO1, TOP2B, NGLY1, RAB5A, OXSM, TBC1D5, CMC1 
	   OXNAD1, AZI2, DPH3, ANKRD28, BTD, TGFBR2, HACL1, STT3B, EAF1, OSBPL10 
	   METTL6, GPD1L, CMTM8, CMTM7, CAPN7, CMTM6, RBSN, INPP1, MFSD6, HIBCH 
Negative:  RAMAC, SNHG21, C15orf40, WDR73, BTBD1, NMB, RPS17, SEC11A, UBE2Q2P2, PDE8A 
	   EFL1, AKAP13, STARD5, KLHL25, MRPL46, MESD, MRPS11, CEMIP, AEN, FAH 
	   ISG20, CYTOR, KRCC1, RMND5A, ZFAND6, ABHD2, FABP1, RNF1

INFO [2023-01-12 13:12:41] define_signif_tumor_subclusters(), tumor: CRC02-NT


Centering and scaling data matrix

PC_ 1 
Positive:  NLRP2, CDC42EP5, LENG8, RPS9, TSEN34, MBOAT7, TMC4, ZNF586, LENG1, TFPT 
	   NDUFA3, MYADM, ZNF552, ZNF331, ZNF761, ZNF816, ZNF160, ZNF468, ZNF28, TPT1 
	   ZNF587, ZNF600, ZNF83, EDN1, RPL15P3, TBC1D7, ADTRP, SIRT5, NEDD9, TPT1-AS1 
Negative:  SRSF4, EPB41, MECR, YTHDF2, PUM1, SNRNP40, ZCCHC17, FABP3, SERINC2, HDAC1 
	   LCK, MARCKSL1, EIF3I, TINAGL1, BSDC1, TMEM234, PEF1, ZBTB8A, IQCC, ZBTB8OS 
	   RBBP4, CCDC28B, PTP4A2, YARS1, TXLNA, KHDRBS1, KPNA6, TMEM39B, S100PBP, TMEM54 
PC_ 2 
Positive:  TGOLN2, TMSB10, CAPG, TRABD2A, PARTICL, SUCLG1, MAT2A, GGCX, VAMP8, VAMP5 
	   REG3A, RNF181, USP39, REG1A, C2orf68, REG1B, PTCD3, IMMT, GCFC2, MRPL35 
	   MRPL19, EVA1A, KDM3A, TMEM42, ZDHHC3, KIF15, KIAA1143, ZNF502, POLE4, EXOSC7 
Negative:  PSMD14, TANK, GCG, DPP4, IFIH1, ITGB6, GCA, GALNT3, LY75, CERS6 
	   MARCHF7, NOSTRIN, BAZ2B, SPC25, WDSUB1, TANC1, FASTKD1, PKP4, PPIG, ACVR1 
	   PHOSPHO2, FAM133DP, KLHL23, GPD2, SSB, NR4A2, METTL5

INFO [2023-01-12 13:12:42] define_signif_tumor_subclusters(), tumor: CRC03-NT


Centering and scaling data matrix

PC_ 1 
Positive:  SNX25, CFAP97, SLC25A4, IPPK, SUSD3, ACSL1, NINJ1, WNK2, CENPU, PRIMPOL 
	   CASP3, MAB21L4, GPR35, CAPN10, ANKMY1, COPS9, IRF2, RNPEPL1, NDUFA10, HES6 
	   TCF3, CDKN2AIP, SCAMP4, ILKAP, CSNK1G2, DCTD, BTBD2, MKNK2, SCLY, AGA 
Negative:  NCOA7, HDDC2, HINT3, TPD52L1, TRMT11, SMPDL3A, PKIB, CENPW, SERINC1, RNF146 
	   HSF2, ECHDC1, ASF1A, PTPRK, ARHGAP18, NUS1, TMEM200A, EPB41L2, GOPC, ZUP1 
	   RWDD1, TSPYL1, NT5DC1, HDAC2, MARCKS, YRDC, CDCA8, C1orf122, C1orf109, SF3A3 
PC_ 2 
Positive:  KRR1, PHLDA1, ATXN7L3B, NAP1L1, TBC1D15, INO80C, GALNT1, ZNF24, OSBPL8, ZNF271P 
	   C18orf21, TMEM19, RPRD1A, SLC39A6, ZNF397, PAWR, ELP2, THAP2, MAPRE2, TPGS2 
	   ZFC3H1, PPP1R12A, RNF138, PIK3C3, PSTPIP2, CCDC59, TSPAN8, SMAD7, ATP5F1A, HAUS1 
Negative:  TMEM208, NOL3, TPPP3, KIAA0895L, ELMO3, FBXL8, E2F4, HSD11B2, TRADD, CMTM4 
	   PHAF1, ATP6V0D1, DYNC1LI2, CKLF, CBFB, NAE1, TK2, CES3, LINC00920, CES2 
	   CA7, SLC38A7, RPS27AP16, CTCF, CIAO2

INFO [2023-01-12 13:12:42] define_signif_tumor_subclusters(), tumor: CRC04-NT


Centering and scaling data matrix

PC_ 1 
Positive:  TMEM52, PRKCZ, FAAP20, RER1, GNB1, PEX10, SLC35E2B, MIB2, PANK4, CDK11A 
	   NADK, TNFRSF14-AS1, GEMIN7, SSU72, TNFRSF14, PRXL2B, TRAPPC6A, MMEL1, ARHGEF16, TPRG1L 
	   ERCC2, ATAD3A, WRAP73, POLR1G, PLAUR, ERCC1, LRRC47, ZNF576, ATAD3B, FOSB 
Negative:  FZD6, SLC25A32, DCAF13, ATP5MC3, LNPK, ATF2, OXR1, H3P6, HOXD1, SCRN3 
	   CIR1, OLA1, MTX2, SP3, CDCA7, HNRNPA3, EIF3E, MAP3K20, UBR5-DT, NFE2L2 
	   ITGA6, AGPS, METAP1D, EMC2, RBM45, LRATD1, LNX1, PRKRA, FIP1L1, CHIC2 
PC_ 2 
Positive:  IL1B, IL1RN, BUB1, MIR4435-2HG, SLC20A1, MTLN, PAX8-AS1, NPHP1, BCL2L11, CHCHD5 
	   CBWD2, POLR1B, MALL, RABL2A, ZC3H8, ANAPC1, TMEM87B, SLC35F5, SOWAHC, DDX18 
	   SEPTIN10, CCDC93, CCDC138, INSIG2, STEAP3, RANBP2, C2orf76, GCC2, DBI, SULT1C2 
Negative:  MGME1, OVOL2, SNX5, KAT14, RRBP1, DSTN, SNRPB2, PET117, KIF16B, NDUFAF5 
	   ESF1, ZNF133, TASP1, BTBD3, JAG1, POLR3F, SLX4IP, MKKS, PLCB4, SEC23B 
	   TMX4, FERMT1, CRLS1, SMIM26, TRMT6, SHLD1, 

INFO [2023-01-12 13:12:42] define_signif_tumor_subclusters(), tumor: CRC05-NT


Centering and scaling data matrix

PC_ 1 
Positive:  RBBP4, S100PBP, YARS1, TMEM54, AK2, ZBTB8OS, AZIN2, ZBTB8A, PHC2, SMIM12 
	   BSDC1, GJB4, MARCKSL1, GJB3, HDAC1, TMEM35B, LCK, EIF3I, ZMYM6, TMEM234 
	   IQCC, CCDC28B, SFPQ, TXLNA, KIAA0319L, KPNA6, PSMB2, TMEM39B, KHDRBS1, AGO3 
Negative:  ZNF83, ZNF701, ZNF880, ZNF480, ZNF766, ZNF350, ZNF649, ZNF577, ETFB, KLK12 
	   KLK11, KLK10, KLK8, KLK7, FLJ42393, LPP, KLK6, RTP4, KLK1, ST6GAL1 
	   C19orf48, RFC4, JOSD2, EIF4A2, PCID2, EMC10, F10, ATAD3B, MCF2L, ATAD3A 
PC_ 2 
Positive:  TMEM123, MMP7, BIRC2, MMP1, DCUN1D5, BIRC3, CASP4, CASP5, JRKL, CASP1 
	   CARD16, AASDHPPT, CWF19L2, CCDC82, SLC35F2, CUL5, MTMR2, ACAT1, CEP57, POGLUT3 
	   ENDOD1, DDX10, FDX1, COLCA2, PPP2R1B, ALG9, FDXACB1, C11orf1, CRYAB, C11orf52 
Negative:  MRPL45, NPEPPSP1, HNF1B, CDK12, PPP1R1B, STARD3, PGAP3, ERBB2, MIEN1, GRB7 
	   GSDMB, MAP3K13, LIPH, TMEM41A, IGF2BP2, SENP2, EHHADH, TRA2B, VPS8, CLCN2 
	   EIF4G1, POLR2H, MAGEF1, PSMD2, TBCCD1, EPHB3, EEF1AKM

INFO [2023-01-12 13:12:43] define_signif_tumor_subclusters(), tumor: CRC07-NT


Centering and scaling data matrix

PC_ 1 
Positive:  NDUFA5, WASL, WASL-DT, FAM3C, POT1, ING3, GRM8, TSPAN12, LSM8, CFTR 
	   ST7, CAPZA2, MET, TES, SMIM30, TMEM168, IFRD1, ZNF277, DNAJB9, PNPLA8 
	   SF3B1, COQ10B, HSPD1, LAMB1, GTF3C3, SLC39A10, STK17B, HSPE1, NABP1, MOB4 
Negative:  DOLPP1, CRAT, PTPA, LINC00963, NTMT1, ASB6, PTGES, TOR1B, TOR1A, C9orf78 
	   USP20, ASS1, FUBP3, EXOSC2, ABL1, NUP214, POMT1, UCK1, MED27, SETX 
	   TTF1, GOSR2, DDX31, SPIB, POLD1, CDC27, NR1H2, GARIN5A, MYH14, VRK3 
PC_ 2 
Positive:  NR1H3, ACP2, SLC39A13, PSMC3, CELF1, NDUFS3, PTPMT1, KBTBD4, MTCH2, FNBP4 
	   DMAP1, ERI3, CCDC24, TMEM53, KIF2C, RPS8, B4GALT2, PLK3, NUP160, ATP6V0B 
	   EIF2B3, DPH2, HECTD3, PTPRF, TNKS1BP1, UROD, HPDL, HYI, MUTYH, SSRP1 
Negative:  GBA, SCAMP3, MTX1, FDPS, THBS3, RUSC1, MUC1, ASH1L, MSTO1, KRTCAP2 
	   YY1AP1, DAP3, GON4L, DPM3, KHDC4, RXFP4, SSR2, SLC50A1, LAMTOR2, RAB25 
	   LMNA, EFNA1, SEMA4A, MEF2A, PRC1, LINS1, SLCO3A1, RCCD1, LRRC28, MCTP2 
PC_ 3 
Positive:  

INFO [2023-01-12 13:12:43] define_signif_tumor_subclusters(), tumor: CRC08-NT


Centering and scaling data matrix

PC_ 1 
Positive:  F3, SLC44A3-AS1, SLC44A3, CNN3, ALG14, TLCD4, SNX7, SLC35A3, RPL7P9, RWDD3 
	   TRMT13, DBT, RTCA, EXTL2, SLC30A7, DPH5, DPH5-DT, RNPC3, AMY2B, PRMT6 
	   VAV3, SLC25A24, STXBP3, PRPF38B, HENMT1, GPSM2, CLCC1, TAF13, TMEM167B, SARS1 
Negative:  ATG13, AMBRA1, MDK, CREB3L1, MSRB1, NDUFB10, RPS2, FAHD1, HAGH, SNHG9 
	   NUBP2, JPT2, TBL3, CLCN7, SPSB3, NME3, LARGE2, C16orf91, MRPS34, GNPTG 
	   NOXO1, TSR3, UBE2I, TPSG1, PEX16, LMF1, GFER, CHTF18, RPUSD1, SNRNP25 
PC_ 2 
Positive:  ATG4D, KRI1, KEAP1, CDKN2D, SLC44A2, AP1M2, CDC37, ILF3-DT, TYK2, ILF3 
	   ICAM3, QTRT1, RAVER1, DNM2, FDX2, TMED1, ICAM1, YIPF2, TIMM29, SMARCA4 
	   ZNF627, ACP5, LDLR, ELOF1, ZNF823, ZNF69, ECSIT, DOCK6, PRKCSH, ZNF700 
Negative:  ANXA2, TPM1, VPS13C, LACTB, CIAO2A, RPS27L, DAPK2, SNX1, CA12, USP3 
	   HERC1, RPS3AP6, KCNE3, POLD3, LIPT2-AS1, PPIB, SLCO2B1, BNIP2, PGM2L1, ARRB1 
	   GTF2A2, GCNT3, UCP2, RPS3, KLHL35, MYO1E, GDPD5, SERPINH1, PAAF1, CCNB2 

INFO [2023-01-12 13:12:43] define_signif_tumor_subclusters(), tumor: CRC09-NT


Centering and scaling data matrix

PC_ 1 
Positive:  PLEKHB1, P2RY2, ATG16L2, STARD10, ARAP1, CLPB, INPPL1, FOLR1, ANAPC15, LAMTOR1 
	   NUMA1, RNF121, NADSYN1, DHCR7, CTTN, PPFIA1, FADD, LTO1, CCND1, LINC02747 
	   SLC39A3, MYEOV, TPCN2, GADD45B, IGHMBP2, NDUFAB1, COG8, LMNB2, MRPL21, VPS4A 
Negative:  RNF138, MAPRE2, DSG2, ZNF397, GALNT1, C18orf21, ZNF271P, INO80C, ZNF24, RPRD1A 
	   SLC39A6, DSC2, ELP2, SS18, TPGS2, PIK3C3, PSTPIP2, IMPACT, ATP5F1A, HAUS1 
	   OSBPL1A, HDHD2, LAMA3, IER3IP1, NPC1, SMAD7, RMC1, DYM, RIOK3, RPL17-C18orf32 
PC_ 2 
Positive:  PEX1, RBM48, CDC23, FAM13B, FAM133B, SMAD5, TGFBI, CDC25C, CXCL14, FAM53C 
	   HEPACAM2, MACROH2A1, KDM3B, PCBD2, EGR1, TXNDC15, VPS50, ETF1, C5orf24, BET1 
	   HSPA9, DDX46, PON2, ANKHD1-EIF4EBP3, SRA1, ANKHD1, ANKHD1-DT, CTNNA1, HBEGF, EIF4EBP3 
Negative:  CLUAP1, NAA60, DNASE1, ZNF174, PAM16, CREBBP, TRAP1, ZSCAN32, CORO7-PAM16, CORO7 
	   ZNF75A, ZNF263, DNAJA3, ZNF200, NMRAL1, IL32, HMOX2, BICDL2, CDIP1, THOC6 
	   MGRN1, HCFC

INFO [2023-01-12 13:12:44] define_signif_tumor_subclusters(), tumor: CRC10-NT


Centering and scaling data matrix

PC_ 1 
Positive:  ZNF552, ZNF586, ZNF587, ZNF419, ZNF274, ZNF749, ZNF544, TRAPPC2B, ERVK3-1, RPS5 
	   ZSCAN5A, ZNF584, ZNF324, ZNF444, ZNF577, ETFB, KLK12, ZNF649, KLK11, ZNF446 
	   EPN1, ZNF350, KLK10, ZNF766, KLK8, SLC27A5, ZNF480, KLK7, KLK6, ZNF880 
Negative:  SMIM30, TES, TMEM168, MET, IFRD1, CAPZA2, ZNF277, ST7, CFTR, ACAA2 
	   DNAJB9, MYO5B, LIPG, RPL17, ME2, MBD1, ELAC1, RPL17-C18orf32, CCDC68, TXNL1 
	   DYM, SMAD7, NARS1, IER3IP1, LSM8, HDHD2, HAUS1, ZNF271P, ZNF397, ZNF24 
PC_ 2 
Positive:  YTHDF2, TAF12, EPB41, ZCCHC17, SNHG12, SNRNP40, FABP3, MECR, PUM1, SRSF4 
	   TRNAU1AP, SERINC2, SNHG3, TINAGL1, RCC1, PHACTR4, PEF1, MED18, PTP4A2, SESN2 
	   ATP5IF1, KHDRBS1, DNAJC8, TMEM39B, EYA3, KPNA6, XKR8, TXLNA, SMPDL3B, RPA2 
Negative:  DCAF5, ACTN1, EXD2, ERH, ZFP36L1, SLC39A9, RAD51B, RDH11, SUSD6, VTI1B 
	   SRSF5, COX16, RPL7AP6, ARG2, SYNJ2BP, MED6, SIPA1L1, DCAF4, ZFYVE1, RBM25 
	   PSEN1, NUMB, ACOT2, PNMA1, ZNF410, COQ6, NFIB, TTC39B

INFO [2023-01-12 13:12:59] -mirroring for hspike
INFO [2023-01-12 13:12:59] define_signif_tumor_subclusters(p_val=0.1
INFO [2023-01-12 13:13:00] define_signif_tumor_subclusters(), tumor: spike_tumor_cell_CRC01-NT
INFO [2023-01-12 13:13:00] define_signif_tumor_subclusters(), tumor: spike_tumor_cell_CRC02-NT
INFO [2023-01-12 13:13:00] define_signif_tumor_subclusters(), tumor: spike_tumor_cell_CRC03-NT
INFO [2023-01-12 13:13:00] define_signif_tumor_subclusters(), tumor: spike_tumor_cell_CRC04-NT
INFO [2023-01-12 13:13:00] define_signif_tumor_subclusters(), tumor: spike_tumor_cell_CRC05-NT
INFO [2023-01-12 13:13:01] define_signif_tumor_subclusters(), tumor: spike_tumor_cell_CRC07-NT
INFO [2023-01-12 13:13:01] define_signif_tumor_subclusters(), tumor: spike_tumor_cell_CRC08-NT
INFO [2023-01-12 13:13:01] define_signif_tumor_subclusters(), tumor: spike_tumor_cell_CRC09-NT
INFO [2023-01-12 13:13:01] define_signif_tumor_subclusters(), tumor: spike_tumor_cell_CRC10-NT
INFO [2023-01-12 13:13:01] 

In [34]:
# Persist the processed infercnv object so the slow run need not be repeated.
saveRDS(
  object = infercnv_obj,
  file = "patient_tissue/00_infercnv_obj.rds"
)

# CNV heatmap using heatmap.3.R

In [4]:
# Reload the infercnv object saved after the run.
infercnv_obj <- readRDS(
  file = "patient_tissue/00_infercnv_obj.rds"
)

In [None]:
# Load the local script that supplies heatmap.3(), used for the plots below.
source(file = "./heatmap.3.R")

In [6]:
# Pull the expression matrix out of the infercnv object and transpose it so
# that rows are cells and columns are genes; then show its size and a corner.
res <- t(as.data.frame(slot(infercnv_obj, "expr.data")))
dim(res)
res[seq_len(2), seq_len(5)]

Unnamed: 0,LINC01128,NOC2L,ISG15,C1orf159,SDF4
CRC01_L1_Barcode01,1.175955,1.178252,1.181446,1.186522,1.189957
CRC01_L1_Barcode02,1.002464,1.002464,1.002464,1.002464,1.002464


In [7]:
# Gene ordering table (gene, chr, start, end), restricted to the genes present
# in `res` and arranged in the column order of `res`.
gene_order <- read.table(file = "00_gene_ordering_file.txt", header = FALSE)
colnames(gene_order) <- c("gene", "chr", "start", "end")
rownames(gene_order) <- gene_order$gene
gene_order <- gene_order[intersect(colnames(res), rownames(gene_order)), ]
# Running index of each gene; seq_len() stays empty (instead of c(1, 0)) when
# no gene is shared between the two tables.
gene_order$order <- seq_len(nrow(gene_order))
# Autosomes only, in karyotype order; any other chromosome label becomes NA.
gene_order$chr <- factor(gene_order$chr, levels = paste0("chr", 1:22))
# Sanity check (expected TRUE): identical() also catches a length mismatch,
# which `all(a == b)` would hide behind recycling.
identical(rownames(gene_order), colnames(res))
head(gene_order, 2)

Unnamed: 0_level_0,gene,chr,start,end,order
Unnamed: 0_level_1,<chr>,<fct>,<int>,<int>,<int>
LINC01128,LINC01128,chr1,825138,859446,1
NOC2L,NOC2L,chr1,944203,959309,2


In [8]:
# Replace the gene-name column labels of `res` with each gene's running index.
colnames(res) <- gene_order[["order"]]
head(res, n = 2)

Unnamed: 0,1,2,3,4,5,6,7,8,9,10,⋯,8213,8214,8215,8216,8217,8218,8219,8220,8221,8222
CRC01_L1_Barcode01,1.175955,1.178252,1.181446,1.186522,1.189957,1.194382,1.198764,1.20153,1.204647,1.205138,⋯,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464
CRC01_L1_Barcode02,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464,⋯,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464


In [11]:
# Load the annotated single-cell object (presumably a Seurat object, given the
# path and the `meta.data` slot) and take its per-cell metadata.
ont <- readRDS(
  file = "../02_RNA_seurat/01_RNA_2184_1395_tx/00_tx_2184_1395_hvg1000_PC1_25.rds"
)
meta <- ont@meta.data
# Sort cells by tissue, then cell type, then subtype, then patient.
meta <- meta[with(meta, order(Tissue, celltype1, celltype3, patient)), ]
head(meta, n = 2)
table(meta[["Tissue"]])

Unnamed: 0_level_0,orig.ident,nCount_RNA,nFeature_RNA,CellName,library,patient,library_sub,tissue,position,barcode,⋯,PC_2,tSNE_1,tSNE_2,nCount_GENE,nFeature_GENE,celltype1,celltype1_1,celltype1_2,celltype2,celltype3
Unnamed: 0_level_1,<fct>,<dbl>,<int>,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>,⋯,<dbl>,<dbl>,<dbl>,<dbl>,<int>,<fct>,<chr>,<chr>,<fct>,<fct>
CRC01_L1_Barcode01,CRC01,274730.8,6733,CRC01_L1_Barcode01,CRC01_L1,CRC01,L1,NT,T1,Barcode01,⋯,-17.8032495,-17.989282,-12.42012,274730.8,4661,Normal epithelium,NE,NE,Stem/TA,Stem/TA
CRC01_L1_Barcode05,CRC01,10177.8,711,CRC01_L1_Barcode05,CRC01_L1,CRC01,L1,NT,T1,Barcode05,⋯,0.3504461,5.427324,-11.93935,10177.8,545,Normal epithelium,NE,NE,Stem/TA,Stem/TA



Normal Tissue Primary Tumor 
          298          1097 

In [12]:
# Put the rows (cells) of `res` into the sorted order of the metadata table.
res <- res[meta[["CellName"]], ]
head(res, n = 2)

Unnamed: 0,1,2,3,4,5,6,7,8,9,10,⋯,8213,8214,8215,8216,8217,8218,8219,8220,8221,8222
CRC01_L1_Barcode01,1.175955,1.178252,1.181446,1.186522,1.189957,1.194382,1.198764,1.20153,1.204647,1.205138,⋯,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464
CRC01_L1_Barcode05,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464,⋯,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464,1.002464


In [42]:
# Row annotation table: one row per cell (named by CellName) carrying the
# patient, subtype, cell type and tissue labels taken from `meta`.
df_rlab <- with(meta, data.frame(
  row.names = CellName,
  Patient = patient,
  Subtype = celltype3,
  Cell_type = celltype1,
  Tissue = Tissue
))
head(df_rlab, n = 1)
# Cell counts per annotation value.
table(df_rlab[["Patient"]])
table(df_rlab[["Cell_type"]])
table(df_rlab[["Subtype"]])
table(df_rlab[["Tissue"]])

Unnamed: 0_level_0,Patient,Subtype,Cell_type,Tissue
Unnamed: 0_level_1,<chr>,<fct>,<fct>,<fct>
CRC01_L1_Barcode01,CRC01,Stem/TA,Normal epithelium,Normal Tissue



CRC01 CRC02 CRC03 CRC04 CRC05 CRC07 CRC08 CRC09 CRC10 
  165   122    91   100   164   275   132   204   142 


Normal epithelium      Cancer cells 
              374              1021 


               Stem/TA             Enterocyte        Immature Goblet 
                   186                     34                    117 
                Goblet           Stem/TA-like   Immature Goblet-like 
                    37                    826                    186 
Goblet/Enterocyte-like 
                     9 


Normal Tissue Primary Tumor 
          298          1097 

In [43]:
# Lookup tables pairing every annotation value with its display color.
# Values are listed in the order returned by names(table(...)).

# Take as many patient colors as there are patients rather than assuming
# exactly nine; fail early if the palette is too short.
patient_levels <- names(table(meta$patient))
stopifnot(length(patient_levels) <= length(patient_color))
map_Patient <- data.frame(
  Patient = patient_levels,
  Patient_colors = patient_color[seq_along(patient_levels)]
)
map_Subtype <- data.frame(
  Subtype = names(table(meta$celltype3)), Subtype_colors = celltype3_color
)
map_Cell_type <- data.frame(
  Cell_type = names(table(meta$celltype1)), Cell_type_colors = celltype1_color
)
map_Tissue <- data.frame(
  Tissue = names(table(meta$Tissue)), Tissue_colors = tissue_color
)

In [44]:
# Translate every annotation label in `df_rlab` into its color via the lookup
# tables, then transpose so that annotations are rows and cells are columns.
df_rlab_colors <- local({
  lookups <- list(
    Patient = map_Patient,
    Subtype = map_Subtype,
    Cell_type = map_Cell_type,
    Tissue = map_Tissue
  )
  recolored <- df_rlab
  for (field in names(lookups)) {
    lookup <- lookups[[field]]
    hit <- match(recolored[[field]], lookup[[field]])
    recolored[[field]] <- lookup[hit, paste0(field, "_colors")]
  }
  as.matrix(t(recolored))
})
df_rlab_colors

Unnamed: 0,CRC01_L1_Barcode01,CRC01_L1_Barcode05,CRC01_L1_Barcode09,CRC01_L1_Barcode10,CRC01_L1_Barcode17,CRC01_L1_Barcode21,CRC01_L1_Barcode22,CRC01_L1_Barcode30,CRC01_L1_Barcode31,CRC01_L1_Barcode33,⋯,CRC09_L4_CRC10_L2_Barcode93,CRC09_L3_CRC10_L1_Barcode15,CRC09_L3_CRC10_L1_Barcode17,CRC09_L3_CRC10_L1_Barcode31,CRC09_L4_CRC10_L2_Barcode21,CRC01_L3_Barcode13,CRC01_L3_Barcode31,CRC04_L1_CRC07_L2_Barcode09,CRC09_L4_CRC10_L2_Barcode82,CRC09_L4_CRC10_L2_Barcode24
Patient,#FED439FF,#FED439FF,#FED439FF,#FED439FF,#FED439FF,#FED439FF,#FED439FF,#FED439FF,#FED439FF,#FED439FF,⋯,#71D0F5FF,#E377C2FF,#E377C2FF,#E377C2FF,#E377C2FF,#FED439FF,#FED439FF,#D5E4A2FF,#71D0F5FF,#E377C2FF
Subtype,#9467BDFF,#9467BDFF,#9467BDFF,#9467BDFF,#9467BDFF,#9467BDFF,#9467BDFF,#9467BDFF,#9467BDFF,#9467BDFF,⋯,#FD7446FF,#FD7446FF,#FD7446FF,#FD7446FF,#FD7446FF,#8A9197FF,#8A9197FF,#8A9197FF,#8A9197FF,#8A9197FF
Cell_type,#0072B5FF,#0072B5FF,#0072B5FF,#0072B5FF,#0072B5FF,#0072B5FF,#0072B5FF,#0072B5FF,#0072B5FF,#0072B5FF,⋯,#D62728FF,#D62728FF,#D62728FF,#D62728FF,#D62728FF,#D62728FF,#D62728FF,#D62728FF,#D62728FF,#D62728FF
Tissue,#2CA02CFF,#2CA02CFF,#2CA02CFF,#2CA02CFF,#2CA02CFF,#2CA02CFF,#2CA02CFF,#2CA02CFF,#2CA02CFF,#2CA02CFF,⋯,#E377C2FF,#E377C2FF,#E377C2FF,#E377C2FF,#E377C2FF,#E377C2FF,#E377C2FF,#E377C2FF,#E377C2FF,#E377C2FF


In [23]:
# Distribution of all values in `res`, flattened to a plain numeric vector.
summary(as.vector(res, mode = "numeric"))

   Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
 0.5334  1.0025  1.0025  1.0110  1.0025  2.1926 

In [24]:
# Cap the upper tail at the mirror image of the minimum around 1, so that the
# value range fed to the heatmap is no wider above 1 than below it.
up_limit <- 2 - min(res)
res <- replace(res, which(res > up_limit), up_limit)

In [None]:
# Positions of the guide lines drawn over the heatmap.

# Number of genes per chromosome level (columns Var1 / Freq).
bin_len <- as.data.frame(table(gene_order$chr))

# Vertical lines: x = 4, then the cumulative gene count at the end of each
# chromosome.
# NOTE(review): the leading 4 (originally written `1 + 3`) presumably nudges
# the first line in from the left edge -- confirm.
v_lines <- c(4, cumsum(bin_len[["Freq"]]))

# Horizontal lines: half a row below the first row and above the last row.
h_lines <- c(0.5, nrow(res) + 0.5)

In [28]:
# 100-step diverging palette running from dark blue through near-white
# (two identical middle stops) to dark red.
# A simpler alternative once considered:
# colorRampPalette(c("blue", "white", "red"))(50)
palette_stops <- c(
  "#2166ac", "#4393c3", "#92c5de", "#d1e5f0",
  "#f7f7f7", "#f7f7f7",
  "#fddbc7", "#f4a582", "#d6604d", "#b2182b"
)
mycol <- colorRampPalette(palette_stops)(100)

In [None]:
# Heatmap without clustering: rows and columns keep the order of `res`.
pdf("1_heatmap_infercnv_nocluster.pdf", height = 10, width = 10)
# `finally` closes the PDF device even when heatmap.3() fails, so a failed run
# does not leave a dangling graphics device behind.
invisible(tryCatch(
  heatmap.3(
    res,
    col = mycol,
    Rowv = FALSE, Colv = FALSE, dendrogram = "none", scale = "none",
    # hclustfun=myclust, distfun=mydist,na.rm = TRUE,
    # revC = FALSE,
    RowSideColors = df_rlab_colors, RowSideColorsSize = 1.5, # keysize = 1,
    # Horizontal lines: bottom edge, separator after the cells of the second
    # celltype1 level, top edge. The separator gets the same half-row offset
    # as the two edges so it falls between rows rather than through a row.
    # NOTE(review): assumes heatmap.3 draws the last rows of `res` at the
    # bottom, as heatmap.2 does when Rowv = FALSE -- confirm.
    add.expr = abline(
      h = c(1 - 0.5, table(meta$celltype1)[2] + 0.5, dim(res)[1] + 0.5),
      v = v_lines
    ),
    labCol = FALSE, labRow = FALSE, margins = c(25, 4)
  ),
  finally = dev.off()
))

In [None]:
# Custom distance and clustering helpers handed to the heatmap function.

# Euclidean distance between the rows of `c`; returns a "dist" object.
mydist <- function(c) dist(x = c, method = "euclidean")
# Hierarchical clustering of the dissimilarities in `c` with the "ward.D"
# agglomeration method; returns an "hclust" object.
# NOTE(review): the hclust documentation points to "ward.D2" for Ward's
# criterion on unsquared distances; "ward.D" is kept to preserve results.
myclust <- function(c) hclust(d = c, method = "ward.D")

In [50]:
# Heatmap with hierarchical clustering of the rows (cells); columns keep the
# order of `res`. The value returned by heatmap.3() is kept in `p_out`.
pdf("1_heatmap_infercnv_cluster.pdf", height = 10, width = 10)
# `finally` closes the PDF device even when heatmap.3() fails, so a failed run
# does not leave a dangling graphics device behind.
p_out <- tryCatch(
  heatmap.3(
    res,
    col = mycol,
    # row clustering
    Rowv = TRUE, Colv = FALSE, dendrogram = "row", scale = "none",
    # clustering function
    hclustfun = myclust, distfun = mydist, na.rm = TRUE,
    # rev based on results
    revC = TRUE,
    # row annotation
    RowSideColors = df_rlab_colors, RowSideColorsSize = 1.5,
    # add chromosome lines
    add.expr = abline(h = h_lines, v = v_lines),
    labCol = FALSE, labRow = FALSE, margins = c(25, 4)
  ),
  finally = dev.off()
)