This notebook summarizes the number of genes related to the metabolism of reactive oxygen/nitrogen species in the KEGG annotations that were found only in pieces that were increased in abundance in Crohn's disease (CD).

In [1]:
# Move the working directory up one level, presumably so that the relative
# "outputs/..." path used later in this notebook resolves (TODO confirm).
# Not idempotent: re-running this cell moves up one more directory each time.
setwd("..")

In [3]:
library(dplyr)
library(readr)
library(purrr)

In [11]:
# Lookup table mapping each KEGG ortholog identifier (`ko`) to its `definition`.
# NOTE(review): this is an absolute home-directory path, unlike the relative
# "outputs/..." path used later in the notebook -- confirm it resolves on the
# machine running this notebook.
# `FALSE` is spelled out because `F` is an ordinary, reassignable variable.
definitions <- read_csv("~/github/2020-ibd/inputs/kegg_ortholog_definitions.csv", show_col_types = FALSE)

In [12]:
# Preview the first six rows of the KO definition table.
definitions %>%
  head(n = 6L)

ko,definition
<chr>,<chr>
K00844,HK; hexokinase [EC:2.7.1.1]
K12407,GCK; glucokinase [EC:2.7.1.2]
K00845,glk; glucokinase [EC:2.7.1.2]
K01810,"GPI, pgi; glucose-6-phosphate isomerase [EC:5.3.1.9]"
K06859,"pgi1; glucose-6-phosphate isomerase, archaeal [EC:5.3.1.9]"
K13810,tal-pgi; transaldolase / glucose-6-phosphate isomerase [EC:2.2.1.2 5.3.1.9]


In [13]:
# Read every per-species *_distinct_ox_kos.tsv table, stack them into a single
# tibble, and attach the KEGG definition of each KO.
# The definitions table is reduced to one row per `ko` before joining: if a KO
# were listed more than once there, left_join() would repeat the matching rows
# of the stacked table and inflate every downstream row count.
# `FALSE` is spelled out because `F` is an ordinary, reassignable variable.
ox_kos <- Sys.glob("outputs/sgc_pangenome_catlases_corncob_annotation_analysis/*_distinct_ox_kos.tsv") %>%
  map_dfr(read_tsv, show_col_types = FALSE) %>%
  left_join(distinct(definitions, ko, .keep_all = TRUE), by = "ko")

In [14]:
# Preview the first six rows of the annotated KO table.
ox_kos %>%
  head(n = 6L)

dom_id,KEGG_ko,abundance,species,ko,source,definition
<dbl>,<chr>,<chr>,<chr>,<chr>,<chr>,<chr>
37940,ko:K00384,increased,s__Enterocloster-clostridioformis_A,K00384,10.1016/j.freeradbiomed.2019.03.032,"trxB, TRR; thioredoxin reductase (NADPH) [EC:1.8.1.9]"
59840,ko:K03386,increased,s__Enterocloster-clostridioformis_A,K03386,10.1016/j.freeradbiomed.2019.03.032,"PRDX2_4, ahpC; peroxiredoxin 2/4 [EC:1.11.1.24]"
59840,ko:K03386,increased,s__Enterocloster-clostridioformis_A,K03386,10.1016/j.freeradbiomed.2019.03.032,"PRDX2_4, ahpC; peroxiredoxin 2/4 [EC:1.11.1.24]"
71955,ko:K00384,increased,s__Enterocloster-clostridioformis_A,K00384,10.1016/j.freeradbiomed.2019.03.032,"trxB, TRR; thioredoxin reductase (NADPH) [EC:1.8.1.9]"
73059,ko:K00384,increased,s__Enterocloster-clostridioformis_A,K00384,10.1016/j.freeradbiomed.2019.03.032,"trxB, TRR; thioredoxin reductase (NADPH) [EC:1.8.1.9]"
83257,ko:K03386,increased,s__Enterocloster-clostridioformis_A,K03386,10.1016/j.freeradbiomed.2019.03.032,"PRDX2_4, ahpC; peroxiredoxin 2/4 [EC:1.11.1.24]"


In [15]:
# Number of rows in ox_kos for each combination of species, direction of
# abundance change, and KO (with its definition).
# count() groups, tallies, and returns an ungrouped tibble, so no leftover
# grouping is carried on the result; a preceding select() is unnecessary
# because only the counted columns and `n` are kept.
ox_kos %>%
  count(species, abundance, ko, definition)

species,abundance,ko,definition,n
<chr>,<chr>,<chr>,<chr>,<int>
s__Enterocloster-bolteae,increased,K00384,"trxB, TRR; thioredoxin reductase (NADPH) [EC:1.8.1.9]",14
s__Enterocloster-bolteae,increased,K03386,"PRDX2_4, ahpC; peroxiredoxin 2/4 [EC:1.11.1.24]",10
s__Enterocloster-bolteae,increased,K04565,"SOD1; superoxide dismutase, Cu-Zn family [EC:1.15.1.1]",10
s__Enterocloster-bolteae,increased,K05919,dfx; superoxide reductase [EC:1.15.1.2],4
s__Enterocloster-clostridioformis,increased,K00384,"trxB, TRR; thioredoxin reductase (NADPH) [EC:1.8.1.9]",11
s__Enterocloster-clostridioformis,increased,K03386,"PRDX2_4, ahpC; peroxiredoxin 2/4 [EC:1.11.1.24]",16
s__Enterocloster-clostridioformis,increased,K04565,"SOD1; superoxide dismutase, Cu-Zn family [EC:1.15.1.1]",15
s__Enterocloster-clostridioformis,increased,K05919,dfx; superoxide reductase [EC:1.15.1.2],4
s__Enterocloster-clostridioformis_A,increased,K00384,"trxB, TRR; thioredoxin reductase (NADPH) [EC:1.8.1.9]",12
s__Enterocloster-clostridioformis_A,increased,K03386,"PRDX2_4, ahpC; peroxiredoxin 2/4 [EC:1.11.1.24]",6


In [16]:
# Unique combinations of species, direction of abundance change, and KO
# (with its definition) present in ox_kos.
distinct(select(ox_kos, species, abundance, ko, definition))

species,abundance,ko,definition
<chr>,<chr>,<chr>,<chr>
s__Enterocloster-clostridioformis_A,increased,K00384,"trxB, TRR; thioredoxin reductase (NADPH) [EC:1.8.1.9]"
s__Enterocloster-clostridioformis_A,increased,K03386,"PRDX2_4, ahpC; peroxiredoxin 2/4 [EC:1.11.1.24]"
s__Enterocloster-clostridioformis_A,increased,K04565,"SOD1; superoxide dismutase, Cu-Zn family [EC:1.15.1.1]"
s__Enterocloster-clostridioformis_A,increased,K05919,dfx; superoxide reductase [EC:1.15.1.2]
s__Enterocloster-bolteae,increased,K03386,"PRDX2_4, ahpC; peroxiredoxin 2/4 [EC:1.11.1.24]"
s__Enterocloster-bolteae,increased,K00384,"trxB, TRR; thioredoxin reductase (NADPH) [EC:1.8.1.9]"
s__Enterocloster-bolteae,increased,K05919,dfx; superoxide reductase [EC:1.15.1.2]
s__Enterocloster-bolteae,increased,K04565,"SOD1; superoxide dismutase, Cu-Zn family [EC:1.15.1.1]"
s__Enterocloster-sp005845215,increased,K03386,"PRDX2_4, ahpC; peroxiredoxin 2/4 [EC:1.11.1.24]"
s__Enterocloster-sp005845215,increased,K05919,dfx; superoxide reductase [EC:1.15.1.2]


In [17]:
# Number of distinct KOs (with their definitions) per species and direction of
# abundance change.
# Rows are first collapsed to unique species/abundance/ko/definition
# combinations, then counted; count() returns an ungrouped tibble, so no
# leftover grouping is carried on the result.
ox_kos %>%
  distinct(species, abundance, ko, definition) %>%
  count(species, abundance)

species,abundance,n
<chr>,<chr>,<int>
s__Enterocloster-bolteae,increased,4
s__Enterocloster-clostridioformis,increased,4
s__Enterocloster-clostridioformis_A,increased,4
s__Enterocloster-sp005845215,increased,4
s__Ruminococcus_B-gnavus,decreased,2
s__Ruminococcus_B-gnavus,increased,3
