## Environment
Using Kernel: `dan-dev-py312-r433`

-----

In [1]:
import sys
import os

# ##### SET SYS PATH TO WHERE THE SOURCE CODE IS. #####
# Note: This is not required if you are using the pip installed package.
#
# The checkout location can be overridden with the WORMCAT3_SRC environment
# variable so the notebook is not tied to a single machine; the original
# location is kept as the default so existing setups behave as before.
wormcat_dir = os.environ.get("WORMCAT3_SRC", "/Users/dan/Code/Python/wormcat3")

# Put the checkout first on sys.path exactly once: dropping any earlier copy
# before prepending keeps the list from growing each time this cell is re-run.
sys.path[:] = [wormcat_dir] + [entry for entry in sys.path if entry != wormcat_dir]

# The label says "Working directory", but the value printed is the source
# checkout added to sys.path, not the process's current working directory.
print("Working directory:", wormcat_dir)

Working directory: /Users/dan/Code/Python/wormcat3


In [2]:
# What Annotations are available by default?

import wormcat3
from wormcat3 import AnnotationsManager
# Report the package version first, then leave the list of bundled annotation
# files as the cell's last expression so the notebook displays it.
version_banner = "Wormcat3 {}".format(wormcat3.__version__)
print(version_banner)
AnnotationsManager.available_annotation_files()


Wormcat3 0.1.7


['ORF_only_v2_nov-11-2021.csv',
 'ahringer_v2_nov-11-2021.csv',
 'orfeome_v2_nov-11-2021.csv',
 'whole_genome_v2_nov-11-2021.csv']

In [3]:
# What PAdjustMethod(s) are available?

from wormcat3 import PAdjustMethod
# Collect every member of the PAdjustMethod enum and print the resulting list.
available_methods = [method for method in PAdjustMethod]
print(available_methods)

[<PAdjustMethod.BONFERRONI: 'bonferroni'>, <PAdjustMethod.FDR: 'fdr_bh'>]


-----
#### Stress-responsive and metabolic gene regulation are altered in low S-adenosylmethionine

**Compare**
- Low SAM, basal conditions (`whole_genome_v2` annotations)
- Low SAM, heat shock (`whole_genome_v2` annotations)


In [7]:
from wormcat3 import Wormcat, WormcatError, PAdjustMethod
from wormcat3 import constants as cs
from pathlib import Path

# Input/output locations for the low-SAM basal-conditions run.
# `derived_data_path` is reused by later cells in this notebook.
derived_data_path = Path("../derived_data/walker_lab")
input_data_path = derived_data_path.joinpath("low_sam_s009/basal_conditions")
output_analysis_path = "../analysis/walker_lab/low_sam"

# Configure the analysis against the whole-genome annotation list.
wormcat_settings = dict(
    working_dir_path=output_analysis_path,
    title="low_sam basal_conditions Whole Genome",
    annotation_file_name='whole_genome_v2_nov-11-2021.csv',
)
wormcat = Wormcat(**wormcat_settings)

# Run the batch over the input path with Bonferroni adjustment at 0.05,
# treating the gene identifiers as WormBase IDs.
batch_settings = dict(
    p_adjust_method=PAdjustMethod.BONFERRONI,
    p_adjust_threshold=0.05,
    gene_type=cs.GENE_TYPE_WORMBASE_ID,
)
wormcat.wormcat_batch(input_data_path, **batch_settings)

Analysis complete. Output can be found at ../analysis/walker_lab/low_sam/low_sam_basal_conditions_Whole_Genome_79223/sams-1_down_29527
Analysis complete. Output can be found at ../analysis/walker_lab/low_sam/low_sam_basal_conditions_Whole_Genome_79223/set-2_up_88943
Analysis complete. Output can be found at ../analysis/walker_lab/low_sam/low_sam_basal_conditions_Whole_Genome_79223/set-16_up_53933
Analysis complete. Output can be found at ../analysis/walker_lab/low_sam/low_sam_basal_conditions_Whole_Genome_79223/sams-1_up_65659
Analysis complete. Output can be found at ../analysis/walker_lab/low_sam/low_sam_basal_conditions_Whole_Genome_79223/set-2_down_44653
Analysis complete. Output can be found at ../analysis/walker_lab/low_sam/low_sam_basal_conditions_Whole_Genome_79223/set-16_down_11503
Analysis complete. Output can be found at ../analysis/walker_lab/low_sam/low_sam_basal_conditions_Whole_Genome_79223


In [8]:
from wormcat3 import Wormcat, WormcatError, PAdjustMethod
from wormcat3 import constants as cs

# Input/output locations for the low-SAM heat-shock run.
# Relies on `derived_data_path` defined in the basal-conditions cell.
input_data_path = derived_data_path.joinpath("low_sam_s012/heat_shock")
output_analysis_path = "../analysis/walker_lab/low_sam"

# NOTE(review): this title reads "low_sams" while the basal-conditions run uses
# "low_sam"; the recorded output shows the title is used in the output folder
# name, so confirm which spelling is intended before changing it.
run_title = "low_sams heat shock Whole Genome"
annotation_file = 'whole_genome_v2_nov-11-2021.csv'

wormcat = Wormcat(
    working_dir_path=output_analysis_path,
    title=run_title,
    annotation_file_name=annotation_file,
)

# Bonferroni adjustment at 0.05; gene identifiers are WormBase IDs.
batch_settings = {
    "p_adjust_method": PAdjustMethod.BONFERRONI,
    "p_adjust_threshold": 0.05,
    "gene_type": cs.GENE_TYPE_WORMBASE_ID,
}
wormcat.wormcat_batch(input_data_path, **batch_settings)

Analysis complete. Output can be found at ../analysis/walker_lab/low_sam/low_sams_heat_shock_Whole_Genome_50850/control_down_61015
Analysis complete. Output can be found at ../analysis/walker_lab/low_sam/low_sams_heat_shock_Whole_Genome_50850/sams-1_down_24414
Analysis complete. Output can be found at ../analysis/walker_lab/low_sam/low_sams_heat_shock_Whole_Genome_50850/control_up_65665
Analysis complete. Output can be found at ../analysis/walker_lab/low_sam/low_sams_heat_shock_Whole_Genome_50850/set-2_up_44605
Analysis complete. Output can be found at ../analysis/walker_lab/low_sam/low_sams_heat_shock_Whole_Genome_50850/set-16_up_18747
Analysis complete. Output can be found at ../analysis/walker_lab/low_sam/low_sams_heat_shock_Whole_Genome_50850/sams-1_up_73510
Analysis complete. Output can be found at ../analysis/walker_lab/low_sam/low_sams_heat_shock_Whole_Genome_50850/set-2_down_76008
Analysis complete. Output can be found at ../analysis/walker_lab/low_sam/low_sams_heat_shock_Whole

-----
#### S-adenosylmethionine synthases specify distinct H3K4me3 populations and gene expression patterns during heat stress

**Compare**
- CUT&Tag gene lists against `whole_genome_v2` annotations
- CUT&Tag gene lists against `ORF_only_v2` annotations

In [17]:
from wormcat3 import Wormcat, WormcatError, PAdjustMethod
from wormcat3 import constants as cs

# Input/output locations for the Cut and Tag run (whole-genome annotations).
# Relies on `derived_data_path` defined in an earlier cell.
input_data_path = derived_data_path.joinpath("cut_and_tag/cut_and_tag")
output_analysis_path = "../analysis/walker_lab/cut_and_tag"

wormcat_settings = dict(
    working_dir_path=output_analysis_path,
    title="Cut and Tag Whole Genome",
    annotation_file_name='whole_genome_v2_nov-11-2021.csv',
)
wormcat = Wormcat(**wormcat_settings)

# Bonferroni adjustment at 0.05; gene identifiers are WormBase IDs.
batch_settings = dict(
    p_adjust_method=PAdjustMethod.BONFERRONI,
    p_adjust_threshold=0.05,
    gene_type=cs.GENE_TYPE_WORMBASE_ID,
)
wormcat.wormcat_batch(input_data_path, **batch_settings)

Analysis complete. Output can be found at ../analysis/walker_lab/cut_and_tag/Cut_and_Tag_Whole_Genome_12112/control_37_41779
Analysis complete. Output can be found at ../analysis/walker_lab/cut_and_tag/Cut_and_Tag_Whole_Genome_12112/sams-1_37_78901
Analysis complete. Output can be found at ../analysis/walker_lab/cut_and_tag/Cut_and_Tag_Whole_Genome_12112/sams-4_15_29518
Analysis complete. Output can be found at ../analysis/walker_lab/cut_and_tag/Cut_and_Tag_Whole_Genome_12112/sams-1_15_12932
Analysis complete. Output can be found at ../analysis/walker_lab/cut_and_tag/Cut_and_Tag_Whole_Genome_12112/sams-4_37_29595
Analysis complete. Output can be found at ../analysis/walker_lab/cut_and_tag/Cut_and_Tag_Whole_Genome_12112/control_15_49041
Analysis complete. Output can be found at ../analysis/walker_lab/cut_and_tag/Cut_and_Tag_Whole_Genome_12112


In [18]:

# Same Cut and Tag inputs as the whole-genome run, analysed against the
# ORF-only annotation list. Relies on names (`derived_data_path`, `Wormcat`,
# `PAdjustMethod`, `cs`) brought into scope by earlier cells.
input_data_path = derived_data_path.joinpath("cut_and_tag/cut_and_tag")
output_analysis_path = "../analysis/walker_lab/cut_and_tag"

run_title = "Cut and Tag ORF Only"
annotation_file = 'ORF_only_v2_nov-11-2021.csv'

wormcat = Wormcat(
    working_dir_path=output_analysis_path,
    title=run_title,
    annotation_file_name=annotation_file,
)

# Bonferroni adjustment at 0.05; gene identifiers are WormBase IDs.
batch_settings = {
    "p_adjust_method": PAdjustMethod.BONFERRONI,
    "p_adjust_threshold": 0.05,
    "gene_type": cs.GENE_TYPE_WORMBASE_ID,
}
wormcat.wormcat_batch(input_data_path, **batch_settings)


Analysis complete. Output can be found at ../analysis/walker_lab/cut_and_tag/Cut_and_Tag_ORF_Only_43800/control_37_18712
Analysis complete. Output can be found at ../analysis/walker_lab/cut_and_tag/Cut_and_Tag_ORF_Only_43800/sams-1_37_08956
Analysis complete. Output can be found at ../analysis/walker_lab/cut_and_tag/Cut_and_Tag_ORF_Only_43800/sams-4_15_28319
Analysis complete. Output can be found at ../analysis/walker_lab/cut_and_tag/Cut_and_Tag_ORF_Only_43800/sams-1_15_86096
Analysis complete. Output can be found at ../analysis/walker_lab/cut_and_tag/Cut_and_Tag_ORF_Only_43800/sams-4_37_57374
Analysis complete. Output can be found at ../analysis/walker_lab/cut_and_tag/Cut_and_Tag_ORF_Only_43800/control_15_61660
Analysis complete. Output can be found at ../analysis/walker_lab/cut_and_tag/Cut_and_Tag_ORF_Only_43800


-----
#### WormCat: An Online Tool for Annotation and Visualization of Caenorhabditis elegans Genome-Scale Data 

**Compare**
- Random genes whole_genome_v2
- Random genes ORF_only_v2

In [14]:

from wormcat3 import Wormcat, WormcatError, PAdjustMethod
from wormcat3 import constants as cs

# Input/output locations for the random gene-list run (whole-genome annotations).
# Relies on `derived_data_path` defined in an earlier cell.
input_data_path = derived_data_path.joinpath("wc1_random/random")
output_analysis_path = "../analysis/walker_lab/random"

wormcat_settings = dict(
    working_dir_path=output_analysis_path,
    title="Random Whole Genome",
    annotation_file_name='whole_genome_v2_nov-11-2021.csv',
)
wormcat = Wormcat(**wormcat_settings)

# NOTE(review): the recorded run printed one "[801 INVALID_STATE] ... DataFrame
# empty or None" message while creating a bubble plot — presumably a random
# list with nothing passing the threshold; confirm this is expected.
batch_settings = dict(
    p_adjust_method=PAdjustMethod.BONFERRONI,
    p_adjust_threshold=0.05,
    gene_type=cs.GENE_TYPE_WORMBASE_ID,
)
wormcat.wormcat_batch(input_data_path, **batch_settings)

Analysis complete. Output can be found at ../analysis/walker_lab/random/Random_Whole_Genome_36216/random_1000_46238
Error: [801 INVALID_STATE] While creating bubble plot found DataFrame empty or None 
Analysis complete. Output can be found at ../analysis/walker_lab/random/Random_Whole_Genome_36216/random_500_63382
Analysis complete. Output can be found at ../analysis/walker_lab/random/Random_Whole_Genome_36216/random_100_05616
Analysis complete. Output can be found at ../analysis/walker_lab/random/Random_Whole_Genome_36216/random_1500_02134
Analysis complete. Output can be found at ../analysis/walker_lab/random/Random_Whole_Genome_36216


In [16]:

# Same random gene lists as the whole-genome run, analysed against the
# ORF-only annotation list. Relies on names (`derived_data_path`, `Wormcat`,
# `PAdjustMethod`, `cs`) brought into scope by earlier cells.
input_data_path = derived_data_path.joinpath("wc1_random/random")
output_analysis_path = "../analysis/walker_lab/random"

run_title = "Random ORF Only"
annotation_file = 'ORF_only_v2_nov-11-2021.csv'

wormcat = Wormcat(
    working_dir_path=output_analysis_path,
    title=run_title,
    annotation_file_name=annotation_file,
)

# NOTE(review): the recorded run printed repeated "[801 INVALID_STATE] ...
# DataFrame empty or None" messages while creating bubble plots — presumably
# random lists with nothing passing the threshold; confirm this is expected.
batch_settings = {
    "p_adjust_method": PAdjustMethod.BONFERRONI,
    "p_adjust_threshold": 0.05,
    "gene_type": cs.GENE_TYPE_WORMBASE_ID,
}
wormcat.wormcat_batch(input_data_path, **batch_settings)

Error: [801 INVALID_STATE] While creating bubble plot found DataFrame empty or None 
Error: [801 INVALID_STATE] While creating bubble plot found DataFrame empty or None 
Error: [801 INVALID_STATE] While creating bubble plot found DataFrame empty or None 
Analysis complete. Output can be found at ../analysis/walker_lab/random/Random_ORF_Only_30731/random_1000_41811
Error: [801 INVALID_STATE] While creating bubble plot found DataFrame empty or None 
Error: [801 INVALID_STATE] While creating bubble plot found DataFrame empty or None 
Error: [801 INVALID_STATE] While creating bubble plot found DataFrame empty or None 
Analysis complete. Output can be found at ../analysis/walker_lab/random/Random_ORF_Only_30731/random_500_02433
Error: [801 INVALID_STATE] While creating bubble plot found DataFrame empty or None 
Error: [801 INVALID_STATE] While creating bubble plot found DataFrame empty or None 
Error: [801 INVALID_STATE] While creating bubble plot found DataFrame empty or None 
Analysis com

-----
#### Defining characteristics and conservation of poorly annotated genes in Caenorhabditis elegans using WormCat 2.0

**Compare**
- Peptides whole_genome_v2
- Peptides ORF_only_v2


In [20]:
# Input/output locations for the peptides run (whole-genome annotations).
# Relies on names (`derived_data_path`, `Wormcat`, `PAdjustMethod`, `cs`)
# brought into scope by earlier cells.
input_data_path = derived_data_path.joinpath("wc2_peptides/peptides")
output_analysis_path = "../analysis/walker_lab/peptides"

wormcat_settings = dict(
    working_dir_path=output_analysis_path,
    title="Peptides Whole Genome",
    annotation_file_name='whole_genome_v2_nov-11-2021.csv',
)
wormcat = Wormcat(**wormcat_settings)

# Bonferroni adjustment at 0.05; gene identifiers are WormBase IDs.
batch_settings = dict(
    p_adjust_method=PAdjustMethod.BONFERRONI,
    p_adjust_threshold=0.05,
    gene_type=cs.GENE_TYPE_WORMBASE_ID,
)
wormcat.wormcat_batch(input_data_path, **batch_settings)

Analysis complete. Output can be found at ../analysis/walker_lab/peptides/Peptides_Whole_Genome_13762/cytoplasm_57125
Analysis complete. Output can be found at ../analysis/walker_lab/peptides/Peptides_Whole_Genome_13762/all_detected_peptides_33957
Analysis complete. Output can be found at ../analysis/walker_lab/peptides/Peptides_Whole_Genome_13762/aging_change_96936
Analysis complete. Output can be found at ../analysis/walker_lab/peptides/Peptides_Whole_Genome_13762


In [21]:
# Same peptide gene lists as the whole-genome run, analysed against the
# ORF-only annotation list. Relies on names (`derived_data_path`, `Wormcat`,
# `PAdjustMethod`, `cs`) brought into scope by earlier cells.
input_data_path = derived_data_path.joinpath("wc2_peptides/peptides")
output_analysis_path = "../analysis/walker_lab/peptides"

run_title = "Peptides ORF Only"
annotation_file = 'ORF_only_v2_nov-11-2021.csv'

wormcat = Wormcat(
    working_dir_path=output_analysis_path,
    title=run_title,
    annotation_file_name=annotation_file,
)

# Bonferroni adjustment at 0.05; gene identifiers are WormBase IDs.
batch_settings = {
    "p_adjust_method": PAdjustMethod.BONFERRONI,
    "p_adjust_threshold": 0.05,
    "gene_type": cs.GENE_TYPE_WORMBASE_ID,
}
wormcat.wormcat_batch(input_data_path, **batch_settings)

Analysis complete. Output can be found at ../analysis/walker_lab/peptides/Peptides_ORF_Only_98597/cytoplasm_20392
Analysis complete. Output can be found at ../analysis/walker_lab/peptides/Peptides_ORF_Only_98597/all_detected_peptides_91509
Analysis complete. Output can be found at ../analysis/walker_lab/peptides/Peptides_ORF_Only_98597/aging_change_25005
Analysis complete. Output can be found at ../analysis/walker_lab/peptides/Peptides_ORF_Only_98597
