Skip to content

Commit

Permalink
add usher placements to summary
Browse files (browse the repository at this point in the history)
  • Loading branch information
Katherine Eaton authored and ktmeaton committed May 17, 2022
1 parent 0d0ffbd commit 943cde9
Show file tree
Hide file tree
Showing 2 changed files with 26 additions and 25 deletions.
12 changes: 9 additions & 3 deletions scripts/summary.sh
Original file line number Diff line number Diff line change
Expand Up @@ -20,8 +20,13 @@ while [[ $# -gt 0 ]]; do
  shift # past argument
  shift # past value
  ;;
- --usher)
- usher=$2
+ --usher-clades)
+ usher_clades=$2
  shift # past argument
  shift # past value
  ;;
+ --usher-placements)
+ usher_placements=$2
+ shift # past argument
+ shift # past value
+ ;;
Expand Down Expand Up @@ -76,7 +81,8 @@ sort_col="usher_subtree"
  csvtk cut -t -f "strain,${cols},clade,Nextclade_pango" ${nextclade} \
  | csvtk rename -t -f "clade" -n "Nextclade_clade" \
  | csvtk merge -t --na "NA" -f "strain" - ${sc2rf} \
- | csvtk merge -t -k --na "NA" -f "strain" - ${usher} \
+ | csvtk merge -t -k --na "NA" -f "strain" - ${usher_clades} \
+ | csvtk merge -t -k --na "NA" -f "strain" - ${usher_placements} \
  | csvtk merge -t -k --na "NA" -f "strain" - ${subtrees} \
  | csvtk sort -t -k "$sort_col" \
  | csvtk mutate2 -t -n "ncov-recombinant_version" -e "\"$ncov_recombinant_ver\"" \
Expand Down
39 changes: 17 additions & 22 deletions workflow/Snakefile
Original file line number Diff line number Diff line change
Expand Up @@ -351,13 +351,12 @@ rule sc2rf:
  debug_csv = "results/{build}/sc2rf_debug.csv",
  debug_tsv = "results/{build}/sc2rf_debug.tsv",
  params:
- clades = lambda wildcards: " ".join(config["builds"][wildcards.build]["sc2rf"]["clades"]),
- primers = lambda wildcards: config["builds"][wildcards.build]["sc2rf"]["primers"],
- primers_name = lambda wildcards: config["builds"][wildcards.build]["sc2rf"]["primers_name"],
- sc2rf_args = lambda wildcards: config["builds"][wildcards.build]["sc2rf"]["sc2rf_args"],
- debug_args = lambda wildcards: config["builds"][wildcards.build]["sc2rf"]["debug_args"],
+ clades = lambda wildcards: " ".join(config["builds"][wildcards.build]["sc2rf"]["clades"]),
+ mutation_threshold = lambda wildcards: config["builds"][wildcards.build]["sc2rf"]["mutation_threshold"],
+ sc2rf_args = lambda wildcards: config["builds"][wildcards.build]["sc2rf"]["sc2rf_args"],
+ debug_args = lambda wildcards: config["builds"][wildcards.build]["sc2rf"]["debug_args"],
  max_name_length = lambda wildcards: config["builds"][wildcards.build]["sc2rf"]["max_name_length"],
- outdir = lambda wildcards: "results/{build}".format(build=wildcards.build),
+ outdir = lambda wildcards: "results/{build}".format(build=wildcards.build),
  threads: 1
  resources:
  cpus = 1,
Expand All @@ -368,12 +367,6 @@ rule sc2rf:
  debug = "logs/{rule}/{{build}}_debug_{today}.log".format(today=today, rule=rule_name),
  shell:
  """
- # Check if we're using primers
- primers_flag=""
- if [[ "{params.primers}" ]]; then
- primers_flag="--primers {params.primers} --primers-name {params.primers_name}"
- fi
  # Regular Parameters
  bash scripts/sc2rf.sh \
  --aligned {input.aligned} \
Expand All @@ -382,7 +375,7 @@ rule sc2rf:
  --log {log.regular} \
  --max-name-length {params.max_name_length} \
  --clades "{params.clades}" \
- ${{primers_flag}} \
+ --mutation-threshold {params.mutation_threshold} \
  {params.sc2rf_args};
  # Debugging Parameters
Expand All @@ -393,7 +386,7 @@ rule sc2rf:
  --log {log.debug} \
  --max-name-length {params.max_name_length} \
  --clades "{params.clades}" \
- ${{primers_flag}} \
+ --mutation-threshold {params.mutation_threshold} \
  {params.debug_args};
  """

Expand Down Expand Up @@ -686,13 +679,14 @@ rule summary:
  """
  message: "{wildcards.build} | Summarizing results from various tools."
  input:
- nextclade = "results/{build}/nextclade.metadata.tsv",
- sc2rf = "results/{build}/sc2rf.recombinants.tsv",
- usher = "results/{build}/usher.clades.tsv",
- subtrees = "results/{build}/subtrees_collapse/metadata.tsv",
- usher_ver = lambda wildcards: "data/{base_input}/version.txt".format(
- base_input=config["builds"][wildcards.build]["base_input"]
- ),
+ nextclade = "results/{build}/nextclade.metadata.tsv",
+ sc2rf = "results/{build}/sc2rf.recombinants.tsv",
+ usher_clades = "results/{build}/usher.clades.tsv",
+ usher_placements = "results/{build}/usher.placement_stats.tsv",
+ subtrees = "results/{build}/subtrees_collapse/metadata.tsv",
+ usher_ver = lambda wildcards: "data/{base_input}/version.txt".format(
+ base_input=config["builds"][wildcards.build]["base_input"]
+ ),

  output:
  summary = "results/{build}/summary.tsv",
  bash scripts/summary.sh \
  --nextclade {input.nextclade} \
  --sc2rf {input.sc2rf} \
- --usher {input.usher} \
+ --usher-clades {input.usher_clades} \
+ --usher-placements {input.usher_placements} \
  --usher-dataset {input.usher_ver} \
  --subtrees {input.subtrees} \
  --cols {params.cols} \
Expand Down

0 comments on commit 943cde9

Please sign in to comment.