Permalink

Comparing changes

Choose two branches to see what’s changed or to start a new pull request. If you need to, you can also .

Open a pull request

Create a new pull request by comparing changes across two branches. If you need to, you can also .
...
Checking mergeability… Don’t worry, you can still create the pull request.
  • 1 commit
  • 6 files changed
  • 0 commit comments
  • 1 contributor
Commits on Apr 22, 2017
@vdauwera vdauwera Generic pre-processing workflows
	- One "uBAM to clean BAM"; one "uBAM to HaplotypeCaller GVCF"
	- Reference-agnostic (hg38 and b37 jsons provided)
	- Can be applied to exomes instead of genomes by swapping out intervals files
fd87f5a
@@ -0,0 +1,46 @@
+{
+ "##_COMMENT1": "SAMPLE NAME AND UNMAPPED BAMS",
+ "GenericPreProcessingToGVCFWorkflow.sample_name": "NA12878",
+ "GenericPreProcessingToGVCFWorkflow.base_file_name": "NA12878_20k.b37",
+ "GenericPreProcessingToGVCFWorkflow.flowcell_unmapped_bams": [
+ "gs://genomics-public-data/test-data/dna/wgs/hiseq2500/NA12878/H06HDADXX130110.1.ATCACGAT.20k_reads.bam",
+ "gs://genomics-public-data/test-data/dna/wgs/hiseq2500/NA12878/H06HDADXX130110.2.ATCACGAT.20k_reads.bam",
+ "gs://genomics-public-data/test-data/dna/wgs/hiseq2500/NA12878/H06JUADXX130110.1.ATCACGAT.20k_reads.bam"
+ ],
+ "GenericPreProcessingToGVCFWorkflow.final_gvcf_name": "NA12878_20k.b37.g.vcf.gz",
+ "GenericPreProcessingToGVCFWorkflow.unmapped_bam_suffix": ".bam",
+
+ "##_COMMENT2": "INTERVALS",
+ "GenericPreProcessingToGVCFWorkflow.calling_interval_list": "gs://gatk-legacy-bundles/b37/wgs_calling_regions.v1.interval_list",
+ "GenericPreProcessingToGVCFWorkflow.scattered_calling_intervals_list": "gs://gatk-legacy-bundles/b37/wgs_scattered_calling_intervals.txt",
+ "GenericPreProcessingToGVCFWorkflow.HaplotypeCaller.interval_padding": 0,
+
+ "##_COMMENT3": "REFERENCE FILES",
+ "GenericPreProcessingToGVCFWorkflow.ref_dict": "gs://gatk-legacy-bundles/b37/human_g1k_v37_decoy.dict",
+ "GenericPreProcessingToGVCFWorkflow.ref_fasta": "gs://gatk-legacy-bundles/b37/human_g1k_v37_decoy.fasta",
+ "GenericPreProcessingToGVCFWorkflow.ref_fasta_index": "gs://gatk-legacy-bundles/b37/human_g1k_v37_decoy.fasta.fai",
+ "GenericPreProcessingToGVCFWorkflow.ref_sa": "gs://gatk-legacy-bundles/b37/human_g1k_v37_decoy.fasta.sa",
+ "GenericPreProcessingToGVCFWorkflow.ref_amb": "gs://gatk-legacy-bundles/b37/human_g1k_v37_decoy.fasta.amb",
+ "GenericPreProcessingToGVCFWorkflow.ref_bwt": "gs://gatk-legacy-bundles/b37/human_g1k_v37_decoy.fasta.bwt",
+ "GenericPreProcessingToGVCFWorkflow.ref_ann": "gs://gatk-legacy-bundles/b37/human_g1k_v37_decoy.fasta.ann",
+ "GenericPreProcessingToGVCFWorkflow.ref_pac": "gs://gatk-legacy-bundles/b37/human_g1k_v37_decoy.fasta.pac",
+
+ "##_COMMENT4": "KNOWN SITES RESOURCES",
+ "GenericPreProcessingToGVCFWorkflow.dbSNP_vcf": "gs://gatk-legacy-bundles/b37/dbsnp_138.b37.vcf",
+ "GenericPreProcessingToGVCFWorkflow.dbSNP_vcf_index": "gs://gatk-legacy-bundles/b37/dbsnp_138.b37.vcf.idx",
+ "GenericPreProcessingToGVCFWorkflow.known_indels_sites_VCFs": [
+ "gs://gatk-legacy-bundles/b37/Mills_and_1000G_gold_standard.indels.b37.vcf"
+ ],
+ "GenericPreProcessingToGVCFWorkflow.known_indels_sites_indices": [
+ "gs://gatk-legacy-bundles/b37/Mills_and_1000G_gold_standard.indels.b37.vcf.idx"
+ ],
+
+ "##_COMMENT5": "DISK SIZES + PREEMPTIBLES",
+ "GenericPreProcessingToGVCFWorkflow.agg_small_disk": 200,
+ "GenericPreProcessingToGVCFWorkflow.agg_medium_disk": 300,
+ "GenericPreProcessingToGVCFWorkflow.agg_large_disk": 400,
+ "GenericPreProcessingToGVCFWorkflow.agg_preemptible_tries": 3,
+ "GenericPreProcessingToGVCFWorkflow.flowcell_small_disk": 100,
+ "GenericPreProcessingToGVCFWorkflow.flowcell_medium_disk": 200,
+ "GenericPreProcessingToGVCFWorkflow.preemptible_tries": 3
+}
@@ -0,0 +1,49 @@
+{
+ "##_COMMENT1": "SAMPLE NAME AND UNMAPPED BAMS",
+ "GenericPreProcessingToGVCFWorkflow.sample_name": "NA12878",
+ "GenericPreProcessingToGVCFWorkflow.base_file_name": "NA12878_20k.hg38",
+ "GenericPreProcessingToGVCFWorkflow.flowcell_unmapped_bams": [
+ "gs://genomics-public-data/test-data/dna/wgs/hiseq2500/NA12878/H06HDADXX130110.1.ATCACGAT.20k_reads.bam",
+ "gs://genomics-public-data/test-data/dna/wgs/hiseq2500/NA12878/H06HDADXX130110.2.ATCACGAT.20k_reads.bam",
+ "gs://genomics-public-data/test-data/dna/wgs/hiseq2500/NA12878/H06JUADXX130110.1.ATCACGAT.20k_reads.bam"
+ ],
+ "GenericPreProcessingToGVCFWorkflow.final_gvcf_name": "NA12878_20k.hg38.g.vcf.gz",
+ "GenericPreProcessingToGVCFWorkflow.unmapped_bam_suffix": ".bam",
+
+ "##_COMMENT2": "INTERVALS",
+ "GenericPreProcessingToGVCFWorkflow.calling_interval_list": "gs://genomics-public-data/resources/broad/hg38/v0/wgs_calling_regions.hg38.interval_list",
+ "GenericPreProcessingToGVCFWorkflow.scattered_calling_intervals_list": "gs://gatk-test-data/intervals/hg38_wgs_scattered_calling_intervals.txt",
+ "GenericPreProcessingToGVCFWorkflow.HaplotypeCaller.interval_padding": 0,
+
+ "##_COMMENT3": "REFERENCE FILES",
+ "GenericPreProcessingToGVCFWorkflow.ref_dict": "gs://genomics-public-data/resources/broad/hg38/v0/Homo_sapiens_assembly38.dict",
+ "GenericPreProcessingToGVCFWorkflow.ref_fasta": "gs://genomics-public-data/resources/broad/hg38/v0/Homo_sapiens_assembly38.fasta",
+ "GenericPreProcessingToGVCFWorkflow.ref_fasta_index": "gs://genomics-public-data/resources/broad/hg38/v0/Homo_sapiens_assembly38.fasta.fai",
+ "GenericPreProcessingToGVCFWorkflow.ref_alt": "gs://genomics-public-data/resources/broad/hg38/v0/Homo_sapiens_assembly38.fasta.64.alt",
+ "GenericPreProcessingToGVCFWorkflow.ref_sa": "gs://genomics-public-data/resources/broad/hg38/v0/Homo_sapiens_assembly38.fasta.64.sa",
+ "GenericPreProcessingToGVCFWorkflow.ref_amb": "gs://genomics-public-data/resources/broad/hg38/v0/Homo_sapiens_assembly38.fasta.64.amb",
+ "GenericPreProcessingToGVCFWorkflow.ref_bwt": "gs://genomics-public-data/resources/broad/hg38/v0/Homo_sapiens_assembly38.fasta.64.bwt",
+ "GenericPreProcessingToGVCFWorkflow.ref_ann": "gs://genomics-public-data/resources/broad/hg38/v0/Homo_sapiens_assembly38.fasta.64.ann",
+ "GenericPreProcessingToGVCFWorkflow.ref_pac": "gs://genomics-public-data/resources/broad/hg38/v0/Homo_sapiens_assembly38.fasta.64.pac",
+
+ "##_COMMENT4": "KNOWN SITES RESOURCES",
+ "GenericPreProcessingToGVCFWorkflow.dbSNP_vcf": "gs://genomics-public-data/resources/broad/hg38/v0/Homo_sapiens_assembly38.dbsnp138.vcf",
+ "GenericPreProcessingToGVCFWorkflow.dbSNP_vcf_index": "gs://genomics-public-data/resources/broad/hg38/v0/Homo_sapiens_assembly38.dbsnp138.vcf.idx",
+ "GenericPreProcessingToGVCFWorkflow.known_indels_sites_VCFs": [
+ "gs://genomics-public-data/resources/broad/hg38/v0/Mills_and_1000G_gold_standard.indels.hg38.vcf.gz",
+ "gs://genomics-public-data/resources/broad/hg38/v0/Homo_sapiens_assembly38.known_indels.vcf.gz"
+ ],
+ "GenericPreProcessingToGVCFWorkflow.known_indels_sites_indices": [
+ "gs://genomics-public-data/resources/broad/hg38/v0/Mills_and_1000G_gold_standard.indels.hg38.vcf.gz.tbi",
+ "gs://genomics-public-data/resources/broad/hg38/v0/Homo_sapiens_assembly38.known_indels.vcf.gz.tbi"
+ ],
+
+ "##_COMMENT5": "DISK SIZES + PREEMPTIBLES",
+ "GenericPreProcessingToGVCFWorkflow.agg_small_disk": 200,
+ "GenericPreProcessingToGVCFWorkflow.agg_medium_disk": 300,
+ "GenericPreProcessingToGVCFWorkflow.agg_large_disk": 400,
+ "GenericPreProcessingToGVCFWorkflow.agg_preemptible_tries": 3,
+ "GenericPreProcessingToGVCFWorkflow.flowcell_small_disk": 100,
+ "GenericPreProcessingToGVCFWorkflow.flowcell_medium_disk": 200,
+ "GenericPreProcessingToGVCFWorkflow.preemptible_tries": 3
+}
Oops, something went wrong.

No commit comments for this range