Skip to content

Commit

Permalink
Add Proteomics datatypes proBAM and proBED
Browse files (browse the repository at this point in the history)
Add datatypes proBAM and proBED for genomic alignment and annotation of
proteomic analysis results.
  • Loading branch information
jj-umn committed Jan 22, 2018
1 parent 3ae47e6 commit 007e3cc
Show file tree
Hide file tree
Showing 3 changed files with 16 additions and 0 deletions.
2 changes: 2 additions & 0 deletions config/datatypes_conf.xml.sample
Original file line number Diff line number Diff line change
Expand Up @@ -20,6 +20,7 @@
<converter file="bam_to_bigwig_converter.xml" target_datatype="bigwig"/>
<converter file="bam_native_to_bam_converter.xml" target_datatype="bam"/>
</datatype>
<datatype extension="probam" type="galaxy.datatypes.binary:ProBam" mimetype="application/octet-stream" display_in_upload="true"/>
<datatype extension="cram" type="galaxy.datatypes.binary:CRAM" mimetype="application/octet-stream" display_in_upload="true" description="CRAM is a file format for highly efficient and tunable reference-based compression of alignment data." description_url="http://www.ebi.ac.uk/ena/software/cram-usage">
<converter file="cram_to_bam_converter.xml" target_datatype="bam"/>
</datatype>
Expand All @@ -40,6 +41,7 @@
<datatype extension="bed6" type="galaxy.datatypes.interval:Bed6" display_in_upload="true">
</datatype>
<datatype extension="bed12" type="galaxy.datatypes.interval:Bed12" display_in_upload="true"/>
<datatype extension="probed" type="galaxy.datatypes.interval:ProBed" display_in_upload="true"/>
<datatype extension="len" type="galaxy.datatypes.chrominfo:ChromInfo" display_in_upload="true">
<converter file="len_to_linecount.xml" target_datatype="linecount" />
</datatype>
Expand Down
7 changes: 7 additions & 0 deletions lib/galaxy/datatypes/binary.py
Original file line number Diff line number Diff line change
Expand Up @@ -489,6 +489,13 @@ def samtools_dataprovider(self, dataset, **settings):
return dataproviders.dataset.SamtoolsDataProvider(dataset_source, **settings)


class ProBam(Bam):
    """BAM binary datatype specialised for proteomics data (proBAM)."""

    # File extension associated with this datatype.
    file_ext = "probam"
    # EDAM ontology identifiers for the data and the format.
    edam_data = "data_0863"
    edam_format = "format_3826"


class CRAM(Binary):
file_ext = "cram"
edam_format = "format_3462"
Expand Down
7 changes: 7 additions & 0 deletions lib/galaxy/datatypes/interval.py
Original file line number Diff line number Diff line change
Expand Up @@ -572,6 +572,13 @@ def sniff(self, filename):
return False


class ProBed(Bed):
    """Tab-delimited proBED data: a variant of BED adapted for proteomics data."""

    # File extension associated with this datatype.
    file_ext = "probed"
    # EDAM ontology identifier for the format.
    edam_format = "format_3827"
    # Column labels, listed in column order (25 in total).
    column_names = [
        'Chrom',
        'Start',
        'End',
        'Name',
        'Score',
        'Strand',
        'ThickStart',
        'ThickEnd',
        'ItemRGB',
        'BlockCount',
        'BlockSizes',
        'BlockStarts',
        'ProteinAccession',
        'PeptideSequence',
        'Uniqueness',
        'GenomeReferenceVersion',
        'PsmScore',
        'Fdr',
        'Modifications',
        'Charge',
        'ExpMassToCharge',
        'CalcMassToCharge',
        'PsmRank',
        'DatasetID',
        'Uri',
    ]


class BedStrict(Bed):
"""Tab delimited data in strict BED format - no non-standard columns allowed"""
edam_format = "format_3584"
Expand Down

0 comments on commit 007e3cc

Please sign in to comment.