This repository has been archived by the owner on Nov 9, 2023. It is now read-only.
/
shared_phylotypes.py
executable file
·77 lines (64 loc) · 3.46 KB
/
shared_phylotypes.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
#!/usr/bin/env python
# File created on 12 Aug 2010
from __future__ import division
__author__ = "Jens Reeder"
__copyright__ = "Copyright 2011, The QIIME Project"
__credits__ = ["Jens Reeder"]
__license__ = "GPL"
__version__ = "1.8.0"
__maintainer__ = "Jose Clemente"
__email__ = "jose.clemente@gmail.com"
from glob import glob
from os.path import exists, split, splitext, isdir
from qiime.util import make_option
from qiime.util import parse_command_line_parameters,\
get_options_lookup, create_dir
from qiime.shared_phylotypes import calc_shared_phylotypes
options_lookup = get_options_lookup()
script_info = {}
script_info['brief_description'] = "Compute shared OTUs between all pairs of samples"
script_info['script_description'] = "This script computes from an OTU table a matrix with the number of shared phylotypes between all pairs of samples."
script_info['script_usage'] = [
("Single example","Compute shared OTUs on one OTU table for all samples","%prog -i otu_table.biom -o shared_otus.txt"),
("Reference sample example","Compute shared OTUs with respect to a reference sample. Computes shared OTUs between all pairs of samples and the reference sample. E.g. in a transplant study this can be used to establish a base line count of shared OTUs with the Donor sample before and after the transplant.","%prog -i otu_table.biom -o shared_otus_PC.636.txt -r PC.636"),
("Batch mode example","Compute shared OTUs for a set of OTU tables, e.g. from running multiple_rarefactions.py, with an even number of sequences per sample. The resulting directory can be fed to dissimilarity_mtx_stats.py, which computes mean, median and the standard deviation on the provided tables.", "%prog -i rarefied_otu_tables/ -o shared_otus/")
]
script_info['output_description']= ""
script_info['required_options'] = [\
make_option('-i','--otu_table_fp',type='existing_path',\
help='path to the input OTU table in biom format or a directory containing OTU tables'),
options_lookup['output_fp']
]
script_info['optional_options'] = [\
# Example optional option
make_option('-r','--reference_sample',type='string',
help='Name of reference sample to which all pairs of samples should be compared '
+ '[default: %default]', default=None),
]
script_info['version'] = __version__
def main():
option_parser, opts, args =\
parse_command_line_parameters(**script_info)
if isdir(opts.otu_table_fp):
ret_code = create_dir(opts.output_fp, fail_on_exist=False)
#run on each file in dir
for fp in glob(opts.otu_table_fp +'/*biom'):
parent_dir_name, file_name = split(fp)
basename, extension = splitext(file_name)
out_fp = opts.output_fp +"/"+basename+"_shared_OTUs.txt"
out_fh = open(out_fp, "w")
out_fh.write(calc_shared_phylotypes(open(fp, "U"),
opts.reference_sample))
out_fh.close()
else:
#run in single file mode
try:
out_fh = open(opts.output_fp,"w")
except IOError, message:
exit(("Can't open output file %s for writing. Check the permissions "\
+"or existing directory with identical name.\n%s")
% (opts.output_fp,message))
out_fh.write(calc_shared_phylotypes(open(opts.otu_table_fp, "U"),
opts.reference_sample))
if __name__ == "__main__":
main()