Skip to content

Commit

Permalink
Merge pull request #91 from carlosp420/dont_use_lowercase_gene_voucher_codes
Browse files Browse the repository at this point in the history

Don't use lowercase gene voucher codes
  • Loading branch information
carlosp420 committed Mar 13, 2015
2 parents 0755f60 + b15f20b commit 710b961
Show file tree
Hide file tree
Showing 8 changed files with 94 additions and 82 deletions.
11 changes: 5 additions & 6 deletions voseq/core/utils.py
Expand Up @@ -33,15 +33,15 @@ def get_voucher_codes(cleaned_data):
for i in voucher_codes:
if re.search('^--', i):
i_clean = re.sub('^--', '', i)
voucher_codes_clean.append(i_clean.lower())
voucher_codes_clean.append(i_clean)
else:
voucher_codes_clean.append(i.lower())
voucher_codes_clean.append(i)
voucher_codes_set = set(voucher_codes_clean)

vouchers_to_drop = []
for i in voucher_codes:
if re.search('^--', i):
vouchers_to_drop.append(re.sub('^--', '', i).lower())
vouchers_to_drop.append(re.sub('^--', '', i))

voucher_codes_filtered = []
for i in voucher_codes_set:
Expand All @@ -68,9 +68,8 @@ def get_gene_codes(cleaned_data):
if len(cleaned_data['gene_codes']) > 0:
gene_codes += [i.gene_code for i in cleaned_data['gene_codes']]

gene_codes_lower_case = [i.lower() for i in gene_codes]
gene_codes_lower_case.sort()
return set(gene_codes_lower_case)
gene_codes.sort()
return set(gene_codes)


def get_version_stats():
Expand Down
4 changes: 2 additions & 2 deletions voseq/create_dataset/dataset.py
Expand Up @@ -27,7 +27,7 @@ def get_reading_frames(self):
reading_frames = dict()
genes = Genes.objects.all().values('gene_code', 'reading_frame')
for gene in genes:
gene_code = gene['gene_code'].lower()
gene_code = gene['gene_code']
if gene_code in self.gene_codes:
reading_frames[gene_code] = gene['reading_frame']
return reading_frames
Expand All @@ -47,7 +47,7 @@ def split_sequence_in_codon_positions(self, gene_code, seq):
processed to extract the codon positions requested by the user.
"""
reading_frame = int(self.reading_frames[gene_code.lower()]) - 1
reading_frame = int(self.reading_frames[gene_code]) - 1
seq = seq[reading_frame:]

# This is the BioPython way to get codon positions
Expand Down
10 changes: 5 additions & 5 deletions voseq/create_dataset/tests/tests_create_nexus_dataset.py
Expand Up @@ -43,20 +43,20 @@ def test_nexus(self):
FORMAT INTERLEAVE DATATYPE=DNA MISSING=? GAP=-;
MATRIX
[coi]
[COI]
CP100-10_Melitaea_diamina ?????????????????????????TGAGCCGGTATAATTGGTACATCCCTAAGTCTTATTATTCGAACCGAATTAGGAAATCCTAGTTTTTTAATTGGAGATGATCAAATTTATAATACCATTGTAACAGCTCATGCTTTTATTATAATTTTTTTTATAGTTATGCCAATTATAATTGGAGGATTTGGTAATTGACTTGTACCATTAATATTGGGAGCCCCAGATATAGCTTTCCCCCGAATAAATTATATAAGATTTTGATTATTGCCTCCATCCTTAATTCTTTTAATTTCAAGTAGAATTGTAGAAAATGGGGCAGGAACTGGATGAACAGTTTACCCCCCACTTTCATCTAATATTGCCCATAGAGGAGCTTCAGTGGATTTAGCTATTTTTTCTTTACATTTAGCTGGGATTTCCTCTATCTTAGGAGCTATTAATTTTATTACTACAATTATTAATATACGAATTAATAATATATCTTATGATCAAATACCTTTATTTGTATGAGCAGTAGGAATTACAGCATTACTTCTCTTATTATCTTTACCAGTTTTAGCTGGAGCTATTACTATACTTTTAACGGATCGAAATCTTAATACCTCATTTTTTGATTCCTGCGGAGGAGGAGATCC???????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????
CP100-11_Melitaea_diamina ??TGAGCCGGTATAATTGGTACATCCCTAAGTCTTATTATTCGAACCGAATTAGGAAATCCTAGTTTTTTAATTGGAGATGATCAAATTTATAATACCATTGTAACAGCTCATGCTTTTATTATAATTTTTTTTATAGTTATGCCAATTATAATTGGAGGATTTGGTAATTGACTTGTACCATTAATATTGGGAGCCCCAGATATAGCTTTCCCCCGAATAAATTATATAAGATTTTGATTATTGCCTCCATCCTTAATTCTTTTAATTTCAAGTAGAATTGTAGAAAATGGGGCAGGAACTGGATGAACAGTTTACCCCCCACTTTCATCTAATATTGCCCATAGAGGAGCTTCAGTGGATTTAGCTATTTTTTCTTTACATTTAGCTGGGATTTCCTCTATCTTAGGAGCTATTAATTTTATTACTACAATTATTAATATACGAATTAATAATATATCTTATGATCAAATACCTTTATTTGTATGAGCAGTAGGAATTACAGCATTACTTCTCTTATTATCTTTACCAGTTTTAGCTGGAGCTATTACTATACTTTTAACGGATCGAAATCTTAATACCTCATTTTTTGATTCCTGCGGAGGAGGAGATCC??????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????
[ef1a]
[EF1a]
CP100-10_Melitaea_diamina ???????????????CAAGTCCACCACCACCGGCCACTTGATTTACAAATGTGGTGGTATCGACAAACGTACCATCGAGAAGTTCGAGAAGGAAGCCCAGGAAATGGGCAAGGGTTCCTTCAAGTACGCTTGGGTGTTGGACAAACTTAAGGCTGAGCGCGAGCGTGGTATCACTATTGATATTGCTCTGTGGAAGTTCGAGACTGCCAAATACTATGTAACCATCATCGATGCTCCCGGACACAGAGATTTCATCAAGAACATGATCACCGGAACATCACAAGCCGATTGCGCCGTACTTATCGTCGCCGCCGGTACTGGTGAGTTCGAAGCCGGTATCTCAAAGAACGGTCAGACCCGTGAGCACGCTCTGCTCGCCTTCACATTAGGTGTAAAGCAGCTGATTGTAGGAGTCAACAAAATGGACTCCACTGAGCCCCCATACAATGAGGGACGTTTCGAGGAAATCAAAAAGGAAGTGTCCTCTTACATCAAGAAGATCGGTTACAACCCAGCTGCCGTCGCTTTCGTACCCATTTCTGGCTGGCACGGAGACAACATGCTGGAGCCATCTACCAAAATGTCCCGGTTCAAGGGATGGCAAGTGGAGCGCAAAGAAGGCAAGG???AAGGTAAATGCCTCATTGAAGCTC???ACGCCATCCTTCCTCCGG?????CCCAC????????????????????????????????????????????????TATTGGTACAGTGCCCGTAGGCAGAGTAGAAACTGGTATCCTCAAACCAGGTACCATTGTTGTTTTCGCTCCCGCCAACATCACCACTGAAGTCAAATCTGTGGAGATGCACCACGAAGCTCTCCAAGAGGCTGTACCTGGAGACAATGTAGGTTTCAACGTCAAGAACGTTTCCGTCAAGGAATTACGTCGTGGTTATGTAGCTGGTGACTCCAAGAACAACCCACCCAAGGGAGCTGCTGACTTCACCGCACAAGTCATTGTGCTCAACCACCCCGGTCAAATCTCCAATGGCTACACACCTGTGCTCGATTGCCACACAGCTCACATTGCCTGCAAATTCGCCGAAATCAAAGAAAAGGTTGACCGTCGTTCCGGTAAATCYACTGAGGACAATCCTAAATCTATCAAATCTGGTGATGCTGCCATTGTGAACTTGGTACCTTCCAAACCCCTCTGTGTGGAGGCCTTCCAAGAATTCCCACCTCTTGGTCG?????????????
CP100-11_Melitaea_diamina ????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????
;
END;
begin mrbayes;
charset coi = 1-1047;
charset ef1a = 1048-2287;
partition GENES = 2: coi, ef1a;
charset COI = 1-1047;
charset EF1a = 1048-2287;
partition GENES = 2: COI, EF1a;
set partition = GENES;
Expand Down

0 comments on commit 710b961

Please sign in to comment.