In [7]:
import re

class Motifs:
    """Scan FASTA-style protein files for Walker A and Walker B motifs.

    The constructor stores ``seq``, ``walker_a_motif`` and ``walker_b_motif``
    unchanged. The ``find_*`` methods work on the file path passed to them
    and do not read these attributes.
    """

    # The Walker A motif in proteins is associated with phosphate binding.
    # The motif has the pattern G-x(4)-GK-[TS], where G, K, T and S denote
    # glycine, lysine, threonine and serine residues respectively, and x
    # denotes any amino acid. It is present in many ATP- or GTP-utilizing
    # proteins; it is the beta phosphate of the nucleotide that is bound.
    # Raw string: in a plain literal "\D" is an invalid escape sequence.
    _WALKER_A = re.compile(r'[G]\D{4}[G][K][TS]')

    # The Walker B motif is a motif in most P-loop proteins situated well
    # downstream of the A motif. The consensus sequence of this motif was
    # reported to be [RK]-x(3)-G-x(3)-LhhhD, where R, K, G, L and D denote
    # arginine, lysine, glycine, leucine and aspartic acid residues
    # respectively, x represents any of the 20 standard amino acids and h
    # denotes a hydrophobic amino acid.
    # NOTE(review): the three "h" positions are matched with \D (any non-digit
    # character), which is looser than "hydrophobic only" -- confirm whether
    # a restricted residue set is wanted.
    _WALKER_B = re.compile(r'[RK]\D{3}[G]\D{3}[L]\D{3}[D]')

    def __init__(self, seq=None, walker_a_motif=None, walker_b_motif=None):
        """Store the given values on the instance without validation."""
        self.seq = seq
        self.walker_a_motif = walker_a_motif
        self.walker_b_motif = walker_b_motif

    def _report_motif(self, file, pattern, found_message):
        """Print a header or a motif verdict for every non-blank line of ``file``."""
        # The context manager closes the handle even if printing fails.
        with open(file) as handle:
            for raw_line in handle:
                # Strip inside the loop: the line only exists once it is read.
                line = raw_line.rstrip()
                if not line:
                    # Blank lines carry no sequence, so they get no verdict.
                    continue
                if line.startswith(">"):
                    print("Protein information:\n", line)
                elif pattern.search(line):
                    print(found_message)
                else:
                    print("No motif found :(")

    def find_walker_a(self, file):
        """Report, line by line, whether ``file`` contains a Walker A motif.

        Parameters
        ----------
        file : str or path-like
            Path of a text file. Lines starting with ">" are printed as
            protein information; every other non-blank line is searched
            for G-x(4)-GK-[TS].

        Returns
        -------
        None
            Results are printed, one message per line of the file.

        Notes
        -----
        Each line is searched on its own, so a motif that is split across
        two lines of a wrapped sequence is not detected.
        """
        self._report_motif(file, self._WALKER_A, "Walker A motif found!")

    def find_walker_b(self, file):
        """Report, line by line, whether ``file`` contains a Walker B motif.

        Parameters
        ----------
        file : str or path-like
            Path of a text file. Lines starting with ">" are printed as
            protein information; every other non-blank line is searched
            for [RK]-x(3)-G-x(3)-L-x(3)-D.

        Returns
        -------
        None
            Results are printed, one message per line of the file.

        Notes
        -----
        Each line is searched on its own, so a motif that is split across
        two lines of a wrapped sequence is not detected.
        """
        self._report_motif(file, self._WALKER_B, "Walker B motif found!")

In [3]:
import re

# Test sequence containing "GXXDSGKT": G, four residues, then GKT, which fits
# the Walker A pattern G-x(4)-GK-[TS].
line = 'GHDJSKEIDKCGXXDSGKTVFCFFVDESASSDF'

def walker_a(line):
    """Print whether ``line`` contains a Walker A motif, G-x(4)-GK-[TS].

    Parameters
    ----------
    line : str
        Protein sequence in one-letter amino-acid code.

    Returns
    -------
    None
        Prints "Walker A motif found!" when the pattern occurs anywhere in
        ``line`` and "No motif found :(" otherwise.
    """
    # Raw string: in a plain literal "\D" is an invalid escape sequence.
    # The x positions are matched with \D, i.e. any non-digit character.
    if re.search(r'[G]\D{4}[G][K][TS]', line):
        print("Walker A motif found!")
    else:
        print("No motif found :(")
        
# Run the Walker A check on the test sequence defined in this cell.
walker_a(line)

Walker A motif found!


In [6]:
# Variant of the earlier test sequence with one X removed: only three residues
# (XDS) separate the glycine from GKT, so G-x(4)-GK-[TS] does not match.
line = 'GHDJSKEIDKCGXDSGKTVFCFFVDESASSDF'

walker_a(line)

No motif found :(


In [9]:
# hemoglobin subunit beta [Homo sapiens]
# None of the GK pairs in this sequence is followed by T or S, so the
# Walker A pattern G-x(4)-GK-[TS] cannot match.
line = 'MVHLTPEEKSAVTALWGKVNVDEVGGEALGRLLVVYPWTQRFFESFGDLSTPDAVMGNPKVKAHGKKVLGAFSDGLAHLDNLKGTFATLSELHCDKLHVDPENFRLLGNVLVCVLAHHFGKEFTPPVQAAYQKVVAGVANALAHKYH'

walker_a(line)

No motif found :(


In [12]:
# ATP-binding cassette sub-family E member 1 [Homo sapiens]
# Contains stretches that fit G-x(4)-GK-[TS], e.g. "GTNGIGKS" and "GENGTGKT".
line = 'MADKLTRIAIVNHDKCKPKKCRQECKKSCPVVRMGKLCIEVTPQSKIAWISETLCIGCGICIKKCPFGALSIVNLPSNLEKETTHRYCANAFKLHRLPIPRPGEVLGLVGTNGIGKSTALKILAGKQKPNLGKYDDPPDWQEILTYFRGSELQNYFTKILEDDLKAIIKPQYVDQIPKAAKGTVGSILDRKDETKTQAIVCQQLDLTHLKERNVEDLSGGELQRFACAVVCIQKADIFMFDEPSSYLDVKQRLKAAITIRSLINPDRYIIVVEHDLSVLDYLSDFICCLYGVPSAYGVVTMPFSVREGINIFLDGYVPTENLRFRDASLVFKVAETANEEEVKKMCMYKYPGMKKKMGEFELAIVAGEFTDSEIMVMLGENGTGKTTFIRMLAGRLKPDEGGEVPVLNVSYKPQKISPKSTGSVRQLLHEKIRDAYTHPQFVTDVMKPLQIENIIDQEVQTLSGGELQRVALALCLGKPADVYLIDEPSAYLDSEQRLMAARVVKRFILHAKKTAFVVEHDFIMATYLADRVIVFDGVPSKNTVANSPQTLLAGMNKFLSQLEITFRRDPNNYRPRINKLNSIKDVEQKKSGNYFFLDD'

walker_a(line)

Walker A motif found!
