diff --git a/findspam.py b/findspam.py index 9222088cd6..f162fa5a21 100644 --- a/findspam.py +++ b/findspam.py @@ -26,7 +26,8 @@ class FindSpam: "JobsTribune", "join the illuminati", "Brorsoft", "Remo Recover", "kinnaristeel", "clash of (clan|stone)s? (cheats?|tricks?|gems?)", r"(?x:B [\s_]* A [\s_]* M \W{0,5} W [\s_]* A [\s_]* R [\s_]* \.? [\s_]* C [\s_]* O [\s_]* M)", - "slumber pm", "1-844-400-7325", "male enhancement"] + "slumber pm", "1-844-400-7325", "male enhancement", + r"\p{script=Hangul}"] bad_keywords_nwb = [u"ಌ", "babyliss", "garcinia", "acai ?berry", # "nwb" == "no word boundary" "aging ?cream", u"오피", "b ?a ?m ?((w ?o ?w)|(w ?a ?r))"] blacklisted_websites = ["online ?kelas", "careyourhealths", "wowtoes",