Skip to content

Commit

Permalink
cricket, menhealth
Browse files Browse the repository at this point in the history
  • Loading branch information
normalhuman committed Mar 1, 2016
1 parent 93d2d39 commit a97d7be
Showing 1 changed file with 2 additions and 1 deletion.
3 changes: 2 additions & 1 deletion findspam.py
Original file line number Diff line number Diff line change
Expand Up @@ -341,7 +341,7 @@ class FindSpam:
# Patterns: the top few lines are the most straightforward; each matches any site with one of these strings in its domain name
pattern_websites = [r"(inboxmachine|(get|buy)cheap|escort|diploma|extramoney|earnathome|spell(caster|specialist)|profits|seo(tool|service|trick)|onsale|fat(burn|loss)|(\.|//|best)cheap|online(training|solution))[\w-]*?\.(co|net|org|in\W|info|wordpress|blogspot)",
r"(trainingin|cracked\w{3}|bestmover|relocation|\w{4}mortgage|loans|revenue|testo[-bsx]|cleanse|cleansing|detox|supplement|lubricant|serum|wrinkle|topcare|freetrial)[\w-]*?\.(co|net|org|in\W|info|wordpress|blogspot)",
r"(babaji|spellcaster|potentbody|moist|lefair|lubricant|derma(?![nt])|xtrm|factorx|nitro(?!us)|crazy(bulk|mass)|nauseam|endorev|ketone|//xtra)[\w-]*?\.(co|net|org|in\W|info|wordpress|blogspot)",
r"(menhealth|babaji|spellcaster|potentbody|moist|lefair|lubricant|derma(?![nt])|xtrm|factorx|nitro(?!us)|crazy(bulk|mass)|nauseam|endorev|ketone|//xtra)[\w-]*?\.(co|net|org|in\W|info|wordpress|blogspot)",
r"([\w-]password|\w{5}facts|\w\dfacts|\Btoyshop|[\w-]{6}cheats|credits)\.(co|net|org|in\W|info)",
r"health\d{3,}\.(com|net)", "https?://[\w-.]*?\.(repair|help)[\W]",
r"filefix(er)?\.com", "\.page\.tl\W",
Expand Down Expand Up @@ -382,6 +382,7 @@ class FindSpam:
r"scam[\w-]*?(book|alert|register|punch)[\w-]*?\.(co|net|org|in\W|info)",
r"https?://[^/\s]{8,}healer",
r"\w{9}rev\.com",
r"world[\w-]*?cricket[\w-]*?\.(co|net|org|in\W|info)",
r"(credit|online)[\w-]*?loan[\w-]*?\.(co|net|org|in\W|info)"]
rules = [
# Sites in sites[] are excluded if 'all' == True, and whitelisted if 'all' == False.
Expand Down

0 comments on commit a97d7be

Please sign in to comment.