Skip to content

Commit

Permalink
Version 20240417.03. Handle new form of old spam loop.
Browse files Browse the repository at this point in the history
  • Loading branch information
Arkiver2 committed Apr 17, 2024
1 parent 6e61565 commit e926de3
Show file tree
Hide file tree
Showing 2 changed files with 9 additions and 4 deletions.
2 changes: 1 addition & 1 deletion pipeline.py
Expand Up @@ -83,7 +83,7 @@ def search(self, text):
#
# Update this each time you make a non-cosmetic change.
# It will be added to the WARC files and reported to the tracker.
-VERSION = '20240417.02'
+VERSION = '20240417.03'
#USER_AGENT = 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/86.0.4240.183 Safari/537.36'
TRACKER_ID = 'urls'
TRACKER_HOST = 'legacy-api.arpa.li'
Expand Down
11 changes: 8 additions & 3 deletions urls.lua
Expand Up @@ -247,11 +247,16 @@ local filter_pattern_sets = {
--["flashplayer"]="^https?://www%.macromedia%.com/go/getflashplayer$",
["tupian"]={
"^https?://[^/]+%.[^%./]+%.[a-z]+/tupian_1/[^%./]+%.jpg$",
-"^https?://[^/]+%.[^%./]+%.[a-z]+/templates/moban",
-"^https?://[^/]+%.[^%./]+%.[a-z]+/templates/[^/]+/moban"
+"^https?://[^/]+%.[^%./]+%.[a-z]+/templates/moban[0-9]*/",
+"^https?://[^/]+%.[^%./]+%.[a-z]+/templates/[^/]+/moban[0-9]*/"
},
["slash"]="^https?://[^/]+%.[^%./]+%.[a-z]+/[^/]+/$",
-["tk88"]="tk88",
+["other1"]={
+"tk88",
+"^https?://[^/]+%.[^%./]+%.[a-z]+/list_[a-z]+/$",
+"^https?://[^/]+%.[^%./]+%.[a-z]+/news/[0-9][0-9][0-9][0-9][0-9][0-9][0-9][0-9][^0-9]",
+"^https?://[^/]+%.[^%./]+%.[a-z]+/static/logo%.jpg"
+},
["other"]={
"%.xlsx?$",
"%.pptx?$",
Expand Down

0 comments on commit e926de3

Please sign in to comment.