Skip to content

Commit

Permalink
Add Vuhuv Turkish search engine to bot list (closes PR #576)
Browse files Browse the repository at this point in the history
  • Loading branch information
NielsLeenheer committed Jan 4, 2021
1 parent 5cdf50b commit 4293566
Show file tree
Hide file tree
Showing 3 changed files with 7 additions and 2 deletions.
1 change: 1 addition & 0 deletions data/applications-bots.php
Original file line number Diff line number Diff line change
Expand Up @@ -276,6 +276,7 @@
[ 'name' => 'Voilabot', 'id' => 'voila', 'regexp' => '/Voila[Bb]ot/u' ],
[ 'name' => 'VocusBot', 'id' => 'vocus', 'regexp' => '/VocusBot ([0-9.]*)/u' ],
[ 'name' => 'Vodafone mCrawler', 'id' => 'mcrawler', 'regexp' => '/Vodafone mCrawler/u' ],
[ 'name' => 'VuhuvBot', 'id' => 'vuhuv', 'regexp' => '/vuhuvBot\/([0-9.]*)/u' ],
[ 'name' => 'W3Bot', 'id' => 'w3bot', 'regexp' => '/W3Bot ([0-9.]*)/u' ],
[ 'name' => 'W3C CSS Validator', 'id' => 'jigsaw', 'regexp' => '/Jigsaw\/([0-9.]*)/u' ],
[ 'name' => 'W3C Internationalization Checker', 'id' => 'w3c', 'regexp' => '/W3C_I18n-Checker\/([0-9.]*)/u' ],
Expand Down
2 changes: 1 addition & 1 deletion data/regexes/applications-bots.php
Original file line number Diff line number Diff line change
Expand Up @@ -2,4 +2,4 @@

namespace WhichBrowser\Data;

Applications::$BOTS_REGEX = '/(008|360|a6|abound|muncher|adaxas|addthis|admantx|ahrefs|archiver|altavista|curious|cloudfront|amorank|apple|archive|jeeves|astra|backlink|baidu|bazqux|bingbot|msnbot|msmobot|bing|blex|blogbridge|bloglines|bloglovin|blogpulse|blogram|blogtrot|blogshares|boardreader|lddc|browsershots|bubing|buck|builtwith|butterfly|bytespider|heritrix|cliqz|cloudflare|comodo|commafeed|cbot|cresearch|watchdog|datasearch|dataprovider|daumoa|digg|domaincrawl|domainstats|discord|domain|dmca|duckduck|embed|exabot|exactseek|ezooms|facebook|fast|flamingo|fastladder|feed|wrangler|validator|fever|florienzh|friendica|robot|genieo|fetchor|google|gofeed|gomez|ichiro|gooblog|goorss|gowiki|grammarly|grub|hatena|capture|heureka|htdig|httpmon|hubpages|spider|indeed|istellabot|crawler|kakao|kouio|larbin|letsearch|linkedin|linkpad|linkdex|livedoor|seeker|ltx71|magpie|mj12bot|mapion|mail\.ru|megaindex|socialstreams|mixi|mnogo|monitor|dotbot|rogerbot|yeti|mxtoolbox|netcraft|netestate|netvibes|newsblur|newsgator|nimbostratus|orange|pages|psbot|pingdom|pinterest|pocket|postrank|comment|reddit|rssbar|hunter|quora|safesearch|scrapy|searchatlas|semrush|serpstat|seokicks|seznam|shopwiki|reader|simplepie|site24|slack|sogou|sophora|soso|spaziodati|spdycheck|spinn|sputnik|detector|summify|telegram|twisted|twitter|tiny|tineye|tlsprober|trustedsite|typhoeus|vagabondo|voat|voila|vocus|mcrawler|w3bot|jigsaw|w3c|wappalyzer|wayback|webindexer|wordpress|mechanize|xerka|sitemap|yacy|yandex|yahoo|y\!j|slurp|yelp|yioop|yisou|zmeu|httpclient|nutch|synapse|indy|go|node|wget|curl|package|java|simple|libwww|lwp|urllib|requests|php|pear|zend|ruby)/i';
Applications::$BOTS_REGEX = '/(008|360|a6|abound|muncher|adaxas|addthis|admantx|ahrefs|archiver|altavista|curious|cloudfront|amorank|apple|archive|jeeves|astra|backlink|baidu|bazqux|bingbot|msnbot|msmobot|bing|blex|blogbridge|bloglines|bloglovin|blogpulse|blogram|blogtrot|blogshares|boardreader|lddc|browsershots|bubing|buck|builtwith|butterfly|bytespider|heritrix|cliqz|cloudflare|comodo|commafeed|cbot|cresearch|watchdog|datasearch|dataprovider|daumoa|digg|domaincrawl|domainstats|discord|domain|dmca|duckduck|embed|exabot|exactseek|ezooms|facebook|fast|flamingo|fastladder|feed|wrangler|validator|fever|florienzh|friendica|robot|genieo|fetchor|google|gofeed|gomez|ichiro|gooblog|goorss|gowiki|grammarly|grub|hatena|capture|heureka|htdig|httpmon|hubpages|spider|indeed|istellabot|crawler|kakao|kouio|larbin|letsearch|linkedin|linkpad|linkdex|livedoor|seeker|ltx71|magpie|mj12bot|mapion|mail\.ru|megaindex|socialstreams|mixi|mnogo|monitor|dotbot|rogerbot|yeti|mxtoolbox|netcraft|netestate|netvibes|newsblur|newsgator|nimbostratus|orange|pages|psbot|pingdom|pinterest|pocket|postrank|comment|reddit|rssbar|hunter|quora|safesearch|scrapy|searchatlas|semrush|serpstat|seokicks|seznam|shopwiki|reader|simplepie|site24|slack|sogou|sophora|soso|spaziodati|spdycheck|spinn|sputnik|detector|summify|telegram|twisted|twitter|tiny|tineye|tlsprober|trustedsite|typhoeus|vagabondo|voat|voila|vocus|mcrawler|vuhuv|w3bot|jigsaw|w3c|wappalyzer|wayback|webindexer|wordpress|mechanize|xerka|sitemap|yacy|yandex|yahoo|y\!j|slurp|yelp|yioop|yisou|zmeu|httpclient|nutch|synapse|indy|go|node|wget|curl|package|java|simple|libwww|lwp|urllib|requests|php|pear|zend|ruby)/i';
6 changes: 5 additions & 1 deletion tests/data/bots/generic.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -849,4 +849,8 @@
-
headers: 'User-Agent: Seeker v.1 http://LookSeek.com/seeker/'
readable: 'LookSeek 1'
result: { browser: { name: LookSeek, version: '1' }, device: { type: bot } }
result: { browser: { name: LookSeek, version: '1' }, device: { type: bot } }
-
headers: 'User-Agent: Mozilla/5.0 (compatible; vuhuvBot/1.0; +http://vuhuv.com/bot.html)'
readable: 'VuhuvBot 1.0'
result: { browser: { name: VuhuvBot, version: '1.0' }, device: { type: bot } }

0 comments on commit 4293566

Please sign in to comment.