Skip to content

Commit

Permalink
Add Letsearch Russian search engine to bots list (closing PR #577)
Browse files Browse the repository at this point in the history
  • Loading branch information
NielsLeenheer committed Jan 4, 2021
1 parent 80bcc17 commit ac6299b
Show file tree
Hide file tree
Showing 3 changed files with 7 additions and 2 deletions.
1 change: 1 addition & 0 deletions data/applications-bots.php
Original file line number Diff line number Diff line change
Expand Up @@ -171,6 +171,7 @@
[ 'name' => 'KakaoTalk Bot', 'id' => 'kakao', 'regexp' => '/kakaotalk-scrap\/([0-9.]*)/u' ],
[ 'name' => 'Kouio', 'id' => 'kouio', 'regexp' => '/kouio.com/u' ],
[ 'name' => 'Larbin', 'id' => 'larbin', 'regexp' => '/[Ll]arbin[\/_]([0-9.]*)/u' ],
[ 'name' => 'LetsearchBot', 'id' => 'letsearch', 'regexp' => '/LetsearchBot\/([0-9.]*)/u' ],
[ 'name' => 'Linkedin Bot', 'id' => 'linkedin', 'regexp' => '/LinkedInBot\/([0-9.]*)/u' ],
[ 'name' => 'Linkpad Bot', 'id' => 'linkpad', 'regexp' => '/LinkpadBot\/([0-9.]*)/u' ],
[ 'name' => 'Linkdex Bot', 'id' => 'linkdex', 'regexp' => '/linkdexbot-mobile\/([0-9.]*)/u' ],
Expand Down
2 changes: 1 addition & 1 deletion data/regexes/applications-bots.php
Original file line number Diff line number Diff line change
Expand Up @@ -2,4 +2,4 @@

namespace WhichBrowser\Data;

// Assigns one case-insensitive (`/i`) PCRE pattern to Applications::$BOTS_REGEX:
// a single capture group holding an alternation of bot/tool keywords.
// Literal dots and the `!` are backslash-escaped (`mail\.ru`, `y\!j`).
//
// The two assignments below are the removed and added sides of this diff hunk;
// they appear to differ only by the `letsearch` alternative inserted between
// `larbin` and `linkedin`. In the real file only the second assignment exists.
//
// NOTE(review): presumably this is a coarse pre-filter consulted before the
// per-bot regexps in data/applications-bots.php, and may be generated from that
// list — confirm before hand-editing, since the consumer is not visible here.
Applications::$BOTS_REGEX = '/(008|360|a6|abound|muncher|adaxas|addthis|admantx|ahrefs|archiver|altavista|curious|cloudfront|amorank|apple|archive|jeeves|astra|backlink|baidu|bazqux|bingbot|msnbot|msmobot|bing|blex|blogbridge|bloglines|bloglovin|blogpulse|blogram|blogtrot|blogshares|boardreader|lddc|browsershots|bubing|buck|builtwith|butterfly|bytespider|heritrix|cliqz|cloudflare|comodo|commafeed|cbot|cresearch|watchdog|datasearch|dataprovider|daumoa|digg|domaincrawl|domainstats|discord|domain|dmca|duckduck|embed|exabot|exactseek|ezooms|facebook|fast|flamingo|fastladder|feed|wrangler|validator|fever|florienzh|friendica|robot|genieo|fetchor|google|gofeed|gomez|ichiro|gooblog|goorss|gowiki|grammarly|grub|hatena|capture|heureka|htdig|httpmon|hubpages|spider|indeed|istellabot|crawler|kakao|kouio|larbin|linkedin|linkpad|linkdex|livedoor|ltx71|magpie|mj12bot|mapion|mail\.ru|megaindex|socialstreams|mixi|mnogo|monitor|dotbot|rogerbot|yeti|mxtoolbox|netcraft|netestate|netvibes|newsblur|newsgator|nimbostratus|orange|pages|psbot|pingdom|pinterest|pocket|postrank|comment|reddit|rssbar|hunter|quora|safesearch|scrapy|searchatlas|semrush|serpstat|seokicks|seznam|shopwiki|reader|simplepie|site24|slack|sogou|sophora|soso|spaziodati|spdycheck|spinn|sputnik|detector|summify|telegram|twisted|twitter|tiny|tineye|tlsprober|trustedsite|typhoeus|vagabondo|voat|voila|vocus|mcrawler|w3bot|jigsaw|w3c|wappalyzer|wayback|webindexer|wordpress|mechanize|xerka|sitemap|yacy|yandex|yahoo|y\!j|slurp|yelp|yioop|yisou|zmeu|httpclient|nutch|synapse|indy|go|node|wget|curl|package|java|simple|libwww|lwp|urllib|requests|php|pear|zend|ruby)/i';
Applications::$BOTS_REGEX = '/(008|360|a6|abound|muncher|adaxas|addthis|admantx|ahrefs|archiver|altavista|curious|cloudfront|amorank|apple|archive|jeeves|astra|backlink|baidu|bazqux|bingbot|msnbot|msmobot|bing|blex|blogbridge|bloglines|bloglovin|blogpulse|blogram|blogtrot|blogshares|boardreader|lddc|browsershots|bubing|buck|builtwith|butterfly|bytespider|heritrix|cliqz|cloudflare|comodo|commafeed|cbot|cresearch|watchdog|datasearch|dataprovider|daumoa|digg|domaincrawl|domainstats|discord|domain|dmca|duckduck|embed|exabot|exactseek|ezooms|facebook|fast|flamingo|fastladder|feed|wrangler|validator|fever|florienzh|friendica|robot|genieo|fetchor|google|gofeed|gomez|ichiro|gooblog|goorss|gowiki|grammarly|grub|hatena|capture|heureka|htdig|httpmon|hubpages|spider|indeed|istellabot|crawler|kakao|kouio|larbin|letsearch|linkedin|linkpad|linkdex|livedoor|ltx71|magpie|mj12bot|mapion|mail\.ru|megaindex|socialstreams|mixi|mnogo|monitor|dotbot|rogerbot|yeti|mxtoolbox|netcraft|netestate|netvibes|newsblur|newsgator|nimbostratus|orange|pages|psbot|pingdom|pinterest|pocket|postrank|comment|reddit|rssbar|hunter|quora|safesearch|scrapy|searchatlas|semrush|serpstat|seokicks|seznam|shopwiki|reader|simplepie|site24|slack|sogou|sophora|soso|spaziodati|spdycheck|spinn|sputnik|detector|summify|telegram|twisted|twitter|tiny|tineye|tlsprober|trustedsite|typhoeus|vagabondo|voat|voila|vocus|mcrawler|w3bot|jigsaw|w3c|wappalyzer|wayback|webindexer|wordpress|mechanize|xerka|sitemap|yacy|yandex|yahoo|y\!j|slurp|yelp|yioop|yisou|zmeu|httpclient|nutch|synapse|indy|go|node|wget|curl|package|java|simple|libwww|lwp|urllib|requests|php|pear|zend|ruby)/i';
6 changes: 5 additions & 1 deletion tests/data/bots/generic.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -841,4 +841,8 @@
-
headers: 'User-Agent: YisouSpider'
readable: 'Yisou Spider'
result: { browser: { name: 'Yisou Spider' }, device: { type: bot } }
result: { browser: { name: 'Yisou Spider' }, device: { type: bot } }
-
headers: 'User-Agent: Mozilla/5.0 (compatible; LetsearchBot/1.0; +https://letsearch.ru/bots)'
readable: 'LetsearchBot 1.0'
result: { browser: { name: LetsearchBot, version: '1.0' }, device: { type: bot } }

0 comments on commit ac6299b

Please sign in to comment.