|
|
@@ -1,5 +1,5 @@ |
|
|
|
<?php |
|
|
|
if (!defined('DEDEINC')) exit ('dedebiz'); |
|
|
|
if (!defined('DEDEINC')) exit('dedebiz'); |
|
|
|
/* |
|
|
|
* This file is part of Crawler Detect - the web crawler detection library. |
|
|
|
* |
|
|
@@ -8,7 +8,7 @@ if (!defined('DEDEINC')) exit ('dedebiz'); |
|
|
|
* This source file is subject to the MIT license that is bundled |
|
|
|
* with this source code in the file LICENSE. |
|
|
|
*/ |
|
|
|
require_once(DEDEINC."/libraries/fixtures/abstractprovider.php"); |
|
|
|
require_once(DEDEINC . "/libraries/fixtures/abstractprovider.php"); |
|
|
|
|
|
|
|
class Crawlers extends AbstractProvider |
|
|
|
{ |
|
|
@@ -22,6 +22,7 @@ class Crawlers extends AbstractProvider |
|
|
|
'^Aether', |
|
|
|
'^Amazon Simple Notification Service Agent$', |
|
|
|
'^Amazon-Route53-Health-Check-Service', |
|
|
|
'^Amazon CloudFront', |
|
|
|
'^b0t$', |
|
|
|
'^bluefish ', |
|
|
|
'^Calypso v\/', |
|
|
@@ -57,6 +58,7 @@ class Crawlers extends AbstractProvider |
|
|
|
'^pnpm\/', |
|
|
|
'^RMA\/', |
|
|
|
'^Ruby|Ruby\/[0-9]', |
|
|
|
"^symbolicator\\/", |
|
|
|
'^Swurl ', |
|
|
|
'^TLS tester ', |
|
|
|
'^twine\/', |
|
|
@@ -159,7 +161,6 @@ class Crawlers extends AbstractProvider |
|
|
|
'a\.pr-cy\.ru', |
|
|
|
'B-l-i-t-z-B-O-T', |
|
|
|
'Backlink-Ceck', |
|
|
|
'backlink-check', |
|
|
|
'BacklinkHttpStatus', |
|
|
|
'BackStreet', |
|
|
|
'BackupLand', |
|
|
@@ -168,6 +169,7 @@ class Crawlers extends AbstractProvider |
|
|
|
'Badass', |
|
|
|
'baidu\.com', |
|
|
|
'Bandit', |
|
|
|
'Barracuda Sentinel \(EE\)', |
|
|
|
'basicstate', |
|
|
|
'BatchFTP', |
|
|
|
'Battleztar Bazinga', |
|
|
@@ -208,7 +210,6 @@ class Crawlers extends AbstractProvider |
|
|
|
'Branch Metrics API', |
|
|
|
'Branch-Passthrough', |
|
|
|
'Brandprotect', |
|
|
|
'BrandVerity', |
|
|
|
'Brandwatch', |
|
|
|
'Brodie\/', |
|
|
|
'Browsershots', |
|
|
@@ -222,6 +223,7 @@ class Crawlers extends AbstractProvider |
|
|
|
'Butterfly\/', |
|
|
|
'BuzzSumo', |
|
|
|
'CAAM\/[0-9]', |
|
|
|
'caam dot crwlr at gmail dot com', |
|
|
|
'CakePHP', |
|
|
|
'Calculon', |
|
|
|
'Canary%20Mail', |
|
|
@@ -294,6 +296,7 @@ class Crawlers extends AbstractProvider |
|
|
|
'DareBoost', |
|
|
|
'DatabaseDriverMysqli', |
|
|
|
'DataCha0s', |
|
|
|
'DatadogSynthetics', |
|
|
|
'Datafeedwatch', |
|
|
|
'Datanyze', |
|
|
|
'DataparkSearch', |
|
|
@@ -374,6 +377,7 @@ class Crawlers extends AbstractProvider |
|
|
|
'Extreme Picture Finder', |
|
|
|
'EyeNetIE', |
|
|
|
'ezooms', |
|
|
|
'facebookcatalog', |
|
|
|
'facebookexternalhit', |
|
|
|
'facebookexternalua', |
|
|
|
'facebookplatform', |
|
|
@@ -420,16 +424,20 @@ class Crawlers extends AbstractProvider |
|
|
|
'Flunky', |
|
|
|
'flynxapp', |
|
|
|
'forensiq', |
|
|
|
'ForusP', |
|
|
|
'FoundSeoTool', |
|
|
|
'free gallery', |
|
|
|
'fragFINN\.de', |
|
|
|
'free thumbnails', |
|
|
|
'Freeuploader', |
|
|
|
'FreshRSS', |
|
|
|
'frontman', |
|
|
|
'Funnelback', |
|
|
|
'Fuzz Faster U Fool', |
|
|
|
'G-i-g-a-b-o-t', |
|
|
|
'g00g1e\.net', |
|
|
|
'ganarvisitas', |
|
|
|
'gdnplus\.com', |
|
|
|
'GeedoProductSearch', |
|
|
|
'geek-tools', |
|
|
|
'Genieo', |
|
|
|
'GentleSource', |
|
|
@@ -471,13 +479,13 @@ class Crawlers extends AbstractProvider |
|
|
|
'Google PP Default', |
|
|
|
'Google Search Console', |
|
|
|
'Google Web Preview', |
|
|
|
'Google-Ads-Creatives-Assistant', |
|
|
|
'Google-Ads-Overview', |
|
|
|
'Google-Ads', |
|
|
|
'Google-Adwords', |
|
|
|
'Google-Apps-Script', |
|
|
|
'Google-Calendar-Importer', |
|
|
|
'Google-HotelAdsVerifier', |
|
|
|
'Google-HTTP-Java-Client', |
|
|
|
'Google-InspectionTool', |
|
|
|
'Google-Podcast', |
|
|
|
'Google-Publisher-Plugin', |
|
|
|
'Google-Read-Aloud', |
|
|
@@ -491,6 +499,7 @@ class Crawlers extends AbstractProvider |
|
|
|
'Google-Youtube-Links', |
|
|
|
'GoogleDocs', |
|
|
|
'GoogleHC\/', |
|
|
|
'GoogleOther', |
|
|
|
'GoogleProber', |
|
|
|
'GoogleProducer', |
|
|
|
'GoogleSites', |
|
|
@@ -524,7 +533,6 @@ class Crawlers extends AbstractProvider |
|
|
|
'Hatena', |
|
|
|
'Havij', |
|
|
|
'HaxerMen', |
|
|
|
'HeadlessChrome', |
|
|
|
'HEADMasterSEO', |
|
|
|
'HeartRails_Capture', |
|
|
|
'help@dataminr\.com', |
|
|
@@ -552,7 +560,7 @@ class Crawlers extends AbstractProvider |
|
|
|
'http-request\/', |
|
|
|
'HTTP-Tiny', |
|
|
|
'HTTP::Lite', |
|
|
|
'http:\/\/www.neomo.de\/', //'Francis [Bot]' |
|
|
|
'http:\/\/www.neomo.de\/', // 'Francis [Bot]' |
|
|
|
'HttpComponents', |
|
|
|
'httphr', |
|
|
|
'HTTPie', |
|
|
@@ -614,6 +622,7 @@ class Crawlers extends AbstractProvider |
|
|
|
'intraVnews', |
|
|
|
'IODC', |
|
|
|
'IOI', |
|
|
|
'Inboxb0t', |
|
|
|
'iplabel', |
|
|
|
'ips-agent', |
|
|
|
'IPS\/[0-9]', |
|
|
@@ -662,6 +671,7 @@ class Crawlers extends AbstractProvider |
|
|
|
'knows\.is', |
|
|
|
'KOCMOHABT', |
|
|
|
'kouio', |
|
|
|
'krawler\.dk', |
|
|
|
'kube-probe', |
|
|
|
'kubectl', |
|
|
|
'kulturarw3', |
|
|
@@ -686,6 +696,7 @@ class Crawlers extends AbstractProvider |
|
|
|
'Link Valet', |
|
|
|
'LinkAlarm\/', |
|
|
|
'LinkAnalyser', |
|
|
|
'link-check', |
|
|
|
'linkCheck', |
|
|
|
'linkdex', |
|
|
|
'LinkExaminer', |
|
|
@@ -706,6 +717,7 @@ class Crawlers extends AbstractProvider |
|
|
|
'longurl-r-package', |
|
|
|
'looid\.com', |
|
|
|
'looksystems\.net', |
|
|
|
'lscache_runner', |
|
|
|
'ltx71', |
|
|
|
'lua-resty-http', |
|
|
|
'Lucee \(CFML Engine\)', |
|
|
@@ -718,6 +730,7 @@ class Crawlers extends AbstractProvider |
|
|
|
'L\.webis', |
|
|
|
'mabontland', |
|
|
|
'MacOutlook\/', |
|
|
|
'MagentaNews\/', |
|
|
|
'Mag-Net', |
|
|
|
'MagpieRSS', |
|
|
|
'Mail::STS', |
|
|
@@ -734,6 +747,7 @@ class Crawlers extends AbstractProvider |
|
|
|
'masscan\/', |
|
|
|
'Mata Hari', |
|
|
|
'mattermost', |
|
|
|
'MatchorySearch\/', |
|
|
|
'Mediametric', |
|
|
|
'Mediapartners-Google', |
|
|
|
'mediawords', |
|
|
@@ -751,6 +765,7 @@ class Crawlers extends AbstractProvider |
|
|
|
'Microsoft Windows Network Diagnostics', |
|
|
|
'Microsoft-WebDAV-MiniRedir', |
|
|
|
'Microsoft\.Data\.Mashup', |
|
|
|
'MicrosoftPreview', |
|
|
|
'MIDown tool', |
|
|
|
'MIIxpc', |
|
|
|
'Mindjet', |
|
|
@@ -766,10 +781,12 @@ class Crawlers extends AbstractProvider |
|
|
|
'mogimogi', |
|
|
|
'Mojeek', |
|
|
|
'Mojolicious \(Perl\)', |
|
|
|
'Mollie', |
|
|
|
'monitis', |
|
|
|
'Monitority\/', |
|
|
|
'Monit\/', |
|
|
|
'montastic', |
|
|
|
'MonSpark', |
|
|
|
'MonTools', |
|
|
|
'Moreover', |
|
|
|
'Morfeus Fucking Scanner', |
|
|
@@ -793,6 +810,7 @@ class Crawlers extends AbstractProvider |
|
|
|
'Nameprotect', |
|
|
|
'nationalarchives', |
|
|
|
'Navroad', |
|
|
|
'nbertaupete95', |
|
|
|
'NearSite', |
|
|
|
'Needle', |
|
|
|
'Nessus', |
|
|
@@ -947,6 +965,7 @@ class Crawlers extends AbstractProvider |
|
|
|
'PrintFriendly', |
|
|
|
'PritTorrent', |
|
|
|
'Prlog', |
|
|
|
'probely\.com', |
|
|
|
'probethenet', |
|
|
|
'Project ?25499', |
|
|
|
'Project-Resonance', |
|
|
@@ -958,6 +977,7 @@ class Crawlers extends AbstractProvider |
|
|
|
'pshtt, https scanning', |
|
|
|
'PTST ', |
|
|
|
'PTST\/[0-9]+', |
|
|
|
'pulsetic\.com', |
|
|
|
'Pump', |
|
|
|
'Python-httplib2', |
|
|
|
'python-httpx', |
|
|
@@ -1006,6 +1026,7 @@ class Crawlers extends AbstractProvider |
|
|
|
'RPT-HTTPClient', |
|
|
|
'RSSMix\/', |
|
|
|
'RSSOwl', |
|
|
|
'RuxitSynthetic', |
|
|
|
'RyowlEngine', |
|
|
|
'safe-agent-scanner', |
|
|
|
'SalesIntelligent', |
|
|
@@ -1050,6 +1071,7 @@ class Crawlers extends AbstractProvider |
|
|
|
'Seobility', |
|
|
|
'SEOCentro', |
|
|
|
'SeoCheck', |
|
|
|
'seocompany', |
|
|
|
'SEOkicks', |
|
|
|
'SEOlizer', |
|
|
|
'Seomoz', |
|
|
@@ -1119,9 +1141,11 @@ class Crawlers extends AbstractProvider |
|
|
|
'SpamExperts', |
|
|
|
'Spammen', |
|
|
|
'Spanner', |
|
|
|
'Spawning-AI', |
|
|
|
'spaziodati', |
|
|
|
'SPDYCheck', |
|
|
|
'Specificfeeds', |
|
|
|
'SpeedKit', |
|
|
|
'speedy', |
|
|
|
'SPEng', |
|
|
|
'Spinn3r', |
|
|
@@ -1244,9 +1268,11 @@ class Crawlers extends AbstractProvider |
|
|
|
'VB Project', |
|
|
|
'vBSEO', |
|
|
|
'VCI', |
|
|
|
'Verity', |
|
|
|
'via ggpht\.com GoogleImageProxy', |
|
|
|
'Virusdie', |
|
|
|
'visionutils', |
|
|
|
'Visual Rights Group', |
|
|
|
'vkShare', |
|
|
|
'VoidEYE', |
|
|
|
'Voil', |
|
|
@@ -1394,6 +1420,7 @@ class Crawlers extends AbstractProvider |
|
|
|
'Zabbix', |
|
|
|
'Zade', |
|
|
|
'Zao', |
|
|
|
'Zapier', |
|
|
|
'Zauba', |
|
|
|
'Zemanta Aggregator', |
|
|
|
'Zend\\\\Http\\\\Client', |
|
|
@@ -1407,6 +1434,6 @@ class Crawlers extends AbstractProvider |
|
|
|
'Zoom\.Mac', |
|
|
|
'ZoteroTranslationServer', |
|
|
|
'ZyBorg', |
|
|
|
'[a-z0-9\-_]*(bot|crawl|archiver|transcoder|spider|uptime|validator|fetcher|cron|checker|reader|extractor|monitoring|analyzer|scraper)', |
|
|
|
'[a-z0-9\-_]*(bot|crawl|headless|archiver|transcoder|spider|uptime|validator|fetcher|cron|checker|reader|extractor|monitoring|analyzer|scraper)', |
|
|
|
); |
|
|
|
} |
|
|
|
} |