File manager - Edit - /home/autoph/public_html/projects/Rating-AutoHub/public/css/jaybizzle.tar
Back
crawler-detect/composer.json 0000644 00000001437 15025017654 0012205 0 ustar 00 { "name": "jaybizzle/crawler-detect", "type": "library", "description": "CrawlerDetect is a PHP class for detecting bots/crawlers/spiders via the user agent", "keywords": ["crawler", "crawler detect", "crawler detector", "crawlerdetect", "php crawler detect"], "homepage": "https://github.com/JayBizzle/Crawler-Detect/", "license": "MIT", "authors": [ { "name": "Mark Beech", "email": "m@rkbee.ch", "role": "Developer" } ], "require": { "php": ">=5.3.0" }, "require-dev": { "phpunit/phpunit": "^4.8|^5.5|^6.5|^9.4" }, "autoload": { "psr-4": { "Jaybizzle\\CrawlerDetect\\": "src/" } }, "scripts": { "test": "vendor/bin/phpunit" } } crawler-detect/src/CrawlerDetect.php 0000644 00000010274 15025017654 0013512 0 ustar 00 <?php /* * This file is part of Crawler Detect - the web crawler detection library. * * (c) Mark Beech <m@rkbee.ch> * * This source file is subject to the MIT license that is bundled * with this source code in the file LICENSE. */ namespace Jaybizzle\CrawlerDetect; use Jaybizzle\CrawlerDetect\Fixtures\Crawlers; use Jaybizzle\CrawlerDetect\Fixtures\Exclusions; use Jaybizzle\CrawlerDetect\Fixtures\Headers; class CrawlerDetect { /** * The user agent. * * @var string|null */ protected $userAgent; /** * Headers that contain a user agent. * * @var array */ protected $httpHeaders = array(); /** * Store regex matches. * * @var array */ protected $matches = array(); /** * Crawlers object. * * @var \Jaybizzle\CrawlerDetect\Fixtures\Crawlers */ protected $crawlers; /** * Exclusions object. * * @var \Jaybizzle\CrawlerDetect\Fixtures\Exclusions */ protected $exclusions; /** * Headers object. * * @var \Jaybizzle\CrawlerDetect\Fixtures\Headers */ protected $uaHttpHeaders; /** * The compiled regex string. * * @var string */ protected $compiledRegex; /** * The compiled exclusions regex string. * * @var string */ protected $compiledExclusions; /** * Class constructor. */ public function __construct(array $headers = null, $userAgent = null) { $this->crawlers = new Crawlers(); $this->exclusions = new Exclusions(); $this->uaHttpHeaders = new Headers(); $this->compiledRegex = $this->compileRegex($this->crawlers->getAll()); $this->compiledExclusions = $this->compileRegex($this->exclusions->getAll()); $this->setHttpHeaders($headers); $this->setUserAgent($userAgent); } /** * Compile the regex patterns into one regex string. * * @param array * * @return string */ public function compileRegex($patterns) { return '('.implode('|', $patterns).')'; } /** * Set HTTP headers. * * @param array|null $httpHeaders */ public function setHttpHeaders($httpHeaders) { // Use global _SERVER if $httpHeaders aren't defined. if (! is_array($httpHeaders) || ! count($httpHeaders)) { $httpHeaders = $_SERVER; } // Clear existing headers. $this->httpHeaders = array(); // Only save HTTP headers. In PHP land, that means // only _SERVER vars that start with HTTP_. foreach ($httpHeaders as $key => $value) { if (strpos($key, 'HTTP_') === 0) { $this->httpHeaders[$key] = $value; } } } /** * Return user agent headers. * * @return array */ public function getUaHttpHeaders() { return $this->uaHttpHeaders->getAll(); } /** * Set the user agent. * * @param string|null $userAgent */ public function setUserAgent($userAgent) { if (is_null($userAgent)) { foreach ($this->getUaHttpHeaders() as $altHeader) { if (isset($this->httpHeaders[$altHeader])) { $userAgent .= $this->httpHeaders[$altHeader].' '; } } } return $this->userAgent = $userAgent; } /** * Check user agent string against the regex. * * @param string|null $userAgent * * @return bool */ public function isCrawler($userAgent = null) { $agent = trim(preg_replace( "/{$this->compiledExclusions}/i", '', $userAgent ?: $this->userAgent ?: '' )); if ($agent === '') { return false; } return (bool) preg_match("/{$this->compiledRegex}/i", $agent, $this->matches); } /** * Return the matches. * * @return string|null */ public function getMatches() { return isset($this->matches[0]) ? $this->matches[0] : null; } /** * @return string|null */ public function getUserAgent() { return $this->userAgent; } } crawler-detect/src/Fixtures/Crawlers.php 0000644 00000100117 15025017654 0014351 0 ustar 00 <?php /* * This file is part of Crawler Detect - the web crawler detection library. * * (c) Mark Beech <m@rkbee.ch> * * This source file is subject to the MIT license that is bundled * with this source code in the file LICENSE. */ namespace Jaybizzle\CrawlerDetect\Fixtures; class Crawlers extends AbstractProvider { /** * Array of regular expressions to match against the user agent. * * @var array */ protected $data = array( ' YLT', '^Aether', '^Amazon Simple Notification Service Agent$', '^Amazon-Route53-Health-Check-Service', '^b0t$', '^bluefish ', '^Calypso v\/', '^COMODO DCV', '^Corax', '^DangDang', '^DavClnt', '^DHSH', '^docker\/[0-9]', '^Expanse', '^FDM ', '^git\/', '^Goose\/', '^Grabber', '^Gradle\/', '^HTTPClient\/', '^HTTPing', '^Java\/', '^Jeode\/', '^Jetty\/', '^Mail\/', '^Mget', '^Microsoft URL Control', '^Mikrotik\/', '^Netlab360', '^NG\/[0-9\.]', '^NING\/', '^npm\/', '^Nuclei', '^PHP-AYMAPI\/', '^PHP\/', '^pip\/', '^pnpm\/', '^RMA\/', '^Ruby|Ruby\/[0-9]', '^Swurl ', '^TLS tester ', '^twine\/', '^ureq', '^VSE\/[0-9]', '^WordPress\.com', '^XRL\/[0-9]', '^ZmEu', '008\/', '13TABS', '192\.comAgent', '2GDPR\/', '2ip\.ru', '404enemy', '7Siters', '80legs', 'a3logics\.in', 'A6-Indexer', 'Abonti', 'Aboundex', 'aboutthedomain', 'Accoona-AI-Agent', 'acebookexternalhit\/', 'acoon', 'acrylicapps\.com\/pulp', 'Acunetix', 'AdAuth\/', 'adbeat', 'AddThis', 'ADmantX', 'AdminLabs', 'adressendeutschland', 'adreview\/', 'adscanner', 'adstxt-worker', 'Adstxtaggregator', 'adstxt\.com', 'Adyen HttpClient', 'AffiliateLabz\/', 'affilimate-puppeteer', 'agentslug', 'AHC', 'aihit', 'aiohttp\/', 'Airmail', 'akka-http\/', 'akula\/', 'alertra', 'alexa site audit', 'Alibaba\.Security\.Heimdall', 'Alligator', 'allloadin', 'AllSubmitter', 'alyze\.info', 'amagit', 'Anarchie', 'AndroidDownloadManager', 'Anemone', 'AngleSharp', 'annotate_google', 'Anthill', 'Anturis Agent', 'Ant\.com', 'AnyEvent-HTTP\/', 'Apache Ant\/', 'Apache Droid', 'Apache OpenOffice', 'Apache-HttpAsyncClient', 'Apache-HttpClient', 'ApacheBench', 'Apexoo', 'apimon\.de', 'APIs-Google', 'AportWorm\/', 'AppBeat\/', 'AppEngine-Google', 'AppleSyndication', 'Aprc\/[0-9]', 'Arachmo', 'arachnode', 'Arachnophilia', 'aria2', 'Arukereso', 'asafaweb', 'Asana\/', 'Ask Jeeves', 'AskQuickly', 'ASPSeek', 'Asterias', 'Astute', 'asynchttp', 'Attach', 'attohttpc', 'autocite', 'AutomaticWPTester', 'Autonomy', 'awin\.com', 'AWS Security Scanner', 'axios\/', 'a\.pr-cy\.ru', 'B-l-i-t-z-B-O-T', 'Backlink-Ceck', 'backlink-check', 'BacklinkHttpStatus', 'BackStreet', 'BackupLand', 'BackWeb', 'Bad-Neighborhood', 'Badass', 'baidu\.com', 'Bandit', 'basicstate', 'BatchFTP', 'Battleztar Bazinga', 'baypup\/', 'BazQux', 'BBBike', 'BCKLINKS', 'BDFetch', 'BegunAdvertising', 'Bewica-security-scan', 'Bidtellect', 'BigBozz', 'Bigfoot', 'biglotron', 'BingLocalSearch', 'BingPreview', 'binlar', 'biNu image cacher', 'Bitacle', 'Bitrix link preview', 'biz_Directory', 'BKCTwitterUnshortener\/', 'Black Hole', 'Blackboard Safeassign', 'BlackWidow', 'BlockNote\.Net', 'BlogBridge', 'Bloglines', 'Bloglovin', 'BlogPulseLive', 'BlogSearch', 'Blogtrottr', 'BlowFish', 'boitho\.com-dc', 'Boost\.Beast', 'BPImageWalker', 'Braintree-Webhooks', 'Branch Metrics API', 'Branch-Passthrough', 'Brandprotect', 'BrandVerity', 'Brandwatch', 'Brodie\/', 'Browsershots', 'BUbiNG', 'Buck\/', 'Buddy', 'BuiltWith', 'Bullseye', 'BunnySlippers', 'Burf Search', 'Butterfly\/', 'BuzzSumo', 'CAAM\/[0-9]', 'CakePHP', 'Calculon', 'Canary%20Mail', 'CaretNail', 'catexplorador', 'CC Metadata Scaper', 'Cegbfeieh', 'censys', 'centuryb.o.t9[at]gmail.com', 'Cerberian Drtrs', 'CERT\.at-Statistics-Survey', 'cf-facebook', 'cg-eye', 'changedetection', 'ChangesMeter', 'Charlotte', 'chatterino-api-cache', 'CheckHost', 'checkprivacy', 'CherryPicker', 'ChinaClaw', 'Chirp\/', 'chkme\.com', 'Chlooe', 'Chromaxa', 'CirrusExplorer', 'CISPA Vulnerability Notification', 'CISPA Web Analyser', 'Citoid', 'CJNetworkQuality', 'Clarsentia', 'clips\.ua\.ac\.be', 'Cloud mapping', 'CloudEndure', 'CloudFlare-AlwaysOnline', 'Cloudflare-Healthchecks', 'Cloudinary', 'cmcm\.com', 'coccoc', 'cognitiveseo', 'ColdFusion', 'colly -', 'CommaFeed', 'Commons-HttpClient', 'commonscan', 'contactbigdatafr', 'contentkingapp', 'Contextual Code Sites Explorer', 'convera', 'CookieReports', 'copyright sheriff', 'CopyRightCheck', 'Copyscape', 'cortex\/', 'Cosmos4j\.feedback', 'Covario-IDS', 'Craw\/', 'Crescent', 'Criteo', 'Crowsnest', 'CSHttp', 'CSSCheck', 'Cula\/', 'curb', 'Curious George', 'curl', 'cuwhois\/', 'cybo\.com', 'DAP\/NetHTTP', 'DareBoost', 'DatabaseDriverMysqli', 'DataCha0s', 'DatadogSynthetics', 'Datafeedwatch', 'Datanyze', 'DataparkSearch', 'dataprovider', 'DataXu', 'Daum(oa)?[ \/][0-9]', 'dBpoweramp', 'ddline', 'deeris', 'delve\.ai', 'Demon', 'DeuSu', 'developers\.google\.com\/\+\/web\/snippet\/', 'Devil', 'Digg', 'Digincore', 'DigitalPebble', 'Dirbuster', 'Discourse Forum Onebox', 'Dispatch\/', 'Disqus\/', 'DittoSpyder', 'dlvr', 'DMBrowser', 'DNSPod-reporting', 'docoloc', 'Dolphin http client', 'DomainAppender', 'DomainLabz', 'Domains Project\/', 'Donuts Content Explorer', 'dotMailer content retrieval', 'dotSemantic', 'downforeveryoneorjustme', 'Download Wonder', 'downnotifier', 'DowntimeDetector', 'Drip', 'drupact', 'Drupal \(\+http:\/\/drupal\.org\/\)', 'DTS Agent', 'dubaiindex', 'DuplexWeb-Google', 'DynatraceSynthetic', 'EARTHCOM', 'Easy-Thumb', 'EasyDL', 'Ebingbong', 'ec2linkfinder', 'eCairn-Grabber', 'eCatch', 'ECCP', 'eContext\/', 'Ecxi', 'EirGrabber', 'ElectricMonk', 'elefent', 'EMail Exractor', 'EMail Wolf', 'EmailWolf', 'Embarcadero', 'Embed PHP Library', 'Embedly', 'endo\/', 'europarchive\.org', 'evc-batch', 'EventMachine HttpClient', 'Everwall Link Expander', 'Evidon', 'Evrinid', 'ExactSearch', 'ExaleadCloudview', 'Excel\/', 'exif', 'ExoRank', 'Exploratodo', 'Express WebPictures', 'Extreme Picture Finder', 'EyeNetIE', 'ezooms', 'facebookexternalhit', 'facebookexternalua', 'facebookplatform', 'fairshare', 'Faraday v', 'fasthttp', 'Faveeo', 'Favicon downloader', 'faviconarchive', 'faviconkit', 'FavOrg', 'Feed Wrangler', 'Feedable\/', 'Feedbin', 'FeedBooster', 'FeedBucket', 'FeedBunch\/', 'FeedBurner', 'feeder', 'Feedly', 'FeedshowOnline', 'Feedshow\/', 'Feedspot', 'FeedViewer\/', 'Feedwind\/', 'FeedZcollector', 'feeltiptop', 'Fetch API', 'Fetch\/[0-9]', 'Fever\/[0-9]', 'FHscan', 'Fiery%20Feeds', 'Filestack', 'Fimap', 'findlink', 'findthatfile', 'FlashGet', 'FlipboardBrowserProxy', 'FlipboardProxy', 'FlipboardRSS', 'Flock\/', 'Florienzh\/', 'fluffy', 'Flunky', 'flynxapp', 'forensiq', 'ForusP', 'FoundSeoTool', 'free thumbnails', 'Freeuploader', 'FreshRSS', 'frontman', 'Funnelback', 'Fuzz Faster U Fool', 'G-i-g-a-b-o-t', 'g00g1e\.net', 'ganarvisitas', 'gdnplus\.com', 'geek-tools', 'Genieo', 'GentleSource', 'GetCode', 'Getintent', 'GetLinkInfo', 'getprismatic', 'GetRight', 'getroot', 'GetURLInfo\/', 'GetWeb', 'Geziyor', 'Ghost Inspector', 'GigablastOpenSource', 'GIS-LABS', 'github-camo', 'GitHub-Hookshot', 'github\.com', 'Go http package', 'Go [\d\.]* package http', 'Go!Zilla', 'Go-Ahead-Got-It', 'Go-http-client', 'go-mtasts\/', 'gobuster', 'gobyus', 'Gofeed', 'gofetch', 'Goldfire Server', 'GomezAgent', 'gooblog', 'Goodzer\/', 'Google AppsViewer', 'Google Desktop', 'Google favicon', 'Google Keyword Suggestion', 'Google Keyword Tool', 'Google Page Speed Insights', 'Google PP Default', 'Google Search Console', 'Google Web Preview', 'Google-Ads-Creatives-Assistant', 'Google-Ads-Overview', 'Google-Adwords', 'Google-Apps-Script', 'Google-Calendar-Importer', 'Google-HotelAdsVerifier', 'Google-HTTP-Java-Client', 'Google-Podcast', 'Google-Publisher-Plugin', 'Google-Read-Aloud', 'Google-SearchByImage', 'Google-Site-Verification', 'Google-SMTP-STS', 'Google-speakr', 'Google-Structured-Data-Testing-Tool', 'Google-Transparency-Report', 'google-xrawler', 'Google-Youtube-Links', 'GoogleDocs', 'GoogleHC\/', 'GoogleProber', 'GoogleProducer', 'GoogleSites', 'Gookey', 'GoSpotCheck', 'gosquared-thumbnailer', 'Gotit', 'GoZilla', 'grabify', 'GrabNet', 'Grafula', 'Grammarly', 'GrapeFX', 'GreatNews', 'Gregarius', 'GRequests', 'grokkit', 'grouphigh', 'grub-client', 'gSOAP\/', 'GT::WWW', 'GTmetrix', 'GuzzleHttp', 'gvfs\/', 'HAA(A)?RTLAND http client', 'Haansoft', 'hackney\/', 'Hadi Agent', 'HappyApps-WebCheck', 'Hardenize', 'Hatena', 'Havij', 'HaxerMen', 'HeadlessChrome', 'HEADMasterSEO', 'HeartRails_Capture', 'help@dataminr\.com', 'heritrix', 'Hexometer', 'historious', 'hkedcity', 'hledejLevne\.cz', 'Hloader', 'HMView', 'Holmes', 'HonesoSearchEngine', 'HootSuite Image proxy', 'Hootsuite-WebFeed', 'hosterstats', 'HostTracker', 'ht:\/\/check', 'htdig', 'HTMLparser', 'htmlyse', 'HTTP Banner Detection', 'http-get', 'HTTP-Header-Abfrage', 'http-kit', 'http-request\/', 'HTTP-Tiny', 'HTTP::Lite', 'http:\/\/www.neomo.de\/', //'Francis [Bot]' 'HttpComponents', 'httphr', 'HTTPie', 'HTTPMon', 'httpRequest', 'httpscheck', 'httpssites_power', 'httpunit', 'HttpUrlConnection', 'http\.rb\/', 'HTTP_Compression_Test', 'http_get', 'http_request2', 'http_requester', 'httrack', 'huaweisymantec', 'HubSpot ', 'HubSpot-Link-Resolver', 'Humanlinks', 'i2kconnect\/', 'Iblog', 'ichiro', 'Id-search', 'IdeelaborPlagiaat', 'IDG Twitter Links Resolver', 'IDwhois\/', 'Iframely', 'igdeSpyder', 'iGooglePortal', 'IlTrovatore', 'Image Fetch', 'Image Sucker', 'ImageEngine\/', 'ImageVisu\/', 'Imagga', 'imagineeasy', 'imgsizer', 'InAGist', 'inbound\.li parser', 'InDesign%20CC', 'Indy Library', 'InetURL', 'infegy', 'infohelfer', 'InfoTekies', 'InfoWizards Reciprocal Link', 'inpwrd\.com', 'instabid', 'Instapaper', 'Integrity', 'integromedb', 'Intelliseek', 'InterGET', 'Internet Ninja', 'InternetSeer', 'internetVista monitor', 'internetwache', 'internet_archive', 'intraVnews', 'IODC', 'IOI', 'iplabel', 'ips-agent', 'IPS\/[0-9]', 'IPWorks HTTP\/S Component', 'iqdb\/', 'Iria', 'Irokez', 'isitup\.org', 'iskanie', 'isUp\.li', 'iThemes Sync\/', 'IZaBEE', 'iZSearch', 'JAHHO', 'janforman', 'Jaunt\/', 'Java.*outbrain', 'javelin\.io', 'Jbrofuzz', 'Jersey\/', 'JetCar', 'Jigsaw', 'Jobboerse', 'JobFeed discovery', 'Jobg8 URL Monitor', 'jobo', 'Jobrapido', 'Jobsearch1\.5', 'JoinVision Generic', 'JolokiaPwn', 'Joomla', 'Jorgee', 'JS-Kit', 'JungleKeyThumbnail', 'JustView', 'Kaspersky Lab CFR link resolver', 'Kelny\/', 'Kerrigan\/', 'KeyCDN', 'Keyword Density', 'Keywords Research', 'khttp\/', 'KickFire', 'KimonoLabs\/', 'Kml-Google', 'knows\.is', 'KOCMOHABT', 'kouio', 'kube-probe', 'kubectl', 'kulturarw3', 'KumKie', 'Larbin', 'Lavf\/', 'leakix\.net', 'LeechFTP', 'LeechGet', 'letsencrypt', 'Lftp', 'LibVLC', 'LibWeb', 'Libwhisker', 'libwww', 'Licorne', 'Liferea\/', 'Lighthouse', 'Lightspeedsystems', 'Likse', 'limber\.io', 'Link Valet', 'LinkAlarm\/', 'LinkAnalyser', 'linkCheck', 'linkdex', 'LinkExaminer', 'linkfluence', 'linkpeek', 'LinkPreview', 'LinkScan', 'LinksManager', 'LinkTiger', 'LinkWalker', 'link_thumbnailer', 'Lipperhey', 'Litemage_walker', 'livedoor ScreenShot', 'LoadImpactRload', 'localsearch-web', 'LongURL API', 'longurl-r-package', 'looid\.com', 'looksystems\.net', 'ltx71', 'lua-resty-http', 'Lucee \(CFML Engine\)', 'Lush Http Client', 'lwp-request', 'lwp-trivial', 'LWP::Simple', 'lycos', 'LYT\.SR', 'L\.webis', 'mabontland', 'MacOutlook\/', 'Mag-Net', 'MagpieRSS', 'Mail::STS', 'MailChimp', 'Mail\.Ru', 'Majestic12', 'makecontact\/', 'Mandrill', 'MapperCmd', 'marketinggrader', 'MarkMonitor', 'MarkWatch', 'Mass Downloader', 'masscan\/', 'Mata Hari', 'mattermost', 'Mediametric', 'Mediapartners-Google', 'mediawords', 'MegaIndex\.ru', 'MeltwaterNews', 'Melvil Rawi', 'MemGator', 'Metaspinner', 'MetaURI', 'MFC_Tear_Sample', 'Microsearch', 'Microsoft Data Access', 'Microsoft Office', 'Microsoft Outlook', 'Microsoft Windows Network Diagnostics', 'Microsoft-WebDAV-MiniRedir', 'Microsoft\.Data\.Mashup', 'MIDown tool', 'MIIxpc', 'Mindjet', 'Miniature\.io', 'Miniflux', 'mio_httpc', 'Miro-HttpClient', 'Mister PiX', 'mixdata dot com', 'mixed-content-scan', 'mixnode', 'Mnogosearch', 'mogimogi', 'Mojeek', 'Mojolicious \(Perl\)', 'Mollie', 'monitis', 'Monitority\/', 'Monit\/', 'montastic', 'MonTools', 'Moreover', 'Morfeus Fucking Scanner', 'Morning Paper', 'MovableType', 'mowser', 'Mrcgiguy', 'Mr\.4x3 Powered', 'MS Web Services Client Protocol', 'MSFrontPage', 'mShots', 'MuckRack\/', 'muhstik-scan', 'MVAClient', 'MxToolbox\/', 'myseosnapshot', 'nagios', 'Najdi\.si', 'Name Intelligence', 'NameFo\.com', 'Nameprotect', 'nationalarchives', 'Navroad', 'NearSite', 'Needle', 'Nessus', 'Net Vampire', 'NetAnts', 'NETCRAFT', 'NetLyzer', 'NetMechanic', 'NetNewsWire', 'Netpursual', 'netresearch', 'NetShelter ContentScan', 'Netsparker', 'NetSystemsResearch', 'nettle', 'NetTrack', 'Netvibes', 'NetZIP', 'Neustar WPM', 'NeutrinoAPI', 'NewRelicPinger', 'NewsBlur .*Finder', 'NewsGator', 'newsme', 'newspaper\/', 'Nexgate Ruby Client', 'NG-Search', 'nghttp2', 'Nibbler', 'NICErsPRO', 'NihilScio', 'Nikto', 'nineconnections', 'NLNZ_IAHarvester', 'Nmap Scripting Engine', 'node-fetch', 'node-superagent', 'node-urllib', 'Nodemeter', 'NodePing', 'node\.io', 'nominet\.org\.uk', 'nominet\.uk', 'Norton-Safeweb', 'Notifixious', 'notifyninja', 'NotionEmbedder', 'nuhk', 'nutch', 'Nuzzel', 'nWormFeedFinder', 'nyawc\/', 'Nymesis', 'NYU', 'Observatory\/', 'Ocelli\/', 'Octopus', 'oegp', 'Offline Explorer', 'Offline Navigator', 'OgScrper', 'okhttp', 'omgili', 'OMSC', 'Online Domain Tools', 'Open Source RSS', 'OpenCalaisSemanticProxy', 'Openfind', 'OpenLinkProfiler', 'Openstat\/', 'OpenVAS', 'OPPO A33', 'Optimizer', 'Orbiter', 'OrgProbe\/', 'orion-semantics', 'Outlook-Express', 'Outlook-iOS', 'Owler', 'Owlin', 'ownCloud News', 'ow\.ly', 'OxfordCloudService', 'page scorer', 'Page Valet', 'page2rss', 'PageFreezer', 'PageGrabber', 'PagePeeker', 'PageScorer', 'Pagespeed\/', 'PageThing', 'page_verifier', 'Panopta', 'panscient', 'Papa Foto', 'parsijoo', 'Pavuk', 'PayPal IPN', 'pcBrowser', 'Pcore-HTTP', 'PDF24 URL To PDF', 'Pearltrees', 'PECL::HTTP', 'peerindex', 'Peew', 'PeoplePal', 'Perlu -', 'PhantomJS Screenshoter', 'PhantomJS\/', 'Photon\/', 'php-requests', 'phpservermon', 'Pi-Monster', 'Picscout', 'Picsearch', 'PictureFinder', 'Pimonster', 'Pingability', 'PingAdmin\.Ru', 'Pingdom', 'Pingoscope', 'PingSpot', 'ping\.blo\.gs', 'pinterest\.com', 'Pixray', 'Pizilla', 'Plagger\/', 'Pleroma ', 'Ploetz \+ Zeller', 'Plukkie', 'plumanalytics', 'PocketImageCache', 'PocketParser', 'Pockey', 'PodcastAddict\/', 'POE-Component-Client-HTTP', 'Polymail\/', 'Pompos', 'Porkbun', 'Port Monitor', 'postano', 'postfix-mta-sts-resolver', 'PostmanRuntime', 'postplanner\.com', 'PostPost', 'postrank', 'PowerPoint\/', 'Prebid', 'Prerender', 'Priceonomics Analysis Engine', 'PrintFriendly', 'PritTorrent', 'Prlog', 'probethenet', 'Project ?25499', 'Project-Resonance', 'prospectb2b', 'Protopage', 'ProWebWalker', 'proximic', 'PRTG Network Monitor', 'pshtt, https scanning', 'PTST ', 'PTST\/[0-9]+', 'Pump', 'Python-httplib2', 'python-httpx', 'python-requests', 'Python-urllib', 'Qirina Hurdler', 'QQDownload', 'QrafterPro', 'Qseero', 'Qualidator', 'QueryN Metasearch', 'queuedriver', 'quic-go-HTTP\/', 'QuiteRSS', 'Quora Link Preview', 'Qwantify', 'Radian6', 'RadioPublicImageResizer', 'Railgun\/', 'RankActive', 'RankFlex', 'RankSonicSiteAuditor', 'RapidLoad\/', 'Re-re Studio', 'ReactorNetty', 'Readability', 'RealDownload', 'RealPlayer%20Downloader', 'RebelMouse', 'Recorder', 'RecurPost\/', 'redback\/', 'ReederForMac', 'Reeder\/', 'ReGet', 'RepoMonkey', 'request\.js', 'reqwest\/', 'ResponseCodeTest', 'RestSharp', 'Riddler', 'Rival IQ', 'Robosourcer', 'Robozilla', 'ROI Hunter', 'RPT-HTTPClient', 'RSSMix\/', 'RSSOwl', 'RyowlEngine', 'safe-agent-scanner', 'SalesIntelligent', 'Saleslift', 'SAP NetWeaver Application Server', 'SauceNAO', 'SBIder', 'sc-downloader', 'scalaj-http', 'Scamadviser-Frontend', 'ScanAlert', 'scan\.lol', 'Scoop', 'scooter', 'ScopeContentAG-HTTP-Client', 'ScoutJet', 'ScoutURLMonitor', 'ScrapeBox Page Scanner', 'Scrapy', 'Screaming', 'ScreenShotService', 'Scrubby', 'Scrutiny\/', 'Search37', 'searchenginepromotionhelp', 'Searchestate', 'SearchExpress', 'SearchSight', 'SearchWP', 'search\.thunderstone', 'Seeker', 'semanticdiscovery', 'semanticjuice', 'Semiocast HTTP client', 'Semrush', 'Sendsay\.Ru', 'sentry\/', 'SEO Browser', 'Seo Servis', 'seo-nastroj\.cz', 'seo4ajax', 'Seobility', 'SEOCentro', 'SeoCheck', 'seocompany', 'SEOkicks', 'SEOlizer', 'Seomoz', 'SEOprofiler', 'seoscanners', 'SEOsearch', 'seositecheckup', 'SEOstats', 'servernfo', 'sexsearcher', 'Seznam', 'Shelob', 'Shodan', 'Shoppimon', 'ShopWiki', 'ShortLinkTranslate', 'shortURL lengthener', 'shrinktheweb', 'Sideqik', 'Siege', 'SimplePie', 'SimplyFast', 'Siphon', 'SISTRIX', 'Site Sucker', 'Site-Shot\/', 'Site24x7', 'SiteBar', 'Sitebeam', 'Sitebulb\/', 'SiteCondor', 'SiteExplorer', 'SiteGuardian', 'Siteimprove', 'SiteIndexed', 'Sitemap(s)? Generator', 'SitemapGenerator', 'SiteMonitor', 'Siteshooter B0t', 'SiteSnagger', 'SiteSucker', 'SiteTruth', 'Sitevigil', 'sitexy\.com', 'SkypeUriPreview', 'Slack\/', 'sli-systems\.com', 'slider\.com', 'slurp', 'SlySearch', 'SmartDownload', 'SMRF URL Expander', 'SMUrlExpander', 'Snake', 'Snappy', 'SnapSearch', 'Snarfer\/', 'SniffRSS', 'sniptracker', 'Snoopy', 'SnowHaze Search', 'sogou web', 'SortSite', 'Sottopop', 'sovereign\.ai', 'SpaceBison', 'SpamExperts', 'Spammen', 'Spanner', 'spaziodati', 'SPDYCheck', 'Specificfeeds', 'speedy', 'SPEng', 'Spinn3r', 'spray-can', 'Sprinklr ', 'spyonweb', 'sqlmap', 'Sqlworm', 'Sqworm', 'SSL Labs', 'ssl-tools', 'StackRambler', 'Statastico\/', 'Statically-', 'StatusCake', 'Steeler', 'Stratagems Kumo', 'Stripe\/', 'Stroke\.cz', 'StudioFACA', 'StumbleUpon', 'suchen', 'Sucuri', 'summify', 'SuperHTTP', 'Surphace Scout', 'Suzuran', 'swcd ', 'Symfony BrowserKit', 'Symfony2 BrowserKit', 'Synapse\/', 'Syndirella\/', 'SynHttpClient-Built', 'Sysomos', 'sysscan', 'Szukacz', 'T0PHackTeam', 'tAkeOut', 'Tarantula\/', 'Taringa UGC', 'TarmotGezgin', 'tchelebi\.io', 'techiaith\.cymru', 'Teleport', 'Telesoft', 'Telesphoreo', 'Telesphorep', 'Tenon\.io', 'teoma', 'terrainformatica', 'Test Certificate Info', 'testuri', 'Tetrahedron', 'TextRazor Downloader', 'The Drop Reaper', 'The Expert HTML Source Viewer', 'The Intraformant', 'The Knowledge AI', 'theinternetrules', 'TheNomad', 'Thinklab', 'Thumbor', 'Thumbshots', 'ThumbSniper', 'timewe\.net', 'TinEye', 'Tiny Tiny RSS', 'TLSProbe\/', 'Toata', 'topster', 'touche\.com', 'Traackr\.com', 'tracemyfile', 'Trackuity', 'TrapitAgent', 'Trendiction', 'Trendsmap', 'trendspottr', 'truwoGPS', 'TryJsoup', 'TulipChain', 'Turingos', 'Turnitin', 'tweetedtimes', 'Tweetminster', 'Tweezler\/', 'twibble', 'Twice', 'Twikle', 'Twingly', 'Twisted PageGetter', 'Typhoeus', 'ubermetrics-technologies', 'uclassify', 'UdmSearch', 'ultimate_sitemap_parser', 'unchaos', 'unirest-java', 'UniversalFeedParser', 'unshortenit', 'Unshorten\.It', 'Untiny', 'UnwindFetchor', 'updated', 'updown\.io daemon', 'Upflow', 'Uptimia', 'URL Verifier', 'Urlcheckr', 'URLitor', 'urlresolver', 'Urlstat', 'URLTester', 'UrlTrends Ranking Updater', 'URLy Warning', 'URLy\.Warning', 'URL\/Emacs', 'Vacuum', 'Vagabondo', 'VB Project', 'vBSEO', 'VCI', 'via ggpht\.com GoogleImageProxy', 'Virusdie', 'visionutils', 'Visual Rights Group', 'vkShare', 'VoidEYE', 'Voil', 'voltron', 'voyager\/', 'VSAgent\/', 'VSB-TUO\/', 'Vulnbusters Meter', 'VYU2', 'w3af\.org', 'W3C-checklink', 'W3C-mobileOK', 'W3C_Unicorn', 'WAC-OFU', 'WakeletLinkExpander', 'WallpapersHD', 'Wallpapers\/[0-9]+', 'wangling', 'Wappalyzer', 'WatchMouse', 'WbSrch\/', 'WDT\.io', 'Web Auto', 'Web Collage', 'Web Enhancer', 'Web Fetch', 'Web Fuck', 'Web Pix', 'Web Sauger', 'Web spyder', 'Web Sucker', 'web-capture\.net', 'Web-sniffer', 'Webalta', 'Webauskunft', 'WebAuto', 'WebCapture', 'WebClient\/', 'webcollage', 'WebCookies', 'WebCopier', 'WebCorp', 'WebDataStats', 'WebDoc', 'WebEnhancer', 'WebFetch', 'WebFuck', 'WebGazer', 'WebGo IS', 'WebImageCollector', 'WebImages', 'WebIndex', 'webkit2png', 'WebLeacher', 'webmastercoffee', 'webmon ', 'WebPix', 'WebReaper', 'WebSauger', 'webscreenie', 'Webshag', 'Webshot', 'Website Quester', 'websitepulse agent', 'WebsiteQuester', 'Websnapr', 'WebSniffer', 'Webster', 'WebStripper', 'WebSucker', 'webtech\/', 'WebThumbnail', 'Webthumb\/', 'WebWhacker', 'WebZIP', 'WeLikeLinks', 'WEPA', 'WeSEE', 'wf84', 'Wfuzz\/', 'wget', 'WhatCMS', 'WhatsApp', 'WhatsMyIP', 'WhatWeb', 'WhereGoes\?', 'Whibse', 'WhoAPI\/', 'WhoRunsCoinHive', 'Whynder Magnet', 'Windows-RSS-Platform', 'WinHttp-Autoproxy-Service', 'WinHTTP\/', 'WinPodder', 'wkhtmlto', 'wmtips', 'Woko', 'Wolfram HTTPClient', 'woorankreview', 'WordPress\/', 'WordupinfoSearch', 'Word\/', 'worldping-api', 'wotbox', 'WP Engine Install Performance API', 'WP Rocket', 'wpif', 'wprecon\.com survey', 'WPScan', 'wscheck', 'Wtrace', 'WWW-Collector-E', 'WWW-Mechanize', 'WWW::Document', 'WWW::Mechanize', 'WWWOFFLE', 'www\.monitor\.us', 'x09Mozilla', 'x22Mozilla', 'XaxisSemanticsClassifier', 'XenForo\/', 'Xenu Link Sleuth', 'XING-contenttabreceiver', 'xpymep([0-9]?)\.exe', 'Y!J-[A-Z][A-Z][A-Z]', 'Yaanb', 'yacy', 'Yahoo Link Preview', 'YahooCacheSystem', 'YahooMailProxy', 'YahooYSMcm', 'YandeG', 'Yandex(?!Search)', 'yanga', 'yeti', 'Yo-yo', 'Yoleo Consumer', 'yomins\.com', 'yoogliFetchAgent', 'YottaaMonitor', 'Your-Website-Sucks', 'yourls\.org', 'YoYs\.net', 'YP\.PL', 'Zabbix', 'Zade', 'Zao', 'Zauba', 'Zemanta Aggregator', 'Zend\\\\Http\\\\Client', 'Zend_Http_Client', 'Zermelo', 'Zeus ', 'zgrab', 'ZnajdzFoto', 'ZnHTTP', 'Zombie\.js', 'Zoom\.Mac', 'ZoteroTranslationServer', 'ZyBorg', '[a-z0-9\-_]*(bot|crawl|archiver|transcoder|spider|uptime|validator|fetcher|cron|checker|reader|extractor|monitoring|analyzer|scraper)', ); } crawler-detect/src/Fixtures/Headers.php 0000644 00000002207 15025017654 0014143 0 ustar 00 <?php /* * This file is part of Crawler Detect - the web crawler detection library. * * (c) Mark Beech <m@rkbee.ch> * * This source file is subject to the MIT license that is bundled * with this source code in the file LICENSE. */ namespace Jaybizzle\CrawlerDetect\Fixtures; class Headers extends AbstractProvider { /** * All possible HTTP headers that represent the user agent string. * * @var array */ protected $data = array( // The default User-Agent string. 'HTTP_USER_AGENT', // Header can occur on devices using Opera Mini. 'HTTP_X_OPERAMINI_PHONE_UA', // Vodafone specific header: http://www.seoprinciple.com/mobile-web-community-still-angry-at-vodafone/24/ 'HTTP_X_DEVICE_USER_AGENT', 'HTTP_X_ORIGINAL_USER_AGENT', 'HTTP_X_SKYFIRE_PHONE', 'HTTP_X_BOLT_PHONE_UA', 'HTTP_DEVICE_STOCK_UA', 'HTTP_X_UCBROWSER_DEVICE_UA', // Sometimes, bots (especially Google) use a genuine user agent, but fill this header in with their email address 'HTTP_FROM', 'HTTP_X_SCANNER', // Seen in use by Netsparker ); } crawler-detect/src/Fixtures/AbstractProvider.php 0000644 00000001042 15025017654 0016042 0 ustar 00 <?php /* * This file is part of Crawler Detect - the web crawler detection library. * * (c) Mark Beech <m@rkbee.ch> * * This source file is subject to the MIT license that is bundled * with this source code in the file LICENSE. */ namespace Jaybizzle\CrawlerDetect\Fixtures; abstract class AbstractProvider { /** * The data set. * * @var array */ protected $data; /** * Return the data set. * * @return array */ public function getAll() { return $this->data; } } crawler-detect/src/Fixtures/Exclusions.php 0000644 00000003321 15025017654 0014722 0 ustar 00 <?php /* * This file is part of Crawler Detect - the web crawler detection library. * * (c) Mark Beech <m@rkbee.ch> * * This source file is subject to the MIT license that is bundled * with this source code in the file LICENSE. */ namespace Jaybizzle\CrawlerDetect\Fixtures; class Exclusions extends AbstractProvider { /** * List of strings to remove from the user agent before running the crawler regex * Over a large list of user agents, this gives us about a 55% speed increase! * * @var array */ protected $data = array( 'Safari.[\d\.]*', 'Firefox.[\d\.]*', ' Chrome.[\d\.]*', 'Chromium.[\d\.]*', 'MSIE.[\d\.]', 'Opera\/[\d\.]*', 'Mozilla.[\d\.]*', 'AppleWebKit.[\d\.]*', 'Trident.[\d\.]*', 'Windows NT.[\d\.]*', 'Android [\d\.]*', 'Macintosh.', 'Ubuntu', 'Linux', '[ ]Intel', 'Mac OS X [\d_]*', '(like )?Gecko(.[\d\.]*)?', 'KHTML,', 'CriOS.[\d\.]*', 'CPU iPhone OS ([0-9_])* like Mac OS X', 'CPU OS ([0-9_])* like Mac OS X', 'iPod', 'compatible', 'x86_..', 'i686', 'x64', 'X11', 'rv:[\d\.]*', 'Version.[\d\.]*', 'WOW64', 'Win64', 'Dalvik.[\d\.]*', ' \.NET CLR [\d\.]*', 'Presto.[\d\.]*', 'Media Center PC', 'BlackBerry', 'Build', 'Opera Mini\/\d{1,2}\.\d{1,2}\.[\d\.]*\/\d{1,2}\.', 'Opera', ' \.NET[\d\.]*', 'cubot', '; M bot', '; CRONO', '; B bot', '; IDbot', '; ID bot', '; POWER BOT', 'OCTOPUS-CORE', ); } crawler-detect/raw/Exclusions.txt 0000644 00000001177 15025017654 0013152 0 ustar 00 Safari.[\d\.]* Firefox.[\d\.]* Chrome.[\d\.]* Chromium.[\d\.]* MSIE.[\d\.] Opera\/[\d\.]* Mozilla.[\d\.]* AppleWebKit.[\d\.]* Trident.[\d\.]* Windows NT.[\d\.]* Android [\d\.]* Macintosh. Ubuntu Linux [ ]Intel Mac OS X [\d_]* (like )?Gecko(.[\d\.]*)? KHTML, CriOS.[\d\.]* CPU iPhone OS ([0-9_])* like Mac OS X CPU OS ([0-9_])* like Mac OS X iPod compatible x86_.. i686 x64 X11 rv:[\d\.]* Version.[\d\.]* WOW64 Win64 Dalvik.[\d\.]* \.NET CLR [\d\.]* Presto.[\d\.]* Media Center PC BlackBerry Build Opera Mini\/\d{1,2}\.\d{1,2}\.[\d\.]*\/\d{1,2}\. Opera \.NET[\d\.]* cubot ; M bot ; CRONO ; B bot ; IDbot ; ID bot ; POWER BOT OCTOPUS-CORE crawler-detect/raw/Crawlers.txt 0000644 00000041141 15025017654 0012573 0 ustar 00 YLT ^Aether ^Amazon Simple Notification Service Agent$ ^Amazon-Route53-Health-Check-Service ^b0t$ ^bluefish ^Calypso v\/ ^COMODO DCV ^Corax ^DangDang ^DavClnt ^DHSH ^docker\/[0-9] ^Expanse ^FDM ^git\/ ^Goose\/ ^Grabber ^Gradle\/ ^HTTPClient\/ ^HTTPing ^Java\/ ^Jeode\/ ^Jetty\/ ^Mail\/ ^Mget ^Microsoft URL Control ^Mikrotik\/ ^Netlab360 ^NG\/[0-9\.] ^NING\/ ^npm\/ ^Nuclei ^PHP-AYMAPI\/ ^PHP\/ ^pip\/ ^pnpm\/ ^RMA\/ ^Ruby|Ruby\/[0-9] ^Swurl ^TLS tester ^twine\/ ^ureq ^VSE\/[0-9] ^WordPress\.com ^XRL\/[0-9] ^ZmEu 008\/ 13TABS 192\.comAgent 2GDPR\/ 2ip\.ru 404enemy 7Siters 80legs a3logics\.in A6-Indexer Abonti Aboundex aboutthedomain Accoona-AI-Agent acebookexternalhit\/ acoon acrylicapps\.com\/pulp Acunetix AdAuth\/ adbeat AddThis ADmantX AdminLabs adressendeutschland adreview\/ adscanner adstxt-worker Adstxtaggregator adstxt\.com Adyen HttpClient AffiliateLabz\/ affilimate-puppeteer agentslug AHC aihit aiohttp\/ Airmail akka-http\/ akula\/ alertra alexa site audit Alibaba\.Security\.Heimdall Alligator allloadin AllSubmitter alyze\.info amagit Anarchie AndroidDownloadManager Anemone AngleSharp annotate_google Anthill Anturis Agent Ant\.com AnyEvent-HTTP\/ Apache Ant\/ Apache Droid Apache OpenOffice Apache-HttpAsyncClient Apache-HttpClient ApacheBench Apexoo apimon\.de APIs-Google AportWorm\/ AppBeat\/ AppEngine-Google AppleSyndication Aprc\/[0-9] Arachmo arachnode Arachnophilia aria2 Arukereso asafaweb Asana\/ Ask Jeeves AskQuickly ASPSeek Asterias Astute asynchttp Attach attohttpc autocite AutomaticWPTester Autonomy awin\.com AWS Security Scanner axios\/ a\.pr-cy\.ru B-l-i-t-z-B-O-T Backlink-Ceck backlink-check BacklinkHttpStatus BackStreet BackupLand BackWeb Bad-Neighborhood Badass baidu\.com Bandit basicstate BatchFTP Battleztar Bazinga baypup\/ BazQux BBBike BCKLINKS BDFetch BegunAdvertising Bewica-security-scan Bidtellect BigBozz Bigfoot biglotron BingLocalSearch BingPreview binlar biNu image cacher Bitacle Bitrix link preview biz_Directory BKCTwitterUnshortener\/ Black Hole Blackboard Safeassign BlackWidow BlockNote\.Net BlogBridge Bloglines Bloglovin BlogPulseLive BlogSearch Blogtrottr BlowFish boitho\.com-dc Boost\.Beast BPImageWalker Braintree-Webhooks Branch Metrics API Branch-Passthrough Brandprotect BrandVerity Brandwatch Brodie\/ Browsershots BUbiNG Buck\/ Buddy BuiltWith Bullseye BunnySlippers Burf Search Butterfly\/ BuzzSumo CAAM\/[0-9] CakePHP Calculon Canary%20Mail CaretNail catexplorador CC Metadata Scaper Cegbfeieh censys centuryb.o.t9[at]gmail.com Cerberian Drtrs CERT\.at-Statistics-Survey cf-facebook cg-eye changedetection ChangesMeter Charlotte chatterino-api-cache CheckHost checkprivacy CherryPicker ChinaClaw Chirp\/ chkme\.com Chlooe Chromaxa CirrusExplorer CISPA Vulnerability Notification CISPA Web Analyser Citoid CJNetworkQuality Clarsentia clips\.ua\.ac\.be Cloud mapping CloudEndure CloudFlare-AlwaysOnline Cloudflare-Healthchecks Cloudinary cmcm\.com coccoc cognitiveseo ColdFusion colly - CommaFeed Commons-HttpClient commonscan contactbigdatafr contentkingapp Contextual Code Sites Explorer convera CookieReports copyright sheriff CopyRightCheck Copyscape cortex\/ Cosmos4j\.feedback Covario-IDS Craw\/ Crescent Criteo Crowsnest CSHttp CSSCheck Cula\/ curb Curious George curl cuwhois\/ cybo\.com DAP\/NetHTTP DareBoost DatabaseDriverMysqli DataCha0s DatadogSynthetics Datafeedwatch Datanyze DataparkSearch dataprovider DataXu Daum(oa)?[ \/][0-9] dBpoweramp ddline deeris delve\.ai Demon DeuSu developers\.google\.com\/\+\/web\/snippet\/ Devil Digg Digincore DigitalPebble Dirbuster Discourse Forum Onebox Dispatch\/ Disqus\/ DittoSpyder dlvr DMBrowser DNSPod-reporting docoloc Dolphin http client DomainAppender DomainLabz Domains Project\/ Donuts Content Explorer dotMailer content retrieval dotSemantic downforeveryoneorjustme Download Wonder downnotifier DowntimeDetector Drip drupact Drupal \(\+http:\/\/drupal\.org\/\) DTS Agent dubaiindex DuplexWeb-Google DynatraceSynthetic EARTHCOM Easy-Thumb EasyDL Ebingbong ec2linkfinder eCairn-Grabber eCatch ECCP eContext\/ Ecxi EirGrabber ElectricMonk elefent EMail Exractor EMail Wolf EmailWolf Embarcadero Embed PHP Library Embedly endo\/ europarchive\.org evc-batch EventMachine HttpClient Everwall Link Expander Evidon Evrinid ExactSearch ExaleadCloudview Excel\/ exif ExoRank Exploratodo Express WebPictures Extreme Picture Finder EyeNetIE ezooms facebookexternalhit facebookexternalua facebookplatform fairshare Faraday v fasthttp Faveeo Favicon downloader faviconarchive faviconkit FavOrg Feed Wrangler Feedable\/ Feedbin FeedBooster FeedBucket FeedBunch\/ FeedBurner feeder Feedly FeedshowOnline Feedshow\/ Feedspot FeedViewer\/ Feedwind\/ FeedZcollector feeltiptop Fetch API Fetch\/[0-9] Fever\/[0-9] FHscan Fiery%20Feeds Filestack Fimap findlink findthatfile FlashGet FlipboardBrowserProxy FlipboardProxy FlipboardRSS Flock\/ Florienzh\/ fluffy Flunky flynxapp forensiq ForusP FoundSeoTool free thumbnails Freeuploader FreshRSS frontman Funnelback Fuzz Faster U Fool G-i-g-a-b-o-t g00g1e\.net ganarvisitas gdnplus\.com geek-tools Genieo GentleSource GetCode Getintent GetLinkInfo getprismatic GetRight getroot GetURLInfo\/ GetWeb Geziyor Ghost Inspector GigablastOpenSource GIS-LABS github-camo GitHub-Hookshot github\.com Go http package Go [\d\.]* package http Go!Zilla Go-Ahead-Got-It Go-http-client go-mtasts\/ gobuster gobyus Gofeed gofetch Goldfire Server GomezAgent gooblog Goodzer\/ Google AppsViewer Google Desktop Google favicon Google Keyword Suggestion Google Keyword Tool Google Page Speed Insights Google PP Default Google Search Console Google Web Preview Google-Ads-Creatives-Assistant Google-Ads-Overview Google-Adwords Google-Apps-Script Google-Calendar-Importer Google-HotelAdsVerifier Google-HTTP-Java-Client Google-Podcast Google-Publisher-Plugin Google-Read-Aloud Google-SearchByImage Google-Site-Verification Google-SMTP-STS Google-speakr Google-Structured-Data-Testing-Tool Google-Transparency-Report google-xrawler Google-Youtube-Links GoogleDocs GoogleHC\/ GoogleProber GoogleProducer GoogleSites Gookey GoSpotCheck gosquared-thumbnailer Gotit GoZilla grabify GrabNet Grafula Grammarly GrapeFX GreatNews Gregarius GRequests grokkit grouphigh grub-client gSOAP\/ GT::WWW GTmetrix GuzzleHttp gvfs\/ HAA(A)?RTLAND http client Haansoft hackney\/ Hadi Agent HappyApps-WebCheck Hardenize Hatena Havij HaxerMen HeadlessChrome HEADMasterSEO HeartRails_Capture help@dataminr\.com heritrix Hexometer historious hkedcity hledejLevne\.cz Hloader HMView Holmes HonesoSearchEngine HootSuite Image proxy Hootsuite-WebFeed hosterstats HostTracker ht:\/\/check htdig HTMLparser htmlyse HTTP Banner Detection http-get HTTP-Header-Abfrage http-kit http-request\/ HTTP-Tiny HTTP::Lite http:\/\/www.neomo.de\/ HttpComponents httphr HTTPie HTTPMon httpRequest httpscheck httpssites_power httpunit HttpUrlConnection http\.rb\/ HTTP_Compression_Test http_get http_request2 http_requester httrack huaweisymantec HubSpot HubSpot-Link-Resolver Humanlinks i2kconnect\/ Iblog ichiro Id-search IdeelaborPlagiaat IDG Twitter Links Resolver IDwhois\/ Iframely igdeSpyder iGooglePortal IlTrovatore Image Fetch Image Sucker ImageEngine\/ ImageVisu\/ Imagga imagineeasy imgsizer InAGist inbound\.li parser InDesign%20CC Indy Library InetURL infegy infohelfer InfoTekies InfoWizards Reciprocal Link inpwrd\.com instabid Instapaper Integrity integromedb Intelliseek InterGET Internet Ninja InternetSeer internetVista monitor internetwache internet_archive intraVnews IODC IOI iplabel ips-agent IPS\/[0-9] IPWorks HTTP\/S Component iqdb\/ Iria Irokez isitup\.org iskanie isUp\.li iThemes Sync\/ IZaBEE iZSearch JAHHO janforman Jaunt\/ Java.*outbrain javelin\.io Jbrofuzz Jersey\/ JetCar Jigsaw Jobboerse JobFeed discovery Jobg8 URL Monitor jobo Jobrapido Jobsearch1\.5 JoinVision Generic JolokiaPwn Joomla Jorgee JS-Kit JungleKeyThumbnail JustView Kaspersky Lab CFR link resolver Kelny\/ Kerrigan\/ KeyCDN Keyword Density Keywords Research khttp\/ KickFire KimonoLabs\/ Kml-Google knows\.is KOCMOHABT kouio kube-probe kubectl kulturarw3 KumKie Larbin Lavf\/ leakix\.net LeechFTP LeechGet letsencrypt Lftp LibVLC LibWeb Libwhisker libwww Licorne Liferea\/ Lighthouse Lightspeedsystems Likse limber\.io Link Valet LinkAlarm\/ LinkAnalyser linkCheck linkdex LinkExaminer linkfluence linkpeek LinkPreview LinkScan LinksManager LinkTiger LinkWalker link_thumbnailer Lipperhey Litemage_walker livedoor ScreenShot LoadImpactRload localsearch-web LongURL API longurl-r-package looid\.com looksystems\.net ltx71 lua-resty-http Lucee \(CFML Engine\) Lush Http Client lwp-request lwp-trivial LWP::Simple lycos LYT\.SR L\.webis mabontland MacOutlook\/ Mag-Net MagpieRSS Mail::STS MailChimp Mail\.Ru Majestic12 makecontact\/ Mandrill MapperCmd marketinggrader MarkMonitor MarkWatch Mass Downloader masscan\/ Mata Hari mattermost Mediametric Mediapartners-Google mediawords MegaIndex\.ru MeltwaterNews Melvil Rawi MemGator Metaspinner MetaURI MFC_Tear_Sample Microsearch Microsoft Data Access Microsoft Office Microsoft Outlook Microsoft Windows Network Diagnostics Microsoft-WebDAV-MiniRedir Microsoft\.Data\.Mashup MIDown tool MIIxpc Mindjet Miniature\.io Miniflux mio_httpc Miro-HttpClient Mister PiX mixdata dot com mixed-content-scan mixnode Mnogosearch mogimogi Mojeek Mojolicious \(Perl\) Mollie monitis Monitority\/ Monit\/ montastic MonTools Moreover Morfeus Fucking Scanner Morning Paper MovableType mowser Mrcgiguy Mr\.4x3 Powered MS Web Services Client Protocol MSFrontPage mShots MuckRack\/ muhstik-scan MVAClient MxToolbox\/ myseosnapshot nagios Najdi\.si Name Intelligence NameFo\.com Nameprotect nationalarchives Navroad NearSite Needle Nessus Net Vampire NetAnts NETCRAFT NetLyzer NetMechanic NetNewsWire Netpursual netresearch NetShelter ContentScan Netsparker NetSystemsResearch nettle NetTrack Netvibes NetZIP Neustar WPM NeutrinoAPI NewRelicPinger NewsBlur .*Finder NewsGator newsme newspaper\/ Nexgate Ruby Client NG-Search nghttp2 Nibbler NICErsPRO NihilScio Nikto nineconnections NLNZ_IAHarvester Nmap Scripting Engine node-fetch node-superagent node-urllib Nodemeter NodePing node\.io nominet\.org\.uk nominet\.uk Norton-Safeweb Notifixious notifyninja NotionEmbedder nuhk nutch Nuzzel nWormFeedFinder nyawc\/ Nymesis NYU Observatory\/ Ocelli\/ Octopus oegp Offline Explorer Offline Navigator OgScrper okhttp omgili OMSC Online Domain Tools Open Source RSS OpenCalaisSemanticProxy Openfind OpenLinkProfiler Openstat\/ OpenVAS OPPO A33 Optimizer Orbiter OrgProbe\/ orion-semantics Outlook-Express Outlook-iOS Owler Owlin ownCloud News ow\.ly OxfordCloudService page scorer Page Valet page2rss PageFreezer PageGrabber PagePeeker PageScorer Pagespeed\/ PageThing page_verifier Panopta panscient Papa Foto parsijoo Pavuk PayPal IPN pcBrowser Pcore-HTTP PDF24 URL To PDF Pearltrees PECL::HTTP peerindex Peew PeoplePal Perlu - PhantomJS Screenshoter PhantomJS\/ Photon\/ php-requests phpservermon Pi-Monster Picscout Picsearch PictureFinder Pimonster Pingability PingAdmin\.Ru Pingdom Pingoscope PingSpot ping\.blo\.gs pinterest\.com Pixray Pizilla Plagger\/ Pleroma Ploetz \+ Zeller Plukkie plumanalytics PocketImageCache PocketParser Pockey PodcastAddict\/ POE-Component-Client-HTTP Polymail\/ Pompos Porkbun Port Monitor postano postfix-mta-sts-resolver PostmanRuntime postplanner\.com PostPost postrank PowerPoint\/ Prebid Prerender Priceonomics Analysis Engine PrintFriendly PritTorrent Prlog probethenet Project ?25499 Project-Resonance prospectb2b Protopage ProWebWalker proximic PRTG Network Monitor pshtt, https scanning PTST PTST\/[0-9]+ Pump Python-httplib2 python-httpx python-requests Python-urllib Qirina Hurdler QQDownload QrafterPro Qseero Qualidator QueryN Metasearch queuedriver quic-go-HTTP\/ QuiteRSS Quora Link Preview Qwantify Radian6 RadioPublicImageResizer Railgun\/ RankActive RankFlex RankSonicSiteAuditor RapidLoad\/ Re-re Studio ReactorNetty Readability RealDownload RealPlayer%20Downloader RebelMouse Recorder RecurPost\/ redback\/ ReederForMac Reeder\/ ReGet RepoMonkey request\.js reqwest\/ ResponseCodeTest RestSharp Riddler Rival IQ Robosourcer Robozilla ROI Hunter RPT-HTTPClient RSSMix\/ RSSOwl RyowlEngine safe-agent-scanner SalesIntelligent Saleslift SAP NetWeaver Application Server SauceNAO SBIder sc-downloader scalaj-http Scamadviser-Frontend ScanAlert scan\.lol Scoop scooter ScopeContentAG-HTTP-Client ScoutJet ScoutURLMonitor ScrapeBox Page Scanner Scrapy Screaming ScreenShotService Scrubby Scrutiny\/ Search37 searchenginepromotionhelp Searchestate SearchExpress SearchSight SearchWP search\.thunderstone Seeker semanticdiscovery semanticjuice Semiocast HTTP client Semrush Sendsay\.Ru sentry\/ SEO Browser Seo Servis seo-nastroj\.cz seo4ajax Seobility SEOCentro SeoCheck seocompany SEOkicks SEOlizer Seomoz SEOprofiler seoscanners SEOsearch seositecheckup SEOstats servernfo sexsearcher Seznam Shelob Shodan Shoppimon ShopWiki ShortLinkTranslate shortURL lengthener shrinktheweb Sideqik Siege SimplePie SimplyFast Siphon SISTRIX Site Sucker Site-Shot\/ Site24x7 SiteBar Sitebeam Sitebulb\/ SiteCondor SiteExplorer SiteGuardian Siteimprove SiteIndexed Sitemap(s)? Generator SitemapGenerator SiteMonitor Siteshooter B0t SiteSnagger SiteSucker SiteTruth Sitevigil sitexy\.com SkypeUriPreview Slack\/ sli-systems\.com slider\.com slurp SlySearch SmartDownload SMRF URL Expander SMUrlExpander Snake Snappy SnapSearch Snarfer\/ SniffRSS sniptracker Snoopy SnowHaze Search sogou web SortSite Sottopop sovereign\.ai SpaceBison SpamExperts Spammen Spanner spaziodati SPDYCheck Specificfeeds speedy SPEng Spinn3r spray-can Sprinklr spyonweb sqlmap Sqlworm Sqworm SSL Labs ssl-tools StackRambler Statastico\/ Statically- StatusCake Steeler Stratagems Kumo Stripe\/ Stroke\.cz StudioFACA StumbleUpon suchen Sucuri summify SuperHTTP Surphace Scout Suzuran swcd Symfony BrowserKit Symfony2 BrowserKit Synapse\/ Syndirella\/ SynHttpClient-Built Sysomos sysscan Szukacz T0PHackTeam tAkeOut Tarantula\/ Taringa UGC TarmotGezgin tchelebi\.io techiaith\.cymru Teleport Telesoft Telesphoreo Telesphorep Tenon\.io teoma terrainformatica Test Certificate Info testuri Tetrahedron TextRazor Downloader The Drop Reaper The Expert HTML Source Viewer The Intraformant The Knowledge AI theinternetrules TheNomad Thinklab Thumbor Thumbshots ThumbSniper timewe\.net TinEye Tiny Tiny RSS TLSProbe\/ Toata topster touche\.com Traackr\.com tracemyfile Trackuity TrapitAgent Trendiction Trendsmap trendspottr truwoGPS TryJsoup TulipChain Turingos Turnitin tweetedtimes Tweetminster Tweezler\/ twibble Twice Twikle Twingly Twisted PageGetter Typhoeus ubermetrics-technologies uclassify UdmSearch ultimate_sitemap_parser unchaos unirest-java UniversalFeedParser unshortenit Unshorten\.It Untiny UnwindFetchor updated updown\.io daemon Upflow Uptimia URL Verifier Urlcheckr URLitor urlresolver Urlstat URLTester UrlTrends Ranking Updater URLy Warning URLy\.Warning URL\/Emacs Vacuum Vagabondo VB Project vBSEO VCI via ggpht\.com GoogleImageProxy Virusdie visionutils Visual Rights Group vkShare VoidEYE Voil voltron voyager\/ VSAgent\/ VSB-TUO\/ Vulnbusters Meter VYU2 w3af\.org W3C-checklink W3C-mobileOK W3C_Unicorn WAC-OFU WakeletLinkExpander WallpapersHD Wallpapers\/[0-9]+ wangling Wappalyzer WatchMouse WbSrch\/ WDT\.io Web Auto Web Collage Web Enhancer Web Fetch Web Fuck Web Pix Web Sauger Web spyder Web Sucker web-capture\.net Web-sniffer Webalta Webauskunft WebAuto WebCapture WebClient\/ webcollage WebCookies WebCopier WebCorp WebDataStats WebDoc WebEnhancer WebFetch WebFuck WebGazer WebGo IS WebImageCollector WebImages WebIndex webkit2png WebLeacher webmastercoffee webmon WebPix WebReaper WebSauger webscreenie Webshag Webshot Website Quester websitepulse agent WebsiteQuester Websnapr WebSniffer Webster WebStripper WebSucker webtech\/ WebThumbnail Webthumb\/ WebWhacker WebZIP WeLikeLinks WEPA WeSEE wf84 Wfuzz\/ wget WhatCMS WhatsApp WhatsMyIP WhatWeb WhereGoes\? Whibse WhoAPI\/ WhoRunsCoinHive Whynder Magnet Windows-RSS-Platform WinHttp-Autoproxy-Service WinHTTP\/ WinPodder wkhtmlto wmtips Woko Wolfram HTTPClient woorankreview WordPress\/ WordupinfoSearch Word\/ worldping-api wotbox WP Engine Install Performance API WP Rocket wpif wprecon\.com survey WPScan wscheck Wtrace WWW-Collector-E WWW-Mechanize WWW::Document WWW::Mechanize WWWOFFLE www\.monitor\.us x09Mozilla x22Mozilla XaxisSemanticsClassifier XenForo\/ Xenu Link Sleuth XING-contenttabreceiver xpymep([0-9]?)\.exe Y!J-[A-Z][A-Z][A-Z] Yaanb yacy Yahoo Link Preview YahooCacheSystem YahooMailProxy YahooYSMcm YandeG Yandex(?!Search) yanga yeti Yo-yo Yoleo Consumer yomins\.com yoogliFetchAgent YottaaMonitor Your-Website-Sucks yourls\.org YoYs\.net YP\.PL Zabbix Zade Zao Zauba Zemanta Aggregator Zend\\Http\\Client Zend_Http_Client Zermelo Zeus zgrab ZnajdzFoto ZnHTTP Zombie\.js Zoom\.Mac ZoteroTranslationServer ZyBorg [a-z0-9\-_]*(bot|crawl|archiver|transcoder|spider|uptime|validator|fetcher|cron|checker|reader|extractor|monitoring|analyzer|scraper) crawler-detect/raw/Crawlers.json 0000644 00000047410 15025017654 0012732 0 ustar 00 [" YLT","^Aether","^Amazon Simple Notification Service Agent$","^Amazon-Route53-Health-Check-Service","^b0t$","^bluefish ","^Calypso v\\\/","^COMODO DCV","^Corax","^DangDang","^DavClnt","^DHSH","^docker\\\/[0-9]","^Expanse","^FDM ","^git\\\/","^Goose\\\/","^Grabber","^Gradle\\\/","^HTTPClient\\\/","^HTTPing","^Java\\\/","^Jeode\\\/","^Jetty\\\/","^Mail\\\/","^Mget","^Microsoft URL Control","^Mikrotik\\\/","^Netlab360","^NG\\\/[0-9\\.]","^NING\\\/","^npm\\\/","^Nuclei","^PHP-AYMAPI\\\/","^PHP\\\/","^pip\\\/","^pnpm\\\/","^RMA\\\/","^Ruby|Ruby\\\/[0-9]","^Swurl ","^TLS tester ","^twine\\\/","^ureq","^VSE\\\/[0-9]","^WordPress\\.com","^XRL\\\/[0-9]","^ZmEu","008\\\/","13TABS","192\\.comAgent","2GDPR\\\/","2ip\\.ru","404enemy","7Siters","80legs","a3logics\\.in","A6-Indexer","Abonti","Aboundex","aboutthedomain","Accoona-AI-Agent","acebookexternalhit\\\/","acoon","acrylicapps\\.com\\\/pulp","Acunetix","AdAuth\\\/","adbeat","AddThis","ADmantX","AdminLabs","adressendeutschland","adreview\\\/","adscanner","adstxt-worker","Adstxtaggregator","adstxt\\.com","Adyen HttpClient","AffiliateLabz\\\/","affilimate-puppeteer","agentslug","AHC","aihit","aiohttp\\\/","Airmail","akka-http\\\/","akula\\\/","alertra","alexa site audit","Alibaba\\.Security\\.Heimdall","Alligator","allloadin","AllSubmitter","alyze\\.info","amagit","Anarchie","AndroidDownloadManager","Anemone","AngleSharp","annotate_google","Anthill","Anturis Agent","Ant\\.com","AnyEvent-HTTP\\\/","Apache Ant\\\/","Apache Droid","Apache OpenOffice","Apache-HttpAsyncClient","Apache-HttpClient","ApacheBench","Apexoo","apimon\\.de","APIs-Google","AportWorm\\\/","AppBeat\\\/","AppEngine-Google","AppleSyndication","Aprc\\\/[0-9]","Arachmo","arachnode","Arachnophilia","aria2","Arukereso","asafaweb","Asana\\\/","Ask Jeeves","AskQuickly","ASPSeek","Asterias","Astute","asynchttp","Attach","attohttpc","autocite","AutomaticWPTester","Autonomy","awin\\.com","AWS Security Scanner","axios\\\/","a\\.pr-cy\\.ru","B-l-i-t-z-B-O-T","Backlink-Ceck","backlink-check","BacklinkHttpStatus","BackStreet","BackupLand","BackWeb","Bad-Neighborhood","Badass","baidu\\.com","Bandit","basicstate","BatchFTP","Battleztar Bazinga","baypup\\\/","BazQux","BBBike","BCKLINKS","BDFetch","BegunAdvertising","Bewica-security-scan","Bidtellect","BigBozz","Bigfoot","biglotron","BingLocalSearch","BingPreview","binlar","biNu image cacher","Bitacle","Bitrix link preview","biz_Directory","BKCTwitterUnshortener\\\/","Black Hole","Blackboard Safeassign","BlackWidow","BlockNote\\.Net","BlogBridge","Bloglines","Bloglovin","BlogPulseLive","BlogSearch","Blogtrottr","BlowFish","boitho\\.com-dc","Boost\\.Beast","BPImageWalker","Braintree-Webhooks","Branch Metrics API","Branch-Passthrough","Brandprotect","BrandVerity","Brandwatch","Brodie\\\/","Browsershots","BUbiNG","Buck\\\/","Buddy","BuiltWith","Bullseye","BunnySlippers","Burf Search","Butterfly\\\/","BuzzSumo","CAAM\\\/[0-9]","CakePHP","Calculon","Canary%20Mail","CaretNail","catexplorador","CC Metadata Scaper","Cegbfeieh","censys","centuryb.o.t9[at]gmail.com","Cerberian Drtrs","CERT\\.at-Statistics-Survey","cf-facebook","cg-eye","changedetection","ChangesMeter","Charlotte","chatterino-api-cache","CheckHost","checkprivacy","CherryPicker","ChinaClaw","Chirp\\\/","chkme\\.com","Chlooe","Chromaxa","CirrusExplorer","CISPA Vulnerability Notification","CISPA Web Analyser","Citoid","CJNetworkQuality","Clarsentia","clips\\.ua\\.ac\\.be","Cloud mapping","CloudEndure","CloudFlare-AlwaysOnline","Cloudflare-Healthchecks","Cloudinary","cmcm\\.com","coccoc","cognitiveseo","ColdFusion","colly -","CommaFeed","Commons-HttpClient","commonscan","contactbigdatafr","contentkingapp","Contextual Code Sites Explorer","convera","CookieReports","copyright sheriff","CopyRightCheck","Copyscape","cortex\\\/","Cosmos4j\\.feedback","Covario-IDS","Craw\\\/","Crescent","Criteo","Crowsnest","CSHttp","CSSCheck","Cula\\\/","curb","Curious George","curl","cuwhois\\\/","cybo\\.com","DAP\\\/NetHTTP","DareBoost","DatabaseDriverMysqli","DataCha0s","DatadogSynthetics","Datafeedwatch","Datanyze","DataparkSearch","dataprovider","DataXu","Daum(oa)?[ \\\/][0-9]","dBpoweramp","ddline","deeris","delve\\.ai","Demon","DeuSu","developers\\.google\\.com\\\/\\+\\\/web\\\/snippet\\\/","Devil","Digg","Digincore","DigitalPebble","Dirbuster","Discourse Forum Onebox","Dispatch\\\/","Disqus\\\/","DittoSpyder","dlvr","DMBrowser","DNSPod-reporting","docoloc","Dolphin http client","DomainAppender","DomainLabz","Domains Project\\\/","Donuts Content Explorer","dotMailer content retrieval","dotSemantic","downforeveryoneorjustme","Download Wonder","downnotifier","DowntimeDetector","Drip","drupact","Drupal \\(\\+http:\\\/\\\/drupal\\.org\\\/\\)","DTS Agent","dubaiindex","DuplexWeb-Google","DynatraceSynthetic","EARTHCOM","Easy-Thumb","EasyDL","Ebingbong","ec2linkfinder","eCairn-Grabber","eCatch","ECCP","eContext\\\/","Ecxi","EirGrabber","ElectricMonk","elefent","EMail Exractor","EMail Wolf","EmailWolf","Embarcadero","Embed PHP Library","Embedly","endo\\\/","europarchive\\.org","evc-batch","EventMachine HttpClient","Everwall Link Expander","Evidon","Evrinid","ExactSearch","ExaleadCloudview","Excel\\\/","exif","ExoRank","Exploratodo","Express WebPictures","Extreme Picture Finder","EyeNetIE","ezooms","facebookexternalhit","facebookexternalua","facebookplatform","fairshare","Faraday v","fasthttp","Faveeo","Favicon downloader","faviconarchive","faviconkit","FavOrg","Feed Wrangler","Feedable\\\/","Feedbin","FeedBooster","FeedBucket","FeedBunch\\\/","FeedBurner","feeder","Feedly","FeedshowOnline","Feedshow\\\/","Feedspot","FeedViewer\\\/","Feedwind\\\/","FeedZcollector","feeltiptop","Fetch API","Fetch\\\/[0-9]","Fever\\\/[0-9]","FHscan","Fiery%20Feeds","Filestack","Fimap","findlink","findthatfile","FlashGet","FlipboardBrowserProxy","FlipboardProxy","FlipboardRSS","Flock\\\/","Florienzh\\\/","fluffy","Flunky","flynxapp","forensiq","ForusP","FoundSeoTool","free thumbnails","Freeuploader","FreshRSS","frontman","Funnelback","Fuzz Faster U Fool","G-i-g-a-b-o-t","g00g1e\\.net","ganarvisitas","gdnplus\\.com","geek-tools","Genieo","GentleSource","GetCode","Getintent","GetLinkInfo","getprismatic","GetRight","getroot","GetURLInfo\\\/","GetWeb","Geziyor","Ghost Inspector","GigablastOpenSource","GIS-LABS","github-camo","GitHub-Hookshot","github\\.com","Go http package","Go [\\d\\.]* package http","Go!Zilla","Go-Ahead-Got-It","Go-http-client","go-mtasts\\\/","gobuster","gobyus","Gofeed","gofetch","Goldfire Server","GomezAgent","gooblog","Goodzer\\\/","Google AppsViewer","Google Desktop","Google favicon","Google Keyword Suggestion","Google Keyword Tool","Google Page Speed Insights","Google PP Default","Google Search Console","Google Web Preview","Google-Ads-Creatives-Assistant","Google-Ads-Overview","Google-Adwords","Google-Apps-Script","Google-Calendar-Importer","Google-HotelAdsVerifier","Google-HTTP-Java-Client","Google-Podcast","Google-Publisher-Plugin","Google-Read-Aloud","Google-SearchByImage","Google-Site-Verification","Google-SMTP-STS","Google-speakr","Google-Structured-Data-Testing-Tool","Google-Transparency-Report","google-xrawler","Google-Youtube-Links","GoogleDocs","GoogleHC\\\/","GoogleProber","GoogleProducer","GoogleSites","Gookey","GoSpotCheck","gosquared-thumbnailer","Gotit","GoZilla","grabify","GrabNet","Grafula","Grammarly","GrapeFX","GreatNews","Gregarius","GRequests","grokkit","grouphigh","grub-client","gSOAP\\\/","GT::WWW","GTmetrix","GuzzleHttp","gvfs\\\/","HAA(A)?RTLAND http client","Haansoft","hackney\\\/","Hadi Agent","HappyApps-WebCheck","Hardenize","Hatena","Havij","HaxerMen","HeadlessChrome","HEADMasterSEO","HeartRails_Capture","help@dataminr\\.com","heritrix","Hexometer","historious","hkedcity","hledejLevne\\.cz","Hloader","HMView","Holmes","HonesoSearchEngine","HootSuite Image proxy","Hootsuite-WebFeed","hosterstats","HostTracker","ht:\\\/\\\/check","htdig","HTMLparser","htmlyse","HTTP Banner Detection","http-get","HTTP-Header-Abfrage","http-kit","http-request\\\/","HTTP-Tiny","HTTP::Lite","http:\\\/\\\/www.neomo.de\\\/","HttpComponents","httphr","HTTPie","HTTPMon","httpRequest","httpscheck","httpssites_power","httpunit","HttpUrlConnection","http\\.rb\\\/","HTTP_Compression_Test","http_get","http_request2","http_requester","httrack","huaweisymantec","HubSpot ","HubSpot-Link-Resolver","Humanlinks","i2kconnect\\\/","Iblog","ichiro","Id-search","IdeelaborPlagiaat","IDG Twitter Links Resolver","IDwhois\\\/","Iframely","igdeSpyder","iGooglePortal","IlTrovatore","Image Fetch","Image Sucker","ImageEngine\\\/","ImageVisu\\\/","Imagga","imagineeasy","imgsizer","InAGist","inbound\\.li parser","InDesign%20CC","Indy Library","InetURL","infegy","infohelfer","InfoTekies","InfoWizards Reciprocal Link","inpwrd\\.com","instabid","Instapaper","Integrity","integromedb","Intelliseek","InterGET","Internet Ninja","InternetSeer","internetVista monitor","internetwache","internet_archive","intraVnews","IODC","IOI","iplabel","ips-agent","IPS\\\/[0-9]","IPWorks HTTP\\\/S Component","iqdb\\\/","Iria","Irokez","isitup\\.org","iskanie","isUp\\.li","iThemes Sync\\\/","IZaBEE","iZSearch","JAHHO","janforman","Jaunt\\\/","Java.*outbrain","javelin\\.io","Jbrofuzz","Jersey\\\/","JetCar","Jigsaw","Jobboerse","JobFeed discovery","Jobg8 URL Monitor","jobo","Jobrapido","Jobsearch1\\.5","JoinVision Generic","JolokiaPwn","Joomla","Jorgee","JS-Kit","JungleKeyThumbnail","JustView","Kaspersky Lab CFR link resolver","Kelny\\\/","Kerrigan\\\/","KeyCDN","Keyword Density","Keywords Research","khttp\\\/","KickFire","KimonoLabs\\\/","Kml-Google","knows\\.is","KOCMOHABT","kouio","kube-probe","kubectl","kulturarw3","KumKie","Larbin","Lavf\\\/","leakix\\.net","LeechFTP","LeechGet","letsencrypt","Lftp","LibVLC","LibWeb","Libwhisker","libwww","Licorne","Liferea\\\/","Lighthouse","Lightspeedsystems","Likse","limber\\.io","Link Valet","LinkAlarm\\\/","LinkAnalyser","linkCheck","linkdex","LinkExaminer","linkfluence","linkpeek","LinkPreview","LinkScan","LinksManager","LinkTiger","LinkWalker","link_thumbnailer","Lipperhey","Litemage_walker","livedoor ScreenShot","LoadImpactRload","localsearch-web","LongURL API","longurl-r-package","looid\\.com","looksystems\\.net","ltx71","lua-resty-http","Lucee \\(CFML Engine\\)","Lush Http Client","lwp-request","lwp-trivial","LWP::Simple","lycos","LYT\\.SR","L\\.webis","mabontland","MacOutlook\\\/","Mag-Net","MagpieRSS","Mail::STS","MailChimp","Mail\\.Ru","Majestic12","makecontact\\\/","Mandrill","MapperCmd","marketinggrader","MarkMonitor","MarkWatch","Mass Downloader","masscan\\\/","Mata Hari","mattermost","Mediametric","Mediapartners-Google","mediawords","MegaIndex\\.ru","MeltwaterNews","Melvil Rawi","MemGator","Metaspinner","MetaURI","MFC_Tear_Sample","Microsearch","Microsoft Data Access","Microsoft Office","Microsoft Outlook","Microsoft Windows Network Diagnostics","Microsoft-WebDAV-MiniRedir","Microsoft\\.Data\\.Mashup","MIDown tool","MIIxpc","Mindjet","Miniature\\.io","Miniflux","mio_httpc","Miro-HttpClient","Mister PiX","mixdata dot com","mixed-content-scan","mixnode","Mnogosearch","mogimogi","Mojeek","Mojolicious \\(Perl\\)","Mollie","monitis","Monitority\\\/","Monit\\\/","montastic","MonTools","Moreover","Morfeus Fucking Scanner","Morning Paper","MovableType","mowser","Mrcgiguy","Mr\\.4x3 Powered","MS Web Services Client Protocol","MSFrontPage","mShots","MuckRack\\\/","muhstik-scan","MVAClient","MxToolbox\\\/","myseosnapshot","nagios","Najdi\\.si","Name Intelligence","NameFo\\.com","Nameprotect","nationalarchives","Navroad","NearSite","Needle","Nessus","Net Vampire","NetAnts","NETCRAFT","NetLyzer","NetMechanic","NetNewsWire","Netpursual","netresearch","NetShelter ContentScan","Netsparker","NetSystemsResearch","nettle","NetTrack","Netvibes","NetZIP","Neustar WPM","NeutrinoAPI","NewRelicPinger","NewsBlur .*Finder","NewsGator","newsme","newspaper\\\/","Nexgate Ruby Client","NG-Search","nghttp2","Nibbler","NICErsPRO","NihilScio","Nikto","nineconnections","NLNZ_IAHarvester","Nmap Scripting Engine","node-fetch","node-superagent","node-urllib","Nodemeter","NodePing","node\\.io","nominet\\.org\\.uk","nominet\\.uk","Norton-Safeweb","Notifixious","notifyninja","NotionEmbedder","nuhk","nutch","Nuzzel","nWormFeedFinder","nyawc\\\/","Nymesis","NYU","Observatory\\\/","Ocelli\\\/","Octopus","oegp","Offline Explorer","Offline Navigator","OgScrper","okhttp","omgili","OMSC","Online Domain Tools","Open Source RSS","OpenCalaisSemanticProxy","Openfind","OpenLinkProfiler","Openstat\\\/","OpenVAS","OPPO A33","Optimizer","Orbiter","OrgProbe\\\/","orion-semantics","Outlook-Express","Outlook-iOS","Owler","Owlin","ownCloud News","ow\\.ly","OxfordCloudService","page scorer","Page Valet","page2rss","PageFreezer","PageGrabber","PagePeeker","PageScorer","Pagespeed\\\/","PageThing","page_verifier","Panopta","panscient","Papa Foto","parsijoo","Pavuk","PayPal IPN","pcBrowser","Pcore-HTTP","PDF24 URL To PDF","Pearltrees","PECL::HTTP","peerindex","Peew","PeoplePal","Perlu -","PhantomJS Screenshoter","PhantomJS\\\/","Photon\\\/","php-requests","phpservermon","Pi-Monster","Picscout","Picsearch","PictureFinder","Pimonster","Pingability","PingAdmin\\.Ru","Pingdom","Pingoscope","PingSpot","ping\\.blo\\.gs","pinterest\\.com","Pixray","Pizilla","Plagger\\\/","Pleroma ","Ploetz \\+ Zeller","Plukkie","plumanalytics","PocketImageCache","PocketParser","Pockey","PodcastAddict\\\/","POE-Component-Client-HTTP","Polymail\\\/","Pompos","Porkbun","Port Monitor","postano","postfix-mta-sts-resolver","PostmanRuntime","postplanner\\.com","PostPost","postrank","PowerPoint\\\/","Prebid","Prerender","Priceonomics Analysis Engine","PrintFriendly","PritTorrent","Prlog","probethenet","Project ?25499","Project-Resonance","prospectb2b","Protopage","ProWebWalker","proximic","PRTG Network Monitor","pshtt, https scanning","PTST ","PTST\\\/[0-9]+","Pump","Python-httplib2","python-httpx","python-requests","Python-urllib","Qirina Hurdler","QQDownload","QrafterPro","Qseero","Qualidator","QueryN Metasearch","queuedriver","quic-go-HTTP\\\/","QuiteRSS","Quora Link Preview","Qwantify","Radian6","RadioPublicImageResizer","Railgun\\\/","RankActive","RankFlex","RankSonicSiteAuditor","RapidLoad\\\/","Re-re Studio","ReactorNetty","Readability","RealDownload","RealPlayer%20Downloader","RebelMouse","Recorder","RecurPost\\\/","redback\\\/","ReederForMac","Reeder\\\/","ReGet","RepoMonkey","request\\.js","reqwest\\\/","ResponseCodeTest","RestSharp","Riddler","Rival IQ","Robosourcer","Robozilla","ROI Hunter","RPT-HTTPClient","RSSMix\\\/","RSSOwl","RyowlEngine","safe-agent-scanner","SalesIntelligent","Saleslift","SAP NetWeaver Application Server","SauceNAO","SBIder","sc-downloader","scalaj-http","Scamadviser-Frontend","ScanAlert","scan\\.lol","Scoop","scooter","ScopeContentAG-HTTP-Client","ScoutJet","ScoutURLMonitor","ScrapeBox Page Scanner","Scrapy","Screaming","ScreenShotService","Scrubby","Scrutiny\\\/","Search37","searchenginepromotionhelp","Searchestate","SearchExpress","SearchSight","SearchWP","search\\.thunderstone","Seeker","semanticdiscovery","semanticjuice","Semiocast HTTP client","Semrush","Sendsay\\.Ru","sentry\\\/","SEO Browser","Seo Servis","seo-nastroj\\.cz","seo4ajax","Seobility","SEOCentro","SeoCheck","seocompany","SEOkicks","SEOlizer","Seomoz","SEOprofiler","seoscanners","SEOsearch","seositecheckup","SEOstats","servernfo","sexsearcher","Seznam","Shelob","Shodan","Shoppimon","ShopWiki","ShortLinkTranslate","shortURL lengthener","shrinktheweb","Sideqik","Siege","SimplePie","SimplyFast","Siphon","SISTRIX","Site Sucker","Site-Shot\\\/","Site24x7","SiteBar","Sitebeam","Sitebulb\\\/","SiteCondor","SiteExplorer","SiteGuardian","Siteimprove","SiteIndexed","Sitemap(s)? Generator","SitemapGenerator","SiteMonitor","Siteshooter B0t","SiteSnagger","SiteSucker","SiteTruth","Sitevigil","sitexy\\.com","SkypeUriPreview","Slack\\\/","sli-systems\\.com","slider\\.com","slurp","SlySearch","SmartDownload","SMRF URL Expander","SMUrlExpander","Snake","Snappy","SnapSearch","Snarfer\\\/","SniffRSS","sniptracker","Snoopy","SnowHaze Search","sogou web","SortSite","Sottopop","sovereign\\.ai","SpaceBison","SpamExperts","Spammen","Spanner","spaziodati","SPDYCheck","Specificfeeds","speedy","SPEng","Spinn3r","spray-can","Sprinklr ","spyonweb","sqlmap","Sqlworm","Sqworm","SSL Labs","ssl-tools","StackRambler","Statastico\\\/","Statically-","StatusCake","Steeler","Stratagems Kumo","Stripe\\\/","Stroke\\.cz","StudioFACA","StumbleUpon","suchen","Sucuri","summify","SuperHTTP","Surphace Scout","Suzuran","swcd ","Symfony BrowserKit","Symfony2 BrowserKit","Synapse\\\/","Syndirella\\\/","SynHttpClient-Built","Sysomos","sysscan","Szukacz","T0PHackTeam","tAkeOut","Tarantula\\\/","Taringa UGC","TarmotGezgin","tchelebi\\.io","techiaith\\.cymru","Teleport","Telesoft","Telesphoreo","Telesphorep","Tenon\\.io","teoma","terrainformatica","Test Certificate Info","testuri","Tetrahedron","TextRazor Downloader","The Drop Reaper","The Expert HTML Source Viewer","The Intraformant","The Knowledge AI","theinternetrules","TheNomad","Thinklab","Thumbor","Thumbshots","ThumbSniper","timewe\\.net","TinEye","Tiny Tiny RSS","TLSProbe\\\/","Toata","topster","touche\\.com","Traackr\\.com","tracemyfile","Trackuity","TrapitAgent","Trendiction","Trendsmap","trendspottr","truwoGPS","TryJsoup","TulipChain","Turingos","Turnitin","tweetedtimes","Tweetminster","Tweezler\\\/","twibble","Twice","Twikle","Twingly","Twisted PageGetter","Typhoeus","ubermetrics-technologies","uclassify","UdmSearch","ultimate_sitemap_parser","unchaos","unirest-java","UniversalFeedParser","unshortenit","Unshorten\\.It","Untiny","UnwindFetchor","updated","updown\\.io daemon","Upflow","Uptimia","URL Verifier","Urlcheckr","URLitor","urlresolver","Urlstat","URLTester","UrlTrends Ranking Updater","URLy Warning","URLy\\.Warning","URL\\\/Emacs","Vacuum","Vagabondo","VB Project","vBSEO","VCI","via ggpht\\.com GoogleImageProxy","Virusdie","visionutils","Visual Rights Group","vkShare","VoidEYE","Voil","voltron","voyager\\\/","VSAgent\\\/","VSB-TUO\\\/","Vulnbusters Meter","VYU2","w3af\\.org","W3C-checklink","W3C-mobileOK","W3C_Unicorn","WAC-OFU","WakeletLinkExpander","WallpapersHD","Wallpapers\\\/[0-9]+","wangling","Wappalyzer","WatchMouse","WbSrch\\\/","WDT\\.io","Web Auto","Web Collage","Web Enhancer","Web Fetch","Web Fuck","Web Pix","Web Sauger","Web spyder","Web Sucker","web-capture\\.net","Web-sniffer","Webalta","Webauskunft","WebAuto","WebCapture","WebClient\\\/","webcollage","WebCookies","WebCopier","WebCorp","WebDataStats","WebDoc","WebEnhancer","WebFetch","WebFuck","WebGazer","WebGo IS","WebImageCollector","WebImages","WebIndex","webkit2png","WebLeacher","webmastercoffee","webmon ","WebPix","WebReaper","WebSauger","webscreenie","Webshag","Webshot","Website Quester","websitepulse agent","WebsiteQuester","Websnapr","WebSniffer","Webster","WebStripper","WebSucker","webtech\\\/","WebThumbnail","Webthumb\\\/","WebWhacker","WebZIP","WeLikeLinks","WEPA","WeSEE","wf84","Wfuzz\\\/","wget","WhatCMS","WhatsApp","WhatsMyIP","WhatWeb","WhereGoes\\?","Whibse","WhoAPI\\\/","WhoRunsCoinHive","Whynder Magnet","Windows-RSS-Platform","WinHttp-Autoproxy-Service","WinHTTP\\\/","WinPodder","wkhtmlto","wmtips","Woko","Wolfram HTTPClient","woorankreview","WordPress\\\/","WordupinfoSearch","Word\\\/","worldping-api","wotbox","WP Engine Install Performance API","WP Rocket","wpif","wprecon\\.com survey","WPScan","wscheck","Wtrace","WWW-Collector-E","WWW-Mechanize","WWW::Document","WWW::Mechanize","WWWOFFLE","www\\.monitor\\.us","x09Mozilla","x22Mozilla","XaxisSemanticsClassifier","XenForo\\\/","Xenu Link Sleuth","XING-contenttabreceiver","xpymep([0-9]?)\\.exe","Y!J-[A-Z][A-Z][A-Z]","Yaanb","yacy","Yahoo Link Preview","YahooCacheSystem","YahooMailProxy","YahooYSMcm","YandeG","Yandex(?!Search)","yanga","yeti","Yo-yo","Yoleo Consumer","yomins\\.com","yoogliFetchAgent","YottaaMonitor","Your-Website-Sucks","yourls\\.org","YoYs\\.net","YP\\.PL","Zabbix","Zade","Zao","Zauba","Zemanta Aggregator","Zend\\\\Http\\\\Client","Zend_Http_Client","Zermelo","Zeus ","zgrab","ZnajdzFoto","ZnHTTP","Zombie\\.js","Zoom\\.Mac","ZoteroTranslationServer","ZyBorg","[a-z0-9\\-_]*(bot|crawl|archiver|transcoder|spider|uptime|validator|fetcher|cron|checker|reader|extractor|monitoring|analyzer|scraper)"] crawler-detect/raw/Headers.txt 0000644 00000000320 15025017654 0012356 0 ustar 00 HTTP_USER_AGENT HTTP_X_OPERAMINI_PHONE_UA HTTP_X_DEVICE_USER_AGENT HTTP_X_ORIGINAL_USER_AGENT HTTP_X_SKYFIRE_PHONE HTTP_X_BOLT_PHONE_UA HTTP_DEVICE_STOCK_UA HTTP_X_UCBROWSER_DEVICE_UA HTTP_FROM HTTP_X_SCANNER crawler-detect/raw/Headers.json 0000644 00000000346 15025017654 0012520 0 ustar 00 ["HTTP_USER_AGENT","HTTP_X_OPERAMINI_PHONE_UA","HTTP_X_DEVICE_USER_AGENT","HTTP_X_ORIGINAL_USER_AGENT","HTTP_X_SKYFIRE_PHONE","HTTP_X_BOLT_PHONE_UA","HTTP_DEVICE_STOCK_UA","HTTP_X_UCBROWSER_DEVICE_UA","HTTP_FROM","HTTP_X_SCANNER"] crawler-detect/raw/Exclusions.json 0000644 00000001430 15025017654 0013274 0 ustar 00 ["Safari.[\\d\\.]*","Firefox.[\\d\\.]*"," Chrome.[\\d\\.]*","Chromium.[\\d\\.]*","MSIE.[\\d\\.]","Opera\\\/[\\d\\.]*","Mozilla.[\\d\\.]*","AppleWebKit.[\\d\\.]*","Trident.[\\d\\.]*","Windows NT.[\\d\\.]*","Android [\\d\\.]*","Macintosh.","Ubuntu","Linux","[ ]Intel","Mac OS X [\\d_]*","(like )?Gecko(.[\\d\\.]*)?","KHTML,","CriOS.[\\d\\.]*","CPU iPhone OS ([0-9_])* like Mac OS X","CPU OS ([0-9_])* like Mac OS X","iPod","compatible","x86_..","i686","x64","X11","rv:[\\d\\.]*","Version.[\\d\\.]*","WOW64","Win64","Dalvik.[\\d\\.]*"," \\.NET CLR [\\d\\.]*","Presto.[\\d\\.]*","Media Center PC","BlackBerry","Build","Opera Mini\\\/\\d{1,2}\\.\\d{1,2}\\.[\\d\\.]*\\\/\\d{1,2}\\.","Opera"," \\.NET[\\d\\.]*","cubot","; M bot","; CRONO","; B bot","; IDbot","; ID bot","; POWER BOT","OCTOPUS-CORE"] crawler-detect/.php_cs.dist 0000644 00000002054 15025017654 0011676 0 ustar 00 <?php $finder = Symfony\Component\Finder\Finder::create() ->in([ __DIR__.'/src', __DIR__.'/tests', ]) ->name('*.php') ->ignoreDotFiles(true) ->ignoreVCS(true); return PhpCsFixer\Config::create() ->setRules([ '@PSR2' => true, 'array_syntax' => ['syntax' => 'long'], 'ordered_imports' => ['sortAlgorithm' => 'alpha'], 'no_unused_imports' => true, 'not_operator_with_successor_space' => true, 'trailing_comma_in_multiline_array' => true, 'phpdoc_scalar' => true, 'unary_operator_spaces' => true, 'binary_operator_spaces' => true, 'blank_line_before_statement' => [ 'statements' => ['break', 'continue', 'declare', 'return', 'throw', 'try'], ], 'phpdoc_single_line_var_spacing' => true, 'phpdoc_var_without_name' => true, 'method_argument_space' => [ 'on_multiline' => 'ensure_fully_multiline', 'keep_multiple_spaces_after_comma' => true, ], ]) ->setFinder($finder); crawler-detect/README.md 0000644 00000007565 15025017654 0010752 0 ustar 00 <p align="center"><a href="https://crawlerdetect.io/" target="_blank"><img src="https://cloud.githubusercontent.com/assets/340752/23082173/1bd1a396-f550-11e6-8aba-4d3c75edea2f.png" width="321" height="219" /></a><br><br> <a href="https://crawlerdetect.io/" target="_blank">crawlerdetect.io</a> <br><br> </p> <p align="center"> <a href="https://github.com/JayBizzle/Crawler-Detect/actions"><img alt="GitHub Workflow Status" src="https://img.shields.io/github/actions/workflow/status/JayBizzle/Crawler-Detect/test.yml?branch=master&style=flat-square"></a> <a href="https://packagist.org/packages/jaybizzle/crawler-detect"><img src="https://img.shields.io/packagist/dm/JayBizzle/Crawler-Detect.svg?style=flat-square" /></a> <a href="https://github.com/JayBizzle/Crawler-Detect"><img src="https://img.shields.io/badge/license-MIT-ff69b4.svg?style=flat-square" /></a> <a href="https://packagist.org/packages/jaybizzle/crawler-detect"><img src="https://img.shields.io/packagist/v/jaybizzle/Crawler-Detect.svg?style=flat-square" /></a> <a href="https://coveralls.io/github/JayBizzle/Crawler-Detect"><img src="https://img.shields.io/coveralls/JayBizzle/Crawler-Detect/master.svg?style=flat-square" /></a> </p> ## About CrawlerDetect CrawlerDetect is a PHP class for detecting bots/crawlers/spiders via the `user agent` and `http_from` header. Currently able to detect 1,000's of bots/spiders/crawlers. ### Installation ``` composer require jaybizzle/crawler-detect ``` ### Usage ```PHP use Jaybizzle\CrawlerDetect\CrawlerDetect; $CrawlerDetect = new CrawlerDetect; // Check the user agent of the current 'visitor' if($CrawlerDetect->isCrawler()) { // true if crawler user agent detected } // Pass a user agent as a string if($CrawlerDetect->isCrawler('Mozilla/5.0 (compatible; Sosospider/2.0; +http://help.soso.com/webspider.htm)')) { // true if crawler user agent detected } // Output the name of the bot that matched (if any) echo $CrawlerDetect->getMatches(); ``` ### Contributing If you find a bot/spider/crawler user agent that CrawlerDetect fails to detect, please submit a pull request with the regex pattern added to the `$data` array in `Fixtures/Crawlers.php` and add the failing user agent to `tests/crawlers.txt`. Failing that, just create an issue with the user agent you have found, and we'll take it from there :) ### Laravel Package If you would like to use this with Laravel, please see [Laravel-Crawler-Detect](https://github.com/JayBizzle/Laravel-Crawler-Detect) ### Symfony Bundle To use this library with Symfony 2/3/4, check out the [CrawlerDetectBundle](https://github.com/nicolasmure/CrawlerDetectBundle). ### YII2 Extension To use this library with the YII2 framework, check out [yii2-crawler-detect](https://github.com/AlikDex/yii2-crawler-detect). ### ES6 Library To use this library with NodeJS or any ES6 application based, check out [es6-crawler-detect](https://github.com/JefferyHus/es6-crawler-detect). ### Python Library To use this library in a Python project, check out [crawlerdetect](https://github.com/moskrc/CrawlerDetect). ### JVM Library (written in Java) To use this library in a JVM project (including Java, Scala, Kotlin, etc.), check out [CrawlerDetect](https://github.com/nekosoftllc/crawler-detect). ### .NET Library To use this library in a .net standard (including .net core) based project, check out [NetCrawlerDetect](https://github.com/gplumb/NetCrawlerDetect). ### Ruby Gem To use this library with Ruby on Rails or any Ruby-based application, check out [crawler_detect](https://github.com/loadkpi/crawler_detect) gem. ### Go Module To use this library with Go, check out the [crawlerdetect](https://github.com/x-way/crawlerdetect) module. _Parts of this class are based on the brilliant [MobileDetect](https://github.com/serbanghita/Mobile-Detect)_ [](https://github.com/JayBizzle/Crawler-Detect) crawler-detect/LICENSE 0000644 00000002073 15025017654 0010465 0 ustar 00 The MIT License (MIT) Copyright (c) 2015-2020 Mark Beech Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions: The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software. THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. crawler-detect/.github/workflows/php-cs-fixer.yml 0000644 00000001156 15025017654 0016106 0 ustar 00 name: Check & fix styling on: [ push ] jobs: php-cs-fixer: runs-on: ubuntu-latest steps: - name: Checkout code uses: actions/checkout@v2 with: ref: ${{ github.head_ref }} - name: Run PHP CS Fixer uses: docker://oskarstark/php-cs-fixer-ga:2.18.6 with: args: --config=.php_cs.dist --allow-risky=yes - name: Commit changes uses: stefanzweifel/git-auto-commit-action@v4 with: commit_message: Fix styling crawler-detect/.github/workflows/test.yml 0000644 00000002737 15025017654 0014566 0 ustar 00 name: Test on: push: branches: - "master" pull_request: jobs: build: runs-on: ubuntu-latest strategy: fail-fast: true matrix: php: [5.3, 5.4, 5.5, 5.6, 7.0, 7.1, 7.2, 7.3, 7.4, 8.0, 8.1, 8.2] name: PHP:${{ matrix.php }} steps: - name: Checkout uses: actions/checkout@v2 - name: Setup PHP, with composer uses: shivammathur/setup-php@v2 with: php-version: ${{ matrix.php }} tools: composer:v2 coverage: xdebug - name: Get composer cache directory id: composer-cache run: echo "::set-output name=dir::$(composer config cache-files-dir)" - name: Cache composer dependencies uses: actions/cache@v2 with: path: ${{ steps.composer-cache.outputs.dir }} key: dependencies-php-${{ matrix.php }}-composer-${{ hashFiles('composer.json') }} restore-keys: dependencies-php-${{ matrix.php }}-composer- - name: Install Composer dependencies run: | composer install --prefer-dist --no-interaction --no-suggest - name: Run Unit tests run: | vendor/bin/phpunit --coverage-clover=tests/logs/clover.xml - name: Upload coverage results to Coveralls env: COVERALLS_REPO_TOKEN: ${{ secrets.GITHUB_TOKEN }} run: | composer global require php-coveralls/php-coveralls "^1.0" coveralls --coverage_clover=tests/logs/clover.xml -v crawler-detect/export.php 0000644 00000001732 15025017654 0011513 0 ustar 00 <?php /* * This file is part of Crawler Detect - the web crawler detection library. * * (c) Mark Beech <m@rkbee.ch> * * This source file is subject to the MIT license that is bundled * with this source code in the file LICENSE. */ require 'src/Fixtures/AbstractProvider.php'; require 'src/Fixtures/Crawlers.php'; require 'src/Fixtures/Exclusions.php'; require 'src/Fixtures/Headers.php'; $src = array( 'Crawlers', 'Exclusions', 'Headers', ); foreach ($src as $class) { $class = "Jaybizzle\\CrawlerDetect\\Fixtures\\$class"; $object = new $class; outputJson($object); outputTxt($object); } function outputJson($object) { $className = (new ReflectionClass($object))->getShortName(); file_put_contents("raw/$className.json", json_encode($object->getAll())); } function outputTxt($object) { $className = (new ReflectionClass($object))->getShortName(); file_put_contents("raw/$className.txt", implode(PHP_EOL, $object->getAll())); }
| ver. 1.4 |
.
| PHP 8.1.32 | Generation time: 0 |
proxy
|
phpinfo
|
Settings