Inspection of "Add Apache-HttpClient/ and Java/" - JayBizzle/Crawler-Detect - Measure and Improve Code Quality continuously with Scrutinizer

Completed

Push — master ( 082cfe...e31477 )

by Mark

created 2016-04-05 13:06 UTC

Status

Spacing +2 added lines, -2 removed lines patch added patch discarded remove patch

@@ -461,7 +461,7 @@  discard block
 block discarded – undo
     public function setHttpHeaders($httpHeaders = null)
     {
         // use global _SERVER if $httpHeaders aren't defined
-        if (!is_array($httpHeaders) || !count($httpHeaders)) {
+        if ( ! is_array($httpHeaders) || ! count($httpHeaders)) {
             $httpHeaders = $_SERVER;
         }
         // clear existing headers
@@ -492,7 +492,7 @@  discard block
 block discarded – undo
                 }
             }
 
-            return $this->userAgent = (!empty($this->userAgent) ? trim($this->userAgent) : null);
+            return $this->userAgent = ( ! empty($this->userAgent) ? trim($this->userAgent) : null);
         }
     }
 

Please login to merge, or discard this patch.

Indentation +491 added lines, -491 removed lines patch added patch discarded remove patch

@@ -4,514 +4,514 @@
 block discarded – undo
 
 class CrawlerDetect
 {
-    /**
-     * The user agent.
-     *
-     * @var null
-     */
-    protected $userAgent = null;
+	/**
+	 * The user agent.
+	 *
+	 * @var null
+	 */
+	protected $userAgent = null;
 
-    /**
-     * Headers that contain a user agent.
-     *
-     * @var array
-     */
-    protected $httpHeaders = array();
+	/**
+	 * Headers that contain a user agent.
+	 *
+	 * @var array
+	 */
+	protected $httpHeaders = array();
 
-    /**
-     * Store regex matches.
-     *
-     * @var array
-     */
-    protected $matches = array();
+	/**
+	 * Store regex matches.
+	 *
+	 * @var array
+	 */
+	protected $matches = array();
 
-    /**
-     * List of strings to remove from the user agent before running the crawler regex
-     * Over a large list of user agents, this gives us about a 55% speed increase!
-     *
-     * @var array
-     */
-    protected static $ignore = array(
-        'Safari.[\d\.]*',
-        'Firefox.[\d\.]*',
-        'Chrome.[\d\.]*',
-        'Chromium.[\d\.]*',
-        'MSIE.[\d\.]',
-        'Opera\/[\d\.]*',
-        'Mozilla.[\d\.]*',
-        'AppleWebKit.[\d\.]*',
-        'Trident.[\d\.]*',
-        'Windows NT.[\d\.]*',
-        'Android.[\d\.]*',
-        'Macintosh.',
-        'Ubuntu',
-        'Linux',
-        '[ ]Intel',
-        'Mac OS X [\d_]*',
-        '(like )?Gecko(.[\d\.]*)?',
-        'KHTML',
-        'CriOS.[\d\.]*',
-        'CPU iPhone OS ([0-9_])* like Mac OS X',
-        'CPU OS ([0-9_])* like Mac OS X',
-        'iPod',
-        'compatible',
-        'x86_..',
-        'i686',
-        'x64',
-        'X11',
-        'rv:[\d\.]*',
-        'Version.[\d\.]*',
-        'WOW64',
-        'Win64',
-        'Dalvik.[\d\.]*',
-        ' \.NET CLR [\d\.]*',
-        'Presto.[\d\.]*',
-        'Media Center PC',
-        'BlackBerry',
-        'Build',
-        'Opera Mini\/\d{1,2}\.\d{1,2}\.[\d\.]*\/\d{1,2}\.',
-        'Opera',
-        ' \.NET[\d\.]*',
-        '\(|\)|;|,', // Remove the following characters ( ) : ,
-    );
+	/**
+	 * List of strings to remove from the user agent before running the crawler regex
+	 * Over a large list of user agents, this gives us about a 55% speed increase!
+	 *
+	 * @var array
+	 */
+	protected static $ignore = array(
+		'Safari.[\d\.]*',
+		'Firefox.[\d\.]*',
+		'Chrome.[\d\.]*',
+		'Chromium.[\d\.]*',
+		'MSIE.[\d\.]',
+		'Opera\/[\d\.]*',
+		'Mozilla.[\d\.]*',
+		'AppleWebKit.[\d\.]*',
+		'Trident.[\d\.]*',
+		'Windows NT.[\d\.]*',
+		'Android.[\d\.]*',
+		'Macintosh.',
+		'Ubuntu',
+		'Linux',
+		'[ ]Intel',
+		'Mac OS X [\d_]*',
+		'(like )?Gecko(.[\d\.]*)?',
+		'KHTML',
+		'CriOS.[\d\.]*',
+		'CPU iPhone OS ([0-9_])* like Mac OS X',
+		'CPU OS ([0-9_])* like Mac OS X',
+		'iPod',
+		'compatible',
+		'x86_..',
+		'i686',
+		'x64',
+		'X11',
+		'rv:[\d\.]*',
+		'Version.[\d\.]*',
+		'WOW64',
+		'Win64',
+		'Dalvik.[\d\.]*',
+		' \.NET CLR [\d\.]*',
+		'Presto.[\d\.]*',
+		'Media Center PC',
+		'BlackBerry',
+		'Build',
+		'Opera Mini\/\d{1,2}\.\d{1,2}\.[\d\.]*\/\d{1,2}\.',
+		'Opera',
+		' \.NET[\d\.]*',
+		'\(|\)|;|,', // Remove the following characters ( ) : ,
+	);
 
-    /**
-     * Array of regular expressions to match against the user agent.
-     *
-     * @var array
-     */
-    protected static $crawlers = array(
-        '.*Java.*outbrain',
-        '008\\/',
-        '^NING\\/',
-        'A6-Indexer',
-        'Aboundex',
-        'Accoona-AI-Agent',
-        'acoon',
-        'AddThis',
-        'ADmantX',
-        'AHC',
-        'Airmail',
-        'Anemone',
-        'Apache-HttpClient\/',
-        'Arachmo',
-        'archive-com',
-        'B-l-i-t-z-B-O-T',
-        'Backlink-Ceck\.de',
-        'BazQux',
-        'bibnum\.bnf',
-        'biglotron',
-        'BingPreview',
-        'binlar',
-        'Bloglovin',
-        'Blogtrottr',
-        'boitho\.com-dc',
-        'Browsershots',
-        'BUbiNG',
-        'Butterfly\\/',
-        'BuzzSumo',
-        'CapsuleChecker',
-        'CC Metadata Scaper',
-        'Cerberian Drtrs',
-        'changedetection',
-        'Charlotte',
-        'clips\.ua\.ac\.be',
-        'CloudFlare-AlwaysOnline',
-        'coccoc',
-        'CommaFeed',
-        'Commons-HttpClient',
-        'convera',
-        'cosmos',
-        'Covario-IDS',
-        'Curious George',
-        'curl',
-        'CyberPatrol',
-        'DataparkSearch',
-        'dataprovider',
-        'Daum(oa)?[ \\/][0-9]',
-        'Digg',
-        'DomainAppender',
-        'Dragonfly File Reader',
-        'drupact',
-        'EARTHCOM',
-        'ec2linkfinder',
-        'ECCP',
-        'ElectricMonk',
-        'EMail Exractor',
-        'EmailWolf',
-        'Embed PHP Library',
-        'Embedly',
-        'europarchive\.org',
-        'EventMachine HttpClient',
-        'ExactSearch',
-        'ExaleadCloudview',
-        'eZ Publish Link Validator',
-        'ezooms',
-        'facebookexternalhit',
-        'facebookplatform',
-        'Feed Wrangler',
-        'Feedbin',
-        'FeedBurner',
-        'Feedfetcher-Google',
-        'Feedly',
-        'Feedspot',
-        'FeedValidator',
-        'Fever',
-        'findlink',
-        'findthatfile',
-        'Flamingo_SearchEngine',
-        'fluffy',
-        'g00g1e\.net',
-        'Genieo',
-        'getprismatic\.com',
-        'GigablastOpenSource',
-        'Go-http-client',
-        'Google favicon',
-        'Google Keyword Suggestion',
-        'Google Page Speed Insights',
-        'Google-HTTP-Java-Client',
-        'google_partner_monitoring',
-        'GoogleProducer',
-        'grub-client',
-        'heritrix',
-        'Holmes',
-        'htdig',
-        'HTTPMon',
-        'httpunit',
-        'http_request2',
-        'httrack',
-        'HubPages.*crawlingpolicy',
-        'HubSpot Marketing Grader',
-        'ichiro',
-        'IDG Twitter Links Resolver',
-        'igdeSpyder',
-        'InAGist',
-        'infegy',
-        'InfoWizards Reciprocal Link System PRO',
-        'inpwrd\.com',
-        'integromedb',
-        'IODC',
-        'IOI',
-        'ips-agent',
-        'iZSearch',
-        '^Java\/',
-        'Jigsaw',
-        'Jobrapido',
-        'kouio',
-        'L\.webis',
-        'Larbin',
-        'libwww',
-        'Link Valet',
-        'linkCheck',
-        'linkdex',
-        'LinkExaminer',
-        'LinkWalker',
-        'Lipperhey',
-        'LongURL API',
-        'ltx71',
-        'lwp-trivial',
-        'lycos',
-        'mabontland',
-        'MagpieRSS',
-        'Mediapartners-Google',
-        'Mediapartners-Google',
-        'MegaIndex\.ru',
-        'MetaURI',
-        'Mnogosearch',
-        'mogimogi',
-        'Morning Paper',
-        'Mrcgiguy',
-        'MVAClient',
-        'Netcraft Web Server Survey',
-        'NetcraftSurveyAgent',
-        'NetLyzer FastProbe',
-        'netresearch',
-        'Netvibes',
-        'NewsBlur .*(Fetcher|Finder)',
-        'NewsGator',
-        'newsme',
-        'NG-Search',
-        'nineconnections\.com',
-        'nominet\.org\.uk',
-        'Notifixious',
-        'nuhk',
-        'nutch',
-        'Nymesis',
-        'oegp',
-        'Omea Reader',
-        'online link validator',
-        'Online Website Link Checker',
-        'Orbiter',
-        'ow\.ly',
-        'page2rss',
-        'PagePeeker',
-        'panscient',
-        'Peew',
-        'phpcrawl',
-        'phpservermon',
-        'Pingdom\.com',
-        'Pinterest',
-        'Pizilla',
-        'Ploetz \+ Zeller',
-        'Plukkie',
-        'PocketParser',
-        'Pompos',
-        'postano',
-        'PostPost',
-        'postrank',
-        'proximic',
-        'Pulsepoint XT3 web scraper',
-        'Python-httplib2',
-        'python-requests',
-        'Python-urllib',
-        'Qseero',
-        'Qwantify',
-        'Radian6',
-        'RebelMouse',
-        'REL Link Checker',
-        'RetrevoPageAnalyzer',
-        'Riddler',
-        'Robosourcer',
-        'ROI Hunter',
-        'Ruby',
-        'SalesIntelligent',
-        'SBIder',
-        'scooter',
-        'ScoutJet',
-        'ScoutURLMonitor',
-        'Scrapy',
-        'Scrubby',
-        'SearchSight',
-        'semanticdiscovery',
-        'SEOstats',
-        'Server Density Service Monitoring.*',
-        'servernfo\.com',
-        'Seznam screenshot-generator',
-        'ShopWiki',
-        'SilverReader',
-        'SimplePie',
-        'Site24x7',
-        'SiteBar',
-        'siteexplorer\.info',
-        'Siteimprove\.com',
-        'SkypeUriPreview',
-        'slider\.com',
-        'slurp',
-        'Snappy',
-        'SNK Siteshooter B0t',
-        'sogou',
-        'SortSite',
-        'speedy',
-        'Spinn3r',
-        'Springshare Link Checker',
-        'Sqworm',
-        'StackRambler',
-        'Stratagems Kumo',
-        'summify',
-        'teoma',
-        'theoldreader\.com',
-        'TinEye',
-        'Tiny Tiny RSS',
-        'Traackr.com',
-        'truwoGPS',
-        'tweetedtimes\.com',
-        'Twikle',
-        'Typhoeus',
-        'ubermetrics-technologies',
-        'UdmSearch',
-        'UnwindFetchor',
-        'updated',
-        'URLChecker',
-        'urlresolver',
-        'Vagabondo',
-        'Validator\.nu\\/LV',
-        'via ggpht\.com GoogleImageProxy',
-        'Vivante Link Checker',
-        'Vortex',
-        'voyager\\/',
-        'VYU2',
-        'W3C-checklink',
-        'W3C-mobileOK',
-        'W3C_CSS_Validator_JFouffa',
-        'W3C_I18n-Checker',
-        'W3C_Unicorn',
-        'W3C_Validator',
-        'web-capture\.net',
-        'webcollage',
-        'WebIndex',
-        'webmon ',
-        'websitepulse[+ ]checker',
-        'Websquash\.com',
-        'WebThumbnail',
-        'WeSEE:Search',
-        'wf84',
-        'wget',
-        'WomlpeFactory',
-        'wotbox',
-        'www\.monitor\.us',
-        'XaxisSemanticsClassifier',
-        'Xenu Link Sleuth',
-        'XML Sitemaps Generator',
-        'Y!J-ASR',
-        'yacy',
-        'Yahoo Ad monitoring',
-        'Yahoo Link Preview',
-        'YahooSeeker',
-        'yandex',
-        'yanga',
-        'yeti',
-        'yoogliFetchAgent',
-        'YottaaMonitor',
-        'Zao',
-        'ZyBorg',
-        '[a-z0-9\\-_]*((?<!cu)bot|crawler|archiver|transcoder|spider)',
-    );
+	/**
+	 * Array of regular expressions to match against the user agent.
+	 *
+	 * @var array
+	 */
+	protected static $crawlers = array(
+		'.*Java.*outbrain',
+		'008\\/',
+		'^NING\\/',
+		'A6-Indexer',
+		'Aboundex',
+		'Accoona-AI-Agent',
+		'acoon',
+		'AddThis',
+		'ADmantX',
+		'AHC',
+		'Airmail',
+		'Anemone',
+		'Apache-HttpClient\/',
+		'Arachmo',
+		'archive-com',
+		'B-l-i-t-z-B-O-T',
+		'Backlink-Ceck\.de',
+		'BazQux',
+		'bibnum\.bnf',
+		'biglotron',
+		'BingPreview',
+		'binlar',
+		'Bloglovin',
+		'Blogtrottr',
+		'boitho\.com-dc',
+		'Browsershots',
+		'BUbiNG',
+		'Butterfly\\/',
+		'BuzzSumo',
+		'CapsuleChecker',
+		'CC Metadata Scaper',
+		'Cerberian Drtrs',
+		'changedetection',
+		'Charlotte',
+		'clips\.ua\.ac\.be',
+		'CloudFlare-AlwaysOnline',
+		'coccoc',
+		'CommaFeed',
+		'Commons-HttpClient',
+		'convera',
+		'cosmos',
+		'Covario-IDS',
+		'Curious George',
+		'curl',
+		'CyberPatrol',
+		'DataparkSearch',
+		'dataprovider',
+		'Daum(oa)?[ \\/][0-9]',
+		'Digg',
+		'DomainAppender',
+		'Dragonfly File Reader',
+		'drupact',
+		'EARTHCOM',
+		'ec2linkfinder',
+		'ECCP',
+		'ElectricMonk',
+		'EMail Exractor',
+		'EmailWolf',
+		'Embed PHP Library',
+		'Embedly',
+		'europarchive\.org',
+		'EventMachine HttpClient',
+		'ExactSearch',
+		'ExaleadCloudview',
+		'eZ Publish Link Validator',
+		'ezooms',
+		'facebookexternalhit',
+		'facebookplatform',
+		'Feed Wrangler',
+		'Feedbin',
+		'FeedBurner',
+		'Feedfetcher-Google',
+		'Feedly',
+		'Feedspot',
+		'FeedValidator',
+		'Fever',
+		'findlink',
+		'findthatfile',
+		'Flamingo_SearchEngine',
+		'fluffy',
+		'g00g1e\.net',
+		'Genieo',
+		'getprismatic\.com',
+		'GigablastOpenSource',
+		'Go-http-client',
+		'Google favicon',
+		'Google Keyword Suggestion',
+		'Google Page Speed Insights',
+		'Google-HTTP-Java-Client',
+		'google_partner_monitoring',
+		'GoogleProducer',
+		'grub-client',
+		'heritrix',
+		'Holmes',
+		'htdig',
+		'HTTPMon',
+		'httpunit',
+		'http_request2',
+		'httrack',
+		'HubPages.*crawlingpolicy',
+		'HubSpot Marketing Grader',
+		'ichiro',
+		'IDG Twitter Links Resolver',
+		'igdeSpyder',
+		'InAGist',
+		'infegy',
+		'InfoWizards Reciprocal Link System PRO',
+		'inpwrd\.com',
+		'integromedb',
+		'IODC',
+		'IOI',
+		'ips-agent',
+		'iZSearch',
+		'^Java\/',
+		'Jigsaw',
+		'Jobrapido',
+		'kouio',
+		'L\.webis',
+		'Larbin',
+		'libwww',
+		'Link Valet',
+		'linkCheck',
+		'linkdex',
+		'LinkExaminer',
+		'LinkWalker',
+		'Lipperhey',
+		'LongURL API',
+		'ltx71',
+		'lwp-trivial',
+		'lycos',
+		'mabontland',
+		'MagpieRSS',
+		'Mediapartners-Google',
+		'Mediapartners-Google',
+		'MegaIndex\.ru',
+		'MetaURI',
+		'Mnogosearch',
+		'mogimogi',
+		'Morning Paper',
+		'Mrcgiguy',
+		'MVAClient',
+		'Netcraft Web Server Survey',
+		'NetcraftSurveyAgent',
+		'NetLyzer FastProbe',
+		'netresearch',
+		'Netvibes',
+		'NewsBlur .*(Fetcher|Finder)',
+		'NewsGator',
+		'newsme',
+		'NG-Search',
+		'nineconnections\.com',
+		'nominet\.org\.uk',
+		'Notifixious',
+		'nuhk',
+		'nutch',
+		'Nymesis',
+		'oegp',
+		'Omea Reader',
+		'online link validator',
+		'Online Website Link Checker',
+		'Orbiter',
+		'ow\.ly',
+		'page2rss',
+		'PagePeeker',
+		'panscient',
+		'Peew',
+		'phpcrawl',
+		'phpservermon',
+		'Pingdom\.com',
+		'Pinterest',
+		'Pizilla',
+		'Ploetz \+ Zeller',
+		'Plukkie',
+		'PocketParser',
+		'Pompos',
+		'postano',
+		'PostPost',
+		'postrank',
+		'proximic',
+		'Pulsepoint XT3 web scraper',
+		'Python-httplib2',
+		'python-requests',
+		'Python-urllib',
+		'Qseero',
+		'Qwantify',
+		'Radian6',
+		'RebelMouse',
+		'REL Link Checker',
+		'RetrevoPageAnalyzer',
+		'Riddler',
+		'Robosourcer',
+		'ROI Hunter',
+		'Ruby',
+		'SalesIntelligent',
+		'SBIder',
+		'scooter',
+		'ScoutJet',
+		'ScoutURLMonitor',
+		'Scrapy',
+		'Scrubby',
+		'SearchSight',
+		'semanticdiscovery',
+		'SEOstats',
+		'Server Density Service Monitoring.*',
+		'servernfo\.com',
+		'Seznam screenshot-generator',
+		'ShopWiki',
+		'SilverReader',
+		'SimplePie',
+		'Site24x7',
+		'SiteBar',
+		'siteexplorer\.info',
+		'Siteimprove\.com',
+		'SkypeUriPreview',
+		'slider\.com',
+		'slurp',
+		'Snappy',
+		'SNK Siteshooter B0t',
+		'sogou',
+		'SortSite',
+		'speedy',
+		'Spinn3r',
+		'Springshare Link Checker',
+		'Sqworm',
+		'StackRambler',
+		'Stratagems Kumo',
+		'summify',
+		'teoma',
+		'theoldreader\.com',
+		'TinEye',
+		'Tiny Tiny RSS',
+		'Traackr.com',
+		'truwoGPS',
+		'tweetedtimes\.com',
+		'Twikle',
+		'Typhoeus',
+		'ubermetrics-technologies',
+		'UdmSearch',
+		'UnwindFetchor',
+		'updated',
+		'URLChecker',
+		'urlresolver',
+		'Vagabondo',
+		'Validator\.nu\\/LV',
+		'via ggpht\.com GoogleImageProxy',
+		'Vivante Link Checker',
+		'Vortex',
+		'voyager\\/',
+		'VYU2',
+		'W3C-checklink',
+		'W3C-mobileOK',
+		'W3C_CSS_Validator_JFouffa',
+		'W3C_I18n-Checker',
+		'W3C_Unicorn',
+		'W3C_Validator',
+		'web-capture\.net',
+		'webcollage',
+		'WebIndex',
+		'webmon ',
+		'websitepulse[+ ]checker',
+		'Websquash\.com',
+		'WebThumbnail',
+		'WeSEE:Search',
+		'wf84',
+		'wget',
+		'WomlpeFactory',
+		'wotbox',
+		'www\.monitor\.us',
+		'XaxisSemanticsClassifier',
+		'Xenu Link Sleuth',
+		'XML Sitemaps Generator',
+		'Y!J-ASR',
+		'yacy',
+		'Yahoo Ad monitoring',
+		'Yahoo Link Preview',
+		'YahooSeeker',
+		'yandex',
+		'yanga',
+		'yeti',
+		'yoogliFetchAgent',
+		'YottaaMonitor',
+		'Zao',
+		'ZyBorg',
+		'[a-z0-9\\-_]*((?<!cu)bot|crawler|archiver|transcoder|spider)',
+	);
 
-    /**
-     * All possible HTTP headers that represent the
-     * User-Agent string.
-     *
-     * @var array
-     */
-    protected static $uaHttpHeaders = array(
-        // The default User-Agent string.
-        'HTTP_USER_AGENT',
-        // Header can occur on devices using Opera Mini.
-        'HTTP_X_OPERAMINI_PHONE_UA',
-        // Vodafone specific header: http://www.seoprinciple.com/mobile-web-community-still-angry-at-vodafone/24/
-        'HTTP_X_DEVICE_USER_AGENT',
-        'HTTP_X_ORIGINAL_USER_AGENT',
-        'HTTP_X_SKYFIRE_PHONE',
-        'HTTP_X_BOLT_PHONE_UA',
-        'HTTP_DEVICE_STOCK_UA',
-        'HTTP_X_UCBROWSER_DEVICE_UA',
-    );
+	/**
+	 * All possible HTTP headers that represent the
+	 * User-Agent string.
+	 *
+	 * @var array
+	 */
+	protected static $uaHttpHeaders = array(
+		// The default User-Agent string.
+		'HTTP_USER_AGENT',
+		// Header can occur on devices using Opera Mini.
+		'HTTP_X_OPERAMINI_PHONE_UA',
+		// Vodafone specific header: http://www.seoprinciple.com/mobile-web-community-still-angry-at-vodafone/24/
+		'HTTP_X_DEVICE_USER_AGENT',
+		'HTTP_X_ORIGINAL_USER_AGENT',
+		'HTTP_X_SKYFIRE_PHONE',
+		'HTTP_X_BOLT_PHONE_UA',
+		'HTTP_DEVICE_STOCK_UA',
+		'HTTP_X_UCBROWSER_DEVICE_UA',
+	);
 
-    /**
-     * Class constructor.
-     */
-    public function __construct(array $headers = null, $userAgent = null)
-    {
-        $this->setHttpHeaders($headers);
-        $this->setUserAgent($userAgent);
-    }
+	/**
+	 * Class constructor.
+	 */
+	public function __construct(array $headers = null, $userAgent = null)
+	{
+		$this->setHttpHeaders($headers);
+		$this->setUserAgent($userAgent);
+	}
 
-    /**
-     * Set HTTP headers.
-     *
-     * @param array $httpHeaders
-     */
-    public function setHttpHeaders($httpHeaders = null)
-    {
-        // use global _SERVER if $httpHeaders aren't defined
-        if (!is_array($httpHeaders) || !count($httpHeaders)) {
-            $httpHeaders = $_SERVER;
-        }
-        // clear existing headers
-        $this->httpHeaders = array();
-        // Only save HTTP headers. In PHP land, that means only _SERVER vars that
-        // start with HTTP_.
-        foreach ($httpHeaders as $key => $value) {
-            if (substr($key, 0, 5) === 'HTTP_') {
-                $this->httpHeaders[$key] = $value;
-            }
-        }
-    }
+	/**
+	 * Set HTTP headers.
+	 *
+	 * @param array $httpHeaders
+	 */
+	public function setHttpHeaders($httpHeaders = null)
+	{
+		// use global _SERVER if $httpHeaders aren't defined
+		if (!is_array($httpHeaders) || !count($httpHeaders)) {
+			$httpHeaders = $_SERVER;
+		}
+		// clear existing headers
+		$this->httpHeaders = array();
+		// Only save HTTP headers. In PHP land, that means only _SERVER vars that
+		// start with HTTP_.
+		foreach ($httpHeaders as $key => $value) {
+			if (substr($key, 0, 5) === 'HTTP_') {
+				$this->httpHeaders[$key] = $value;
+			}
+		}
+	}
 
-    /**
-     * Return user agent headers.
-     *
-     * @return array
-     */
-    public function getUaHttpHeaders()
-    {
-        return self::$uaHttpHeaders;
-    }
+	/**
+	 * Return user agent headers.
+	 *
+	 * @return array
+	 */
+	public function getUaHttpHeaders()
+	{
+		return self::$uaHttpHeaders;
+	}
 
-    /**
-     * Set the user agent.
-     *
-     * @param string $userAgent
-     */
-    public function setUserAgent($userAgent = null)
-    {
-        if (false === empty($userAgent)) {
-            return $this->userAgent = $userAgent;
-        } else {
-            $this->userAgent = null;
-            foreach ($this->getUaHttpHeaders() as $altHeader) {
-                if (false === empty($this->httpHeaders[$altHeader])) { // @todo: should use getHttpHeader(), but it would be slow.
-                    $this->userAgent .= $this->httpHeaders[$altHeader].' ';
-                }
-            }
+	/**
+	 * Set the user agent.
+	 *
+	 * @param string $userAgent
+	 */
+	public function setUserAgent($userAgent = null)
+	{
+		if (false === empty($userAgent)) {
+			return $this->userAgent = $userAgent;
+		} else {
+			$this->userAgent = null;
+			foreach ($this->getUaHttpHeaders() as $altHeader) {
+				if (false === empty($this->httpHeaders[$altHeader])) { // @todo: should use getHttpHeader(), but it would be slow.
+					$this->userAgent .= $this->httpHeaders[$altHeader].' ';
+				}
+			}
 
-            return $this->userAgent = (!empty($this->userAgent) ? trim($this->userAgent) : null);
-        }
-    }
+			return $this->userAgent = (!empty($this->userAgent) ? trim($this->userAgent) : null);
+		}
+	}
 
-    /**
-     * Return the array of crawler regexs.
-     *
-     * @return array
-     */
-    public function getCrawlers()
-    {
-        return self::$crawlers;
-    }
+	/**
+	 * Return the array of crawler regexs.
+	 *
+	 * @return array
+	 */
+	public function getCrawlers()
+	{
+		return self::$crawlers;
+	}
 
-    /**
-     * Build the user agent regex.
-     *
-     * @return string
-     */
-    public function getRegex()
-    {
-        return '('.implode('|', self::$crawlers).')';
-    }
+	/**
+	 * Build the user agent regex.
+	 *
+	 * @return string
+	 */
+	public function getRegex()
+	{
+		return '('.implode('|', self::$crawlers).')';
+	}
 
-    /**
-     * Build the replacement regex.
-     *
-     * @return string
-     */
-    public function getIgnored()
-    {
-        return '('.implode('|', self::$ignore).')';
-    }
+	/**
+	 * Build the replacement regex.
+	 *
+	 * @return string
+	 */
+	public function getIgnored()
+	{
+		return '('.implode('|', self::$ignore).')';
+	}
 
-    /**
-     * Check user agent string against the regex.
-     *
-     * @param string $userAgent
-     *
-     * @return bool
-     */
-    public function isCrawler($userAgent = null)
-    {
-        $agent = is_null($userAgent) ? $this->userAgent : $userAgent;
+	/**
+	 * Check user agent string against the regex.
+	 *
+	 * @param string $userAgent
+	 *
+	 * @return bool
+	 */
+	public function isCrawler($userAgent = null)
+	{
+		$agent = is_null($userAgent) ? $this->userAgent : $userAgent;
 
-        $agent = preg_replace('/'.$this->getIgnored().'/i', '', $agent);
+		$agent = preg_replace('/'.$this->getIgnored().'/i', '', $agent);
 
-        if (trim($agent) === false) {
-            return false;
-        } else {
-            $result = preg_match('/'.$this->getRegex().'/i', trim($agent), $matches);
-        }
+		if (trim($agent) === false) {
+			return false;
+		} else {
+			$result = preg_match('/'.$this->getRegex().'/i', trim($agent), $matches);
+		}
 
-        if ($matches) {
-            $this->matches = $matches;
-        }
+		if ($matches) {
+			$this->matches = $matches;
+		}
 
-        return (bool) $result;
-    }
+		return (bool) $result;
+	}
 
-    /**
-     * Return the matches.
-     *
-     * @return string
-     */
-    public function getMatches()
-    {
-        return $this->matches[0];
-    }
+	/**
+	 * Return the matches.
+	 *
+	 * @return string
+	 */
+	public function getMatches()
+	{
+		return $this->matches[0];
+	}
 }

Please login to merge, or discard this patch.

tests/UATests.php 1 patch

Indentation +51 added lines, -51 removed lines patch added patch discarded remove patch

@@ -2,55 +2,55 @@
 block discarded – undo
 
 class UserAgentTest extends PHPUnit_Framework_TestCase
 {
-    protected $CrawlerDetect;
-
-    public function setUp()
-    {
-        $this->CrawlerDetect = new Jaybizzle\CrawlerDetect\CrawlerDetect();
-    }
-
-    public function testBots()
-    {
-        $lines = file(__DIR__.'/crawlers.txt', FILE_IGNORE_NEW_LINES | FILE_SKIP_EMPTY_LINES);
-
-        foreach ($lines as $line) {
-            $test = $this->CrawlerDetect->isCrawler($line);
-            $this->assertEquals($test, true, $line);
-        }
-    }
-
-    public function testDevices()
-    {
-        $lines = file(__DIR__.'/devices.txt', FILE_IGNORE_NEW_LINES | FILE_SKIP_EMPTY_LINES);
-
-        foreach ($lines as $line) {
-            $test = $this->CrawlerDetect->isCrawler($line);
-            $this->assertEquals($test, false, $line);
-        }
-    }
-
-    public function testReturnsCorrectMatchedBotName()
-    {
-        $test = $this->CrawlerDetect->isCrawler('Mozilla/5.0 (iPhone; CPU iPhone OS 7_1 like Mac OS X) AppleWebKit (KHTML, like Gecko) Mobile (compatible; Yahoo Ad monitoring; https://help.yahoo.com/kb/yahoo-ad-monitoring-SLN24857.html)');
-
-        $matches = $this->CrawlerDetect->getMatches();
-
-        $this->assertEquals($this->CrawlerDetect->getMatches(), 'Yahoo Ad monitoring', $matches);
-    }
-
-    public function testForRegexCollision()
-    {
-        $crawlers = $this->CrawlerDetect->getCrawlers();
-
-        foreach ($crawlers as $regex) {
-            foreach ($crawlers as $compare) {
-                // Dont check this regex against itself
-                if ($regex != $compare) {
-                    preg_match('/'.$regex.'/i', stripslashes($compare), $matches);
-
-                    $this->assertEmpty($matches, $regex.' collided with '.$compare);
-                }
-            }
-        }
-    }
+	protected $CrawlerDetect;
+
+	public function setUp()
+	{
+		$this->CrawlerDetect = new Jaybizzle\CrawlerDetect\CrawlerDetect();
+	}
+
+	public function testBots()
+	{
+		$lines = file(__DIR__.'/crawlers.txt', FILE_IGNORE_NEW_LINES | FILE_SKIP_EMPTY_LINES);
+
+		foreach ($lines as $line) {
+			$test = $this->CrawlerDetect->isCrawler($line);
+			$this->assertEquals($test, true, $line);
+		}
+	}
+
+	public function testDevices()
+	{
+		$lines = file(__DIR__.'/devices.txt', FILE_IGNORE_NEW_LINES | FILE_SKIP_EMPTY_LINES);
+
+		foreach ($lines as $line) {
+			$test = $this->CrawlerDetect->isCrawler($line);
+			$this->assertEquals($test, false, $line);
+		}
+	}
+
+	public function testReturnsCorrectMatchedBotName()
+	{
+		$test = $this->CrawlerDetect->isCrawler('Mozilla/5.0 (iPhone; CPU iPhone OS 7_1 like Mac OS X) AppleWebKit (KHTML, like Gecko) Mobile (compatible; Yahoo Ad monitoring; https://help.yahoo.com/kb/yahoo-ad-monitoring-SLN24857.html)');
+
+		$matches = $this->CrawlerDetect->getMatches();
+
+		$this->assertEquals($this->CrawlerDetect->getMatches(), 'Yahoo Ad monitoring', $matches);
+	}
+
+	public function testForRegexCollision()
+	{
+		$crawlers = $this->CrawlerDetect->getCrawlers();
+
+		foreach ($crawlers as $regex) {
+			foreach ($crawlers as $compare) {
+				// Dont check this regex against itself
+				if ($regex != $compare) {
+					preg_match('/'.$regex.'/i', stripslashes($compare), $matches);
+
+					$this->assertEmpty($matches, $regex.' collided with '.$compare);
+				}
+			}
+		}
+	}
 }

Please login to merge, or discard this patch.

		@@ -461,7 +461,7 @@ discard block
		block discarded – undo
461	461	public function setHttpHeaders($httpHeaders = null)
462	462	{
463	463	// use global _SERVER if $httpHeaders aren't defined
464		- if (!is_array($httpHeaders) || !count($httpHeaders)) {
	464	+ if ( ! is_array($httpHeaders) || ! count($httpHeaders)) {
465	465	$httpHeaders = $_SERVER;
466	466	}
467	467	// clear existing headers
		@@ -492,7 +492,7 @@ discard block
		block discarded – undo
492	492	}
493	493	}
494	494
495		- return $this->userAgent = (!empty($this->userAgent) ? trim($this->userAgent) : null);
	495	+ return $this->userAgent = ( ! empty($this->userAgent) ? trim($this->userAgent) : null);
496	496	}
497	497	}
498	498

		@@ -2,55 +2,55 @@
		block discarded – undo
2	2
3	3	class UserAgentTest extends PHPUnit_Framework_TestCase
4	4	{
5		- protected $CrawlerDetect;
6		-
7		- public function setUp()
8		- {
9		- $this->CrawlerDetect = new Jaybizzle\CrawlerDetect\CrawlerDetect();
10		- }
11		-
12		- public function testBots()
13		- {
14		- $lines = file(__DIR__.'/crawlers.txt', FILE_IGNORE_NEW_LINES | FILE_SKIP_EMPTY_LINES);
15		-
16		- foreach ($lines as $line) {
17		- $test = $this->CrawlerDetect->isCrawler($line);
18		- $this->assertEquals($test, true, $line);
19		- }
20		- }
21		-
22		- public function testDevices()
23		- {
24		- $lines = file(__DIR__.'/devices.txt', FILE_IGNORE_NEW_LINES | FILE_SKIP_EMPTY_LINES);
25		-
26		- foreach ($lines as $line) {
27		- $test = $this->CrawlerDetect->isCrawler($line);
28		- $this->assertEquals($test, false, $line);
29		- }
30		- }
31		-
32		- public function testReturnsCorrectMatchedBotName()
33		- {
34		- $test = $this->CrawlerDetect->isCrawler('Mozilla/5.0 (iPhone; CPU iPhone OS 7_1 like Mac OS X) AppleWebKit (KHTML, like Gecko) Mobile (compatible; Yahoo Ad monitoring; https://help.yahoo.com/kb/yahoo-ad-monitoring-SLN24857.html)');
35		-
36		- $matches = $this->CrawlerDetect->getMatches();
37		-
38		- $this->assertEquals($this->CrawlerDetect->getMatches(), 'Yahoo Ad monitoring', $matches);
39		- }
40		-
41		- public function testForRegexCollision()
42		- {
43		- $crawlers = $this->CrawlerDetect->getCrawlers();
44		-
45		- foreach ($crawlers as $regex) {
46		- foreach ($crawlers as $compare) {
47		- // Dont check this regex against itself
48		- if ($regex != $compare) {
49		- preg_match('/'.$regex.'/i', stripslashes($compare), $matches);
50		-
51		- $this->assertEmpty($matches, $regex.' collided with '.$compare);
52		- }
53		- }
54		- }
55		- }
	5	+ protected $CrawlerDetect;
	6	+
	7	+ public function setUp()
	8	+ {
	9	+ $this->CrawlerDetect = new Jaybizzle\CrawlerDetect\CrawlerDetect();
	10	+ }
	11	+
	12	+ public function testBots()
	13	+ {
	14	+ $lines = file(__DIR__.'/crawlers.txt', FILE_IGNORE_NEW_LINES | FILE_SKIP_EMPTY_LINES);
	15	+
	16	+ foreach ($lines as $line) {
	17	+ $test = $this->CrawlerDetect->isCrawler($line);
	18	+ $this->assertEquals($test, true, $line);
	19	+ }
	20	+ }
	21	+
	22	+ public function testDevices()
	23	+ {
	24	+ $lines = file(__DIR__.'/devices.txt', FILE_IGNORE_NEW_LINES | FILE_SKIP_EMPTY_LINES);
	25	+
	26	+ foreach ($lines as $line) {
	27	+ $test = $this->CrawlerDetect->isCrawler($line);
	28	+ $this->assertEquals($test, false, $line);
	29	+ }
	30	+ }
	31	+
	32	+ public function testReturnsCorrectMatchedBotName()
	33	+ {
	34	+ $test = $this->CrawlerDetect->isCrawler('Mozilla/5.0 (iPhone; CPU iPhone OS 7_1 like Mac OS X) AppleWebKit (KHTML, like Gecko) Mobile (compatible; Yahoo Ad monitoring; https://help.yahoo.com/kb/yahoo-ad-monitoring-SLN24857.html)');
	35	+
	36	+ $matches = $this->CrawlerDetect->getMatches();
	37	+
	38	+ $this->assertEquals($this->CrawlerDetect->getMatches(), 'Yahoo Ad monitoring', $matches);
	39	+ }
	40	+
	41	+ public function testForRegexCollision()
	42	+ {
	43	+ $crawlers = $this->CrawlerDetect->getCrawlers();
	44	+
	45	+ foreach ($crawlers as $regex) {
	46	+ foreach ($crawlers as $compare) {
	47	+ // Dont check this regex against itself
	48	+ if ($regex != $compare) {
	49	+ preg_match('/'.$regex.'/i', stripslashes($compare), $matches);
	50	+
	51	+ $this->assertEmpty($matches, $regex.' collided with '.$compare);
	52	+ }
	53	+ }
	54	+ }
	55	+ }
56	56	}

JayBizzle / Crawler-Detect

Push — master ( 082cfe...e31477 )

Status

Category

Spacing +2 added lines, -2 removed lines patch added patch discarded remove patch

Indentation +491 added lines, -491 removed lines patch added patch discarded remove patch

Indentation +51 added lines, -51 removed lines patch added patch discarded remove patch