Inspection of "Merge pull request #3 from codysnider/codysnider/c..." - codysnider/tt-rss - Measure and Improve Code Quality continuously with Scrutinizer

Passed

Push — master ( 5a5c41...fade3b )

by Cody

created 2019-12-20 20:43 UTC

Status

Indentation +1 added lines, -1 removed lines patch added patch discarded remove patch

@@ -6,5 +6,5 @@
 block discarded – undo
 
 class DOMEntityReference extends \DOMEntityReference
 {
-    use NodeTrait;
+	use NodeTrait;
 }

Please login to merge, or discard this patch.

plugins/af_readability/vendor/andreskrey/Readability/Nodes/DOM/DOMNotation.php 1 patch

Indentation +1 added lines, -1 removed lines patch added patch discarded remove patch

@@ -6,5 +6,5 @@
 block discarded – undo
 
 class DOMNotation extends \DOMNotation
 {
-    use NodeTrait;
+	use NodeTrait;
 }

Please login to merge, or discard this patch.

plugins/af_readability/vendor/andreskrey/Readability/Nodes/DOM/DOMComment.php 1 patch

Indentation +1 added lines, -1 removed lines patch added patch discarded remove patch

@@ -6,5 +6,5 @@
 block discarded – undo
 
 class DOMComment extends \DOMComment
 {
-    use NodeTrait;
+	use NodeTrait;
 }

Please login to merge, or discard this patch.

plugins/af_readability/vendor/andreskrey/Readability/Nodes/DOM/DOMDocumentFragment.php 1 patch

Indentation +1 added lines, -1 removed lines patch added patch discarded remove patch

@@ -6,5 +6,5 @@
 block discarded – undo
 
 class DOMDocumentFragment extends \DOMDocumentFragment
 {
-    use NodeTrait;
+	use NodeTrait;
 }

Please login to merge, or discard this patch.

plugins/af_readability/vendor/andreskrey/Readability/Nodes/DOM/DOMNodeList.php 1 patch

Indentation +58 added lines, -58 removed lines patch added patch discarded remove patch

@@ -14,69 +14,69 @@
 block discarded – undo
  */
 class DOMNodeList implements \Countable, \IteratorAggregate
 {
-    /**
-     * @var array
-     */
-    protected $items = [];
+	/**
+	 * @var array
+	 */
+	protected $items = [];
 
-    /**
-     * @var int
-     */
-    protected $length = 0;
+	/**
+	 * @var int
+	 */
+	protected $length = 0;
 
-    /**
-     * To allow access to length in the same way that DOMNodeList allows.
-     *
-     * {@inheritdoc}
-     */
-    public function __get($name)
-    {
-        switch ($name) {
-            case 'length':
-                return $this->length;
-            default:
-                trigger_error(sprintf('Undefined property: %s::%s', static::class, $name));
-        }
-    }
+	/**
+	 * To allow access to length in the same way that DOMNodeList allows.
+	 *
+	 * {@inheritdoc}
+	 */
+	public function __get($name)
+	{
+		switch ($name) {
+			case 'length':
+				return $this->length;
+			default:
+				trigger_error(sprintf('Undefined property: %s::%s', static::class, $name));
+		}
+	}
 
-    /**
-     * @param DOMNode|DOMElement|DOMComment $node
-     *
-     * @return DOMNodeList
-     */
-    public function add($node)
-    {
-        $this->items[] = $node;
-        $this->length++;
+	/**
+	 * @param DOMNode|DOMElement|DOMComment $node
+	 *
+	 * @return DOMNodeList
+	 */
+	public function add($node)
+	{
+		$this->items[] = $node;
+		$this->length++;
 
-        return $this;
-    }
+		return $this;
+	}
 
-    /**
-     * @param int $offset
-     *
-     * @return DOMNode|DOMElement|DOMComment
-     */
-    public function item(int $offset)
-    {
-        return $this->items[$offset];
-    }
+	/**
+	 * @param int $offset
+	 *
+	 * @return DOMNode|DOMElement|DOMComment
+	 */
+	public function item(int $offset)
+	{
+		return $this->items[$offset];
+	}
 
-    /**
-     * @return int|void
-     */
-    public function count(): int
-    {
-        return $this->length;
-    }
+	/**
+	 * @return int|void
+	 */
+	public function count(): int
+	{
+		return $this->length;
+	}
 
-    /**
-     * To make it compatible with iterator_to_array() function.
-     *
-     * {@inheritdoc}
-     */
-    public function getIterator(): \ArrayIterator
-    {
-        return new \ArrayIterator($this->items);
-    }
+	/**
+	 * To make it compatible with iterator_to_array() function.
+	 *
+	 * {@inheritdoc}
+	 */
+	public function getIterator(): \ArrayIterator
+	{
+		return new \ArrayIterator($this->items);
+	}
 }

Please login to merge, or discard this patch.

plugins/af_readability/vendor/andreskrey/Readability/Nodes/DOM/DOMDocument.php 1 patch

Indentation +19 added lines, -19 removed lines patch added patch discarded remove patch

@@ -6,25 +6,25 @@
 block discarded – undo
 
 class DOMDocument extends \DOMDocument
 {
-    use NodeTrait;
+	use NodeTrait;
 
-    public function __construct($version, $encoding)
-    {
-        parent::__construct($version, $encoding);
+	public function __construct($version, $encoding)
+	{
+		parent::__construct($version, $encoding);
 
-        $this->registerNodeClass('DOMAttr', DOMAttr::class);
-        $this->registerNodeClass('DOMCdataSection', DOMCdataSection::class);
-        $this->registerNodeClass('DOMCharacterData', DOMCharacterData::class);
-        $this->registerNodeClass('DOMComment', DOMComment::class);
-        $this->registerNodeClass('DOMDocument', self::class);
-        $this->registerNodeClass('DOMDocumentFragment', DOMDocumentFragment::class);
-        $this->registerNodeClass('DOMDocumentType', DOMDocumentType::class);
-        $this->registerNodeClass('DOMElement', DOMElement::class);
-        $this->registerNodeClass('DOMEntity', DOMEntity::class);
-        $this->registerNodeClass('DOMEntityReference', DOMEntityReference::class);
-        $this->registerNodeClass('DOMNode', DOMNode::class);
-        $this->registerNodeClass('DOMNotation', DOMNotation::class);
-        $this->registerNodeClass('DOMProcessingInstruction', DOMProcessingInstruction::class);
-        $this->registerNodeClass('DOMText', DOMText::class);
-    }
+		$this->registerNodeClass('DOMAttr', DOMAttr::class);
+		$this->registerNodeClass('DOMCdataSection', DOMCdataSection::class);
+		$this->registerNodeClass('DOMCharacterData', DOMCharacterData::class);
+		$this->registerNodeClass('DOMComment', DOMComment::class);
+		$this->registerNodeClass('DOMDocument', self::class);
+		$this->registerNodeClass('DOMDocumentFragment', DOMDocumentFragment::class);
+		$this->registerNodeClass('DOMDocumentType', DOMDocumentType::class);
+		$this->registerNodeClass('DOMElement', DOMElement::class);
+		$this->registerNodeClass('DOMEntity', DOMEntity::class);
+		$this->registerNodeClass('DOMEntityReference', DOMEntityReference::class);
+		$this->registerNodeClass('DOMNode', DOMNode::class);
+		$this->registerNodeClass('DOMNotation', DOMNotation::class);
+		$this->registerNodeClass('DOMProcessingInstruction', DOMProcessingInstruction::class);
+		$this->registerNodeClass('DOMText', DOMText::class);
+	}
 }

Please login to merge, or discard this patch.

plugins/af_readability/vendor/andreskrey/Readability/Nodes/DOM/DOMEntity.php 1 patch

Indentation +1 added lines, -1 removed lines patch added patch discarded remove patch

@@ -6,5 +6,5 @@
 block discarded – undo
 
 class DOMEntity extends \DOMEntity
 {
-    use NodeTrait;
+	use NodeTrait;
 }

Please login to merge, or discard this patch.

plugins/af_readability/vendor/andreskrey/Readability/Nodes/NodeUtility.php 1 patch

Indentation +158 added lines, -158 removed lines patch added patch discarded remove patch

@@ -12,126 +12,126 @@  discard block
 block discarded – undo
  */
 class NodeUtility
 {
-    /**
-     * Collection of regexps to check the node usability.
-     *
-     * @var array
-     */
-    public static $regexps = [
-        'unlikelyCandidates' => '/-ad-|banner|breadcrumbs|combx|comment|community|cover-wrap|disqus|extra|foot|header|legends|menu|related|remark|replies|rss|shoutbox|sidebar|skyscraper|social|sponsor|supplemental|ad-break|agegate|pagination|pager|popup|yom-remote/i',
-        'okMaybeItsACandidate' => '/and|article|body|column|main|shadow/i',
-        'extraneous' => '/print|archive|comment|discuss|e[\-]?mail|share|reply|all|login|sign|single|utility/i',
-        'byline' => '/byline|author|dateline|writtenby|p-author/i',
-        'replaceFonts' => '/<(\/?)font[^>]*>/gi',
-        'normalize' => '/\s{2,}/',
-        'videos' => '/\/\/(www\.)?((dailymotion|youtube|youtube-nocookie|player\.vimeo|v\.qq)\.com|(archive|upload\.wikimedia)\.org|player\.twitch\.tv)/i',
-        'nextLink' => '/(next|weiter|continue|>([^\|]|$)|»([^\|]|$))/i',
-        'prevLink' => '/(prev|earl|old|new|<|«)/i',
-        'whitespace' => '/^\s*$/',
-        'hasContent' => '/\S$/',
-        'positive' => '/article|body|content|entry|hentry|h-entry|main|page|pagination|post|text|blog|story/i',
-        'negative' => '/hidden|^hid$| hid$| hid |^hid |banner|combx|comment|com-|contact|foot|footer|footnote|masthead|media|meta|outbrain|promo|related|scroll|share|shoutbox|sidebar|skyscraper|sponsor|shopping|tags|tool|widget/i',
-        // \x{00A0} is the unicode version of &nbsp;
-        'onlyWhitespace' => '/\x{00A0}|\s+/u'
-    ];
-
-    /**
-     * Imported from the Element class on league\html-to-markdown.
-     *
-     * @param $node
-     *
-     * @return DOMElement
-     */
-    public static function nextElement($node)
-    {
-        $next = $node;
-        while ($next
-            && $next->nodeType !== XML_ELEMENT_NODE
-            && $next->isWhitespace()) {
-            $next = $next->nextSibling;
-        }
-
-        return $next;
-    }
-
-    /**
-     * Changes the node tag name. Since tagName on DOMElement is a read only value, this must be done creating a new
-     * element with the new tag name and importing it to the main DOMDocument.
-     *
-     * @param DOMNode $node
-     * @param string $value
-     * @param bool $importAttributes
-     *
-     * @return DOMNode
-     */
-    public static function setNodeTag($node, $value, $importAttributes = true)
-    {
-        $new = new DOMDocument('1.0', 'utf-8');
-        $new->appendChild($new->createElement($value));
-
-        $children = $node->childNodes;
-        /** @var $children \DOMNodeList $i */
-        for ($i = 0; $i < $children->length; $i++) {
-            $import = $new->importNode($children->item($i), true);
-            $new->firstChild->appendChild($import);
-        }
-
-        if ($importAttributes) {
-            // Import attributes from the original node.
-            foreach ($node->attributes as $attribute) {
-                $new->firstChild->setAttribute($attribute->nodeName, $attribute->nodeValue);
-            }
-        }
-
-        // The import must be done on the firstChild of $new, since $new is a DOMDocument and not a DOMElement.
-        $import = $node->ownerDocument->importNode($new->firstChild, true);
-        $node->parentNode->replaceChild($import, $node);
-
-        return $import;
-    }
-
-    /**
-     * Removes the current node and returns the next node to be parsed (child, sibling or parent).
-     *
-     * @param DOMNode $node
-     *
-     * @return DOMNode
-     */
-    public static function removeAndGetNext($node)
-    {
-        $nextNode = self::getNextNode($node, true);
-        $node->parentNode->removeChild($node);
-
-        return $nextNode;
-    }
-
-    /**
-     * Remove the selected node.
-     *
-     * @param $node DOMElement
-     *
-     * @return void
-     **/
-    public static function removeNode($node)
-    {
-        $parent = $node->parentNode;
-        if ($parent) {
-            $parent->removeChild($node);
-        }
-    }
-
-    /**
-     * Returns the next node. First checks for children (if the flag allows it), then for siblings, and finally
-     * for parents.
-     *
-     * @param DOMNode $originalNode
-     * @param bool $ignoreSelfAndKids
-     *
-     * @return DOMNode
-     */
-    public static function getNextNode($originalNode, $ignoreSelfAndKids = false)
-    {
-        /*
+	/**
+	 * Collection of regexps to check the node usability.
+	 *
+	 * @var array
+	 */
+	public static $regexps = [
+		'unlikelyCandidates' => '/-ad-|banner|breadcrumbs|combx|comment|community|cover-wrap|disqus|extra|foot|header|legends|menu|related|remark|replies|rss|shoutbox|sidebar|skyscraper|social|sponsor|supplemental|ad-break|agegate|pagination|pager|popup|yom-remote/i',
+		'okMaybeItsACandidate' => '/and|article|body|column|main|shadow/i',
+		'extraneous' => '/print|archive|comment|discuss|e[\-]?mail|share|reply|all|login|sign|single|utility/i',
+		'byline' => '/byline|author|dateline|writtenby|p-author/i',
+		'replaceFonts' => '/<(\/?)font[^>]*>/gi',
+		'normalize' => '/\s{2,}/',
+		'videos' => '/\/\/(www\.)?((dailymotion|youtube|youtube-nocookie|player\.vimeo|v\.qq)\.com|(archive|upload\.wikimedia)\.org|player\.twitch\.tv)/i',
+		'nextLink' => '/(next|weiter|continue|>([^\|]|$)|»([^\|]|$))/i',
+		'prevLink' => '/(prev|earl|old|new|<|«)/i',
+		'whitespace' => '/^\s*$/',
+		'hasContent' => '/\S$/',
+		'positive' => '/article|body|content|entry|hentry|h-entry|main|page|pagination|post|text|blog|story/i',
+		'negative' => '/hidden|^hid$| hid$| hid |^hid |banner|combx|comment|com-|contact|foot|footer|footnote|masthead|media|meta|outbrain|promo|related|scroll|share|shoutbox|sidebar|skyscraper|sponsor|shopping|tags|tool|widget/i',
+		// \x{00A0} is the unicode version of &nbsp;
+		'onlyWhitespace' => '/\x{00A0}|\s+/u'
+	];
+
+	/**
+	 * Imported from the Element class on league\html-to-markdown.
+	 *
+	 * @param $node
+	 *
+	 * @return DOMElement
+	 */
+	public static function nextElement($node)
+	{
+		$next = $node;
+		while ($next
+			&& $next->nodeType !== XML_ELEMENT_NODE
+			&& $next->isWhitespace()) {
+			$next = $next->nextSibling;
+		}
+
+		return $next;
+	}
+
+	/**
+	 * Changes the node tag name. Since tagName on DOMElement is a read only value, this must be done creating a new
+	 * element with the new tag name and importing it to the main DOMDocument.
+	 *
+	 * @param DOMNode $node
+	 * @param string $value
+	 * @param bool $importAttributes
+	 *
+	 * @return DOMNode
+	 */
+	public static function setNodeTag($node, $value, $importAttributes = true)
+	{
+		$new = new DOMDocument('1.0', 'utf-8');
+		$new->appendChild($new->createElement($value));
+
+		$children = $node->childNodes;
+		/** @var $children \DOMNodeList $i */
+		for ($i = 0; $i < $children->length; $i++) {
+			$import = $new->importNode($children->item($i), true);
+			$new->firstChild->appendChild($import);
+		}
+
+		if ($importAttributes) {
+			// Import attributes from the original node.
+			foreach ($node->attributes as $attribute) {
+				$new->firstChild->setAttribute($attribute->nodeName, $attribute->nodeValue);
+			}
+		}
+
+		// The import must be done on the firstChild of $new, since $new is a DOMDocument and not a DOMElement.
+		$import = $node->ownerDocument->importNode($new->firstChild, true);
+		$node->parentNode->replaceChild($import, $node);
+
+		return $import;
+	}
+
+	/**
+	 * Removes the current node and returns the next node to be parsed (child, sibling or parent).
+	 *
+	 * @param DOMNode $node
+	 *
+	 * @return DOMNode
+	 */
+	public static function removeAndGetNext($node)
+	{
+		$nextNode = self::getNextNode($node, true);
+		$node->parentNode->removeChild($node);
+
+		return $nextNode;
+	}
+
+	/**
+	 * Remove the selected node.
+	 *
+	 * @param $node DOMElement
+	 *
+	 * @return void
+	 **/
+	public static function removeNode($node)
+	{
+		$parent = $node->parentNode;
+		if ($parent) {
+			$parent->removeChild($node);
+		}
+	}
+
+	/**
+	 * Returns the next node. First checks for children (if the flag allows it), then for siblings, and finally
+	 * for parents.
+	 *
+	 * @param DOMNode $originalNode
+	 * @param bool $ignoreSelfAndKids
+	 *
+	 * @return DOMNode
+	 */
+	public static function getNextNode($originalNode, $ignoreSelfAndKids = false)
+	{
+		/*
          * Traverse the DOM from node to node, starting at the node passed in.
          * Pass true for the second parameter to indicate this node itself
          * (and its kids) are going away, and we want the next node over.
@@ -139,42 +139,42 @@  discard block
 block discarded – undo
          * Calling this in a loop will traverse the DOM depth-first.
          */
 
-        // First check for kids if those aren't being ignored
-        if (!$ignoreSelfAndKids && $originalNode->firstChild) {
-            return $originalNode->firstChild;
-        }
-
-        // Then for siblings...
-        if ($originalNode->nextSibling) {
-            return $originalNode->nextSibling;
-        }
-
-        // And finally, move up the parent chain *and* find a sibling
-        // (because this is depth-first traversal, we will have already
-        // seen the parent nodes themselves).
-        do {
-            $originalNode = $originalNode->parentNode;
-        } while ($originalNode && !$originalNode->nextSibling);
-
-        return ($originalNode) ? $originalNode->nextSibling : $originalNode;
-    }
-
-    /**
-     * Remove all empty DOMNodes from DOMNodeLists.
-     *
-     * @param \DOMNodeList $list
-     *
-     * @return DOMNodeList
-     */
-    public static function filterTextNodes(\DOMNodeList $list)
-    {
-        $newList = new DOMNodeList();
-        foreach ($list as $node) {
-            if ($node->nodeType !== XML_TEXT_NODE || mb_strlen(trim($node->nodeValue))) {
-                $newList->add($node);
-            }
-        }
-
-        return $newList;
-    }
+		// First check for kids if those aren't being ignored
+		if (!$ignoreSelfAndKids && $originalNode->firstChild) {
+			return $originalNode->firstChild;
+		}
+
+		// Then for siblings...
+		if ($originalNode->nextSibling) {
+			return $originalNode->nextSibling;
+		}
+
+		// And finally, move up the parent chain *and* find a sibling
+		// (because this is depth-first traversal, we will have already
+		// seen the parent nodes themselves).
+		do {
+			$originalNode = $originalNode->parentNode;
+		} while ($originalNode && !$originalNode->nextSibling);
+
+		return ($originalNode) ? $originalNode->nextSibling : $originalNode;
+	}
+
+	/**
+	 * Remove all empty DOMNodes from DOMNodeLists.
+	 *
+	 * @param \DOMNodeList $list
+	 *
+	 * @return DOMNodeList
+	 */
+	public static function filterTextNodes(\DOMNodeList $list)
+	{
+		$newList = new DOMNodeList();
+		foreach ($list as $node) {
+			if ($node->nodeType !== XML_TEXT_NODE || mb_strlen(trim($node->nodeValue))) {
+				$newList->add($node);
+			}
+		}
+
+		return $newList;
+	}
 }

Please login to merge, or discard this patch.

plugins/af_readability/vendor/andreskrey/Readability/Nodes/NodeTrait.php 1 patch

Indentation +553 added lines, -553 removed lines patch added patch discarded remove patch

@@ -13,75 +13,75 @@  discard block
 block discarded – undo
  */
 trait NodeTrait
 {
-    /**
-     * Content score of the node. Used to determine the value of the content.
-     *
-     * @var int
-     */
-    public $contentScore = 0;
-
-    /**
-     * Flag for initialized status.
-     *
-     * @var bool
-     */
-    private $initialized = false;
-
-    /**
-     * Flag data tables.
-     *
-     * @var bool
-     */
-    private $readabilityDataTable = false;
-
-    /**
-     * @var array
-     */
-    private $divToPElements = [
-        'a',
-        'blockquote',
-        'dl',
-        'div',
-        'img',
-        'ol',
-        'p',
-        'pre',
-        'table',
-        'ul',
-        'select',
-    ];
-
-    /**
-     * The commented out elements qualify as phrasing content but tend to be
-     * removed by readability when put into paragraphs, so we ignore them here.
-     *
-     * @var array
-     */
-    private $phrasing_elems = [
-        // 'CANVAS', 'IFRAME', 'SVG', 'VIDEO',
-        'abbr', 'audio', 'b', 'bdo', 'br', 'button', 'cite', 'code', 'data',
-        'datalist', 'dfn', 'em', 'embed', 'i', 'img', 'input', 'kbd', 'label',
-        'mark', 'math', 'meter', 'noscript', 'object', 'output', 'progress', 'q',
-        'ruby', 'samp', 'script', 'select', 'small', 'span', 'strong', 'sub',
-        'sup', 'textarea', 'time', 'var', 'wbr'
-    ];
-
-    /**
-     * initialized getter.
-     *
-     * @return bool
-     */
-    public function isInitialized()
-    {
-        return $this->initialized;
-    }
-
-    /**
-     * @return bool
-     */
-    public function isReadabilityDataTable()
-    {
-        /*
+	/**
+	 * Content score of the node. Used to determine the value of the content.
+	 *
+	 * @var int
+	 */
+	public $contentScore = 0;
+
+	/**
+	 * Flag for initialized status.
+	 *
+	 * @var bool
+	 */
+	private $initialized = false;
+
+	/**
+	 * Flag data tables.
+	 *
+	 * @var bool
+	 */
+	private $readabilityDataTable = false;
+
+	/**
+	 * @var array
+	 */
+	private $divToPElements = [
+		'a',
+		'blockquote',
+		'dl',
+		'div',
+		'img',
+		'ol',
+		'p',
+		'pre',
+		'table',
+		'ul',
+		'select',
+	];
+
+	/**
+	 * The commented out elements qualify as phrasing content but tend to be
+	 * removed by readability when put into paragraphs, so we ignore them here.
+	 *
+	 * @var array
+	 */
+	private $phrasing_elems = [
+		// 'CANVAS', 'IFRAME', 'SVG', 'VIDEO',
+		'abbr', 'audio', 'b', 'bdo', 'br', 'button', 'cite', 'code', 'data',
+		'datalist', 'dfn', 'em', 'embed', 'i', 'img', 'input', 'kbd', 'label',
+		'mark', 'math', 'meter', 'noscript', 'object', 'output', 'progress', 'q',
+		'ruby', 'samp', 'script', 'select', 'small', 'span', 'strong', 'sub',
+		'sup', 'textarea', 'time', 'var', 'wbr'
+	];
+
+	/**
+	 * initialized getter.
+	 *
+	 * @return bool
+	 */
+	public function isInitialized()
+	{
+		return $this->initialized;
+	}
+
+	/**
+	 * @return bool
+	 */
+	public function isReadabilityDataTable()
+	{
+		/*
          * This is a workaround that I'd like to remove in the future.
          * Seems that although we are extending the base DOMElement and adding custom properties (like this one,
          * 'readabilityDataTable'), these properties get lost when you search for elements with getElementsByTagName.
@@ -91,388 +91,388 @@  discard block
 block discarded – undo
          *
          * @see https://stackoverflow.com/questions/35654709/php-registernodeclass-and-reusing-variable-names
          */
-        return $this->hasAttribute('readabilityDataTable')
-            && $this->getAttribute('readabilityDataTable') === '1';
+		return $this->hasAttribute('readabilityDataTable')
+			&& $this->getAttribute('readabilityDataTable') === '1';
 //        return $this->readabilityDataTable;
-    }
-
-    /**
-     * @param bool $param
-     */
-    public function setReadabilityDataTable($param)
-    {
-        // Can't be "true" because DOMDocument casts it to "1"
-        $this->setAttribute('readabilityDataTable', $param ? '1' : '0');
+	}
+
+	/**
+	 * @param bool $param
+	 */
+	public function setReadabilityDataTable($param)
+	{
+		// Can't be "true" because DOMDocument casts it to "1"
+		$this->setAttribute('readabilityDataTable', $param ? '1' : '0');
 //        $this->readabilityDataTable = $param;
-    }
-
-    /**
-     * Initializer. Calculates the current score of the node and returns a full Readability object.
-     *
-     * @ TODO: I don't like the weightClasses param. How can we get the config here?
-     *
-     * @param $weightClasses bool Weight classes?
-     *
-     * @return static
-     */
-    public function initializeNode($weightClasses)
-    {
-        if (!$this->isInitialized()) {
-            $contentScore = 0;
-
-            switch ($this->nodeName) {
-                case 'div':
-                    $contentScore += 5;
-                    break;
-
-                case 'pre':
-                case 'td':
-                case 'blockquote':
-                    $contentScore += 3;
-                    break;
-
-                case 'address':
-                case 'ol':
-                case 'ul':
-                case 'dl':
-                case 'dd':
-                case 'dt':
-                case 'li':
-                case 'form':
-                    $contentScore -= 3;
-                    break;
-
-                case 'h1':
-                case 'h2':
-                case 'h3':
-                case 'h4':
-                case 'h5':
-                case 'h6':
-                case 'th':
-                    $contentScore -= 5;
-                    break;
-            }
-
-            $this->contentScore = $contentScore + ($weightClasses ? $this->getClassWeight() : 0);
-
-            $this->initialized = true;
-        }
-
-        return $this;
-    }
-
-    /**
-     * Override for native getAttribute method. Some nodes have the getAttribute method, some don't, so we need
-     * to check first the existence of the attributes property.
-     *
-     * @param $attributeName string Attribute to retrieve
-     *
-     * @return string
-     */
-    public function getAttribute($attributeName)
-    {
-        if (!is_null($this->attributes)) {
-            return parent::getAttribute($attributeName);
-        }
-
-        return '';
-    }
-
-    /**
-     * Override for native hasAttribute.
-     *
-     * @param $attributeName
-     *
-     * @return bool
-     *
-     * @see getAttribute
-     */
-    public function hasAttribute($attributeName)
-    {
-        if (!is_null($this->attributes)) {
-            return parent::hasAttribute($attributeName);
-        }
-
-        return false;
-    }
-
-    /**
-     * Get the ancestors of the current node.
-     *
-     * @param int|bool $maxLevel Max amount of ancestors to get. False for all of them
-     *
-     * @return array
-     */
-    public function getNodeAncestors($maxLevel = 3)
-    {
-        $ancestors = [];
-        $level = 0;
-
-        $node = $this->parentNode;
-
-        while ($node && !($node instanceof DOMDocument)) {
-            $ancestors[] = $node;
-            $level++;
-            if ($level === $maxLevel) {
-                break;
-            }
-            $node = $node->parentNode;
-        }
-
-        return $ancestors;
-    }
-
-    /**
-     * Returns all links from the current element.
-     *
-     * @return array
-     */
-    public function getAllLinks()
-    {
-        return iterator_to_array($this->getElementsByTagName('a'));
-    }
-
-    /**
-     * Get the density of links as a percentage of the content
-     * This is the amount of text that is inside a link divided by the total text in the node.
-     *
-     * @return int
-     */
-    public function getLinkDensity()
-    {
-        $linkLength = 0;
-        $textLength = mb_strlen($this->getTextContent(true));
-
-        if (!$textLength) {
-            return 0;
-        }
-
-        $links = $this->getAllLinks();
-
-        if ($links) {
-            /** @var DOMElement $link */
-            foreach ($links as $link) {
-                $linkLength += mb_strlen($link->getTextContent(true));
-            }
-        }
-
-        return $linkLength / $textLength;
-    }
-
-    /**
-     * Calculates the weight of the class/id of the current element.
-     *
-     * @return int
-     */
-    public function getClassWeight()
-    {
-        $weight = 0;
-
-        // Look for a special classname
-        $class = $this->getAttribute('class');
-        if (trim($class)) {
-            if (preg_match(NodeUtility::$regexps['negative'], $class)) {
-                $weight -= 25;
-            }
-
-            if (preg_match(NodeUtility::$regexps['positive'], $class)) {
-                $weight += 25;
-            }
-        }
-
-        // Look for a special ID
-        $id = $this->getAttribute('id');
-        if (trim($id)) {
-            if (preg_match(NodeUtility::$regexps['negative'], $id)) {
-                $weight -= 25;
-            }
-
-            if (preg_match(NodeUtility::$regexps['positive'], $id)) {
-                $weight += 25;
-            }
-        }
-
-        return $weight;
-    }
-
-    /**
-     * Returns the full text of the node.
-     *
-     * @param bool $normalize Normalize white space?
-     *
-     * @return string
-     */
-    public function getTextContent($normalize = false)
-    {
-        $nodeValue = $this->nodeValue;
-        if ($normalize) {
-            $nodeValue = trim(preg_replace('/\s{2,}/', ' ', $nodeValue));
-        }
-
-        return $nodeValue;
-    }
-
-    /**
-     * Returns the children of the current node.
-     *
-     * @param bool $filterEmptyDOMText Filter empty DOMText nodes?
-     *
-     * @deprecated Use NodeUtility::filterTextNodes, function will be removed in version 3.0
-     *
-     * @return array
-     */
-    public function getChildren($filterEmptyDOMText = false)
-    {
-        @trigger_error('getChildren was replaced with NodeUtility::filterTextNodes and will be removed in version 3.0', E_USER_DEPRECATED);
-
-        $ret = iterator_to_array($this->childNodes);
-        if ($filterEmptyDOMText) {
-            // Array values is used to discard the key order. Needs to be 0 to whatever without skipping any number
-            $ret = array_values(array_filter($ret, function ($node) {
-                return $node->nodeName !== '#text' || mb_strlen(trim($node->nodeValue));
-            }));
-        }
-
-        return $ret;
-    }
-
-    /**
-     * Return an array indicating how many rows and columns this table has.
-     *
-     * @return array
-     */
-    public function getRowAndColumnCount()
-    {
-        $rows = $columns = 0;
-        $trs = $this->getElementsByTagName('tr');
-        foreach ($trs as $tr) {
-            /** @var \DOMElement $tr */
-            $rowspan = $tr->getAttribute('rowspan');
-            $rows += ($rowspan || 1);
-
-            // Now look for column-related info
-            $columnsInThisRow = 0;
-            $cells = $tr->getElementsByTagName('td');
-            foreach ($cells as $cell) {
-                /** @var \DOMElement $cell */
-                $colspan = $cell->getAttribute('colspan');
-                $columnsInThisRow += ($colspan || 1);
-            }
-            $columns = max($columns, $columnsInThisRow);
-        }
-
-        return ['rows' => $rows, 'columns' => $columns];
-    }
-
-    /**
-     * Creates a new node based on the text content of the original node.
-     *
-     * @param $originalNode DOMNode
-     * @param $tagName string
-     *
-     * @return DOMElement
-     */
-    public function createNode($originalNode, $tagName)
-    {
-        $text = $originalNode->getTextContent();
-        $newNode = $originalNode->ownerDocument->createElement($tagName, $text);
-
-        return $newNode;
-    }
-
-    /**
-     * Check if a given node has one of its ancestor tag name matching the
-     * provided one.
-     *
-     * @param string $tagName
-     * @param int $maxDepth
-     * @param callable $filterFn
-     *
-     * @return bool
-     */
-    public function hasAncestorTag($tagName, $maxDepth = 3, callable $filterFn = null)
-    {
-        $depth = 0;
-        $node = $this;
-
-        while ($node->parentNode) {
-            if ($maxDepth > 0 && $depth > $maxDepth) {
-                return false;
-            }
-
-            if ($node->parentNode->nodeName === $tagName && (!$filterFn || $filterFn($node->parentNode))) {
-                return true;
-            }
-
-            $node = $node->parentNode;
-            $depth++;
-        }
-
-        return false;
-    }
-
-    /**
-     * Check if this node has only whitespace and a single element with given tag
-     * or if it contains no element with given tag or more than 1 element.
-     *
-     * @param $tag string Name of tag
-     *
-     * @return bool
-     */
-    public function hasSingleTagInsideElement($tag)
-    {
-        // There should be exactly 1 element child with given tag
-        if (count($children = NodeUtility::filterTextNodes($this->childNodes)) !== 1 || $children->item(0)->nodeName !== $tag) {
-            return false;
-        }
-
-        // And there should be no text nodes with real content
-        return array_reduce(iterator_to_array($children), function ($carry, $child) {
-            if (!$carry === false) {
-                return false;
-            }
-
-            /* @var DOMNode $child */
-            return !($child->nodeType === XML_TEXT_NODE && !preg_match('/\S$/', $child->getTextContent()));
-        });
-    }
-
-    /**
-     * Check if the current element has a single child block element.
-     * Block elements are the ones defined in the divToPElements array.
-     *
-     * @return bool
-     */
-    public function hasSingleChildBlockElement()
-    {
-        $result = false;
-        if ($this->hasChildNodes()) {
-            foreach ($this->childNodes as $child) {
-                if (in_array($child->nodeName, $this->divToPElements)) {
-                    $result = true;
-                } else {
-                    // If any of the hasSingleChildBlockElement calls return true, return true then.
-                    /** @var $child DOMElement */
-                    $result = ($result || $child->hasSingleChildBlockElement());
-                }
-            }
-        }
-
-        return $result;
-    }
-
-    /**
-     * Determines if a node has no content or it is just a bunch of dividing lines and/or whitespace.
-     *
-     * @return bool
-     */
-    public function isElementWithoutContent()
-    {
-        return $this instanceof DOMElement &&
-            mb_strlen(preg_replace(NodeUtility::$regexps['onlyWhitespace'], '', $this->textContent)) === 0 &&
-            ($this->childNodes->length === 0 ||
-                $this->childNodes->length === $this->getElementsByTagName('br')->length + $this->getElementsByTagName('hr')->length
-                /*
+	}
+
+	/**
+	 * Initializer. Calculates the current score of the node and returns a full Readability object.
+	 *
+	 * @ TODO: I don't like the weightClasses param. How can we get the config here?
+	 *
+	 * @param $weightClasses bool Weight classes?
+	 *
+	 * @return static
+	 */
+	public function initializeNode($weightClasses)
+	{
+		if (!$this->isInitialized()) {
+			$contentScore = 0;
+
+			switch ($this->nodeName) {
+				case 'div':
+					$contentScore += 5;
+					break;
+
+				case 'pre':
+				case 'td':
+				case 'blockquote':
+					$contentScore += 3;
+					break;
+
+				case 'address':
+				case 'ol':
+				case 'ul':
+				case 'dl':
+				case 'dd':
+				case 'dt':
+				case 'li':
+				case 'form':
+					$contentScore -= 3;
+					break;
+
+				case 'h1':
+				case 'h2':
+				case 'h3':
+				case 'h4':
+				case 'h5':
+				case 'h6':
+				case 'th':
+					$contentScore -= 5;
+					break;
+			}
+
+			$this->contentScore = $contentScore + ($weightClasses ? $this->getClassWeight() : 0);
+
+			$this->initialized = true;
+		}
+
+		return $this;
+	}
+
+	/**
+	 * Override for native getAttribute method. Some nodes have the getAttribute method, some don't, so we need
+	 * to check first the existence of the attributes property.
+	 *
+	 * @param $attributeName string Attribute to retrieve
+	 *
+	 * @return string
+	 */
+	public function getAttribute($attributeName)
+	{
+		if (!is_null($this->attributes)) {
+			return parent::getAttribute($attributeName);
+		}
+
+		return '';
+	}
+
+	/**
+	 * Override for native hasAttribute.
+	 *
+	 * @param $attributeName
+	 *
+	 * @return bool
+	 *
+	 * @see getAttribute
+	 */
+	public function hasAttribute($attributeName)
+	{
+		if (!is_null($this->attributes)) {
+			return parent::hasAttribute($attributeName);
+		}
+
+		return false;
+	}
+
+	/**
+	 * Get the ancestors of the current node.
+	 *
+	 * @param int|bool $maxLevel Max amount of ancestors to get. False for all of them
+	 *
+	 * @return array
+	 */
+	public function getNodeAncestors($maxLevel = 3)
+	{
+		$ancestors = [];
+		$level = 0;
+
+		$node = $this->parentNode;
+
+		while ($node && !($node instanceof DOMDocument)) {
+			$ancestors[] = $node;
+			$level++;
+			if ($level === $maxLevel) {
+				break;
+			}
+			$node = $node->parentNode;
+		}
+
+		return $ancestors;
+	}
+
+	/**
+	 * Returns all links from the current element.
+	 *
+	 * @return array
+	 */
+	public function getAllLinks()
+	{
+		return iterator_to_array($this->getElementsByTagName('a'));
+	}
+
+	/**
+	 * Get the density of links as a percentage of the content
+	 * This is the amount of text that is inside a link divided by the total text in the node.
+	 *
+	 * @return int
+	 */
+	public function getLinkDensity()
+	{
+		$linkLength = 0;
+		$textLength = mb_strlen($this->getTextContent(true));
+
+		if (!$textLength) {
+			return 0;
+		}
+
+		$links = $this->getAllLinks();
+
+		if ($links) {
+			/** @var DOMElement $link */
+			foreach ($links as $link) {
+				$linkLength += mb_strlen($link->getTextContent(true));
+			}
+		}
+
+		return $linkLength / $textLength;
+	}
+
+	/**
+	 * Calculates the weight of the class/id of the current element.
+	 *
+	 * @return int
+	 */
+	public function getClassWeight()
+	{
+		$weight = 0;
+
+		// Look for a special classname
+		$class = $this->getAttribute('class');
+		if (trim($class)) {
+			if (preg_match(NodeUtility::$regexps['negative'], $class)) {
+				$weight -= 25;
+			}
+
+			if (preg_match(NodeUtility::$regexps['positive'], $class)) {
+				$weight += 25;
+			}
+		}
+
+		// Look for a special ID
+		$id = $this->getAttribute('id');
+		if (trim($id)) {
+			if (preg_match(NodeUtility::$regexps['negative'], $id)) {
+				$weight -= 25;
+			}
+
+			if (preg_match(NodeUtility::$regexps['positive'], $id)) {
+				$weight += 25;
+			}
+		}
+
+		return $weight;
+	}
+
+	/**
+	 * Returns the full text of the node.
+	 *
+	 * @param bool $normalize Normalize white space?
+	 *
+	 * @return string
+	 */
+	public function getTextContent($normalize = false)
+	{
+		$nodeValue = $this->nodeValue;
+		if ($normalize) {
+			$nodeValue = trim(preg_replace('/\s{2,}/', ' ', $nodeValue));
+		}
+
+		return $nodeValue;
+	}
+
+	/**
+	 * Returns the children of the current node.
+	 *
+	 * @param bool $filterEmptyDOMText Filter empty DOMText nodes?
+	 *
+	 * @deprecated Use NodeUtility::filterTextNodes, function will be removed in version 3.0
+	 *
+	 * @return array
+	 */
+	public function getChildren($filterEmptyDOMText = false)
+	{
+		@trigger_error('getChildren was replaced with NodeUtility::filterTextNodes and will be removed in version 3.0', E_USER_DEPRECATED);
+
+		$ret = iterator_to_array($this->childNodes);
+		if ($filterEmptyDOMText) {
+			// Array values is used to discard the key order. Needs to be 0 to whatever without skipping any number
+			$ret = array_values(array_filter($ret, function ($node) {
+				return $node->nodeName !== '#text' || mb_strlen(trim($node->nodeValue));
+			}));
+		}
+
+		return $ret;
+	}
+
+	/**
+	 * Return an array indicating how many rows and columns this table has.
+	 *
+	 * @return array
+	 */
+	public function getRowAndColumnCount()
+	{
+		$rows = $columns = 0;
+		$trs = $this->getElementsByTagName('tr');
+		foreach ($trs as $tr) {
+			/** @var \DOMElement $tr */
+			$rowspan = $tr->getAttribute('rowspan');
+			$rows += ($rowspan || 1);
+
+			// Now look for column-related info
+			$columnsInThisRow = 0;
+			$cells = $tr->getElementsByTagName('td');
+			foreach ($cells as $cell) {
+				/** @var \DOMElement $cell */
+				$colspan = $cell->getAttribute('colspan');
+				$columnsInThisRow += ($colspan || 1);
+			}
+			$columns = max($columns, $columnsInThisRow);
+		}
+
+		return ['rows' => $rows, 'columns' => $columns];
+	}
+
+	/**
+	 * Creates a new node based on the text content of the original node.
+	 *
+	 * @param $originalNode DOMNode
+	 * @param $tagName string
+	 *
+	 * @return DOMElement
+	 */
+	public function createNode($originalNode, $tagName)
+	{
+		$text = $originalNode->getTextContent();
+		$newNode = $originalNode->ownerDocument->createElement($tagName, $text);
+
+		return $newNode;
+	}
+
+	/**
+	 * Check if a given node has one of its ancestor tag name matching the
+	 * provided one.
+	 *
+	 * @param string $tagName
+	 * @param int $maxDepth
+	 * @param callable $filterFn
+	 *
+	 * @return bool
+	 */
+	public function hasAncestorTag($tagName, $maxDepth = 3, callable $filterFn = null)
+	{
+		$depth = 0;
+		$node = $this;
+
+		while ($node->parentNode) {
+			if ($maxDepth > 0 && $depth > $maxDepth) {
+				return false;
+			}
+
+			if ($node->parentNode->nodeName === $tagName && (!$filterFn || $filterFn($node->parentNode))) {
+				return true;
+			}
+
+			$node = $node->parentNode;
+			$depth++;
+		}
+
+		return false;
+	}
+
+	/**
+	 * Check if this node has only whitespace and a single element with given tag
+	 * or if it contains no element with given tag or more than 1 element.
+	 *
+	 * @param $tag string Name of tag
+	 *
+	 * @return bool
+	 */
+	public function hasSingleTagInsideElement($tag)
+	{
+		// There should be exactly 1 element child with given tag
+		if (count($children = NodeUtility::filterTextNodes($this->childNodes)) !== 1 || $children->item(0)->nodeName !== $tag) {
+			return false;
+		}
+
+		// And there should be no text nodes with real content
+		return array_reduce(iterator_to_array($children), function ($carry, $child) {
+			if (!$carry === false) {
+				return false;
+			}
+
+			/* @var DOMNode $child */
+			return !($child->nodeType === XML_TEXT_NODE && !preg_match('/\S$/', $child->getTextContent()));
+		});
+	}
+
+	/**
+	 * Check if the current element has a single child block element.
+	 * Block elements are the ones defined in the divToPElements array.
+	 *
+	 * @return bool
+	 */
+	public function hasSingleChildBlockElement()
+	{
+		$result = false;
+		if ($this->hasChildNodes()) {
+			foreach ($this->childNodes as $child) {
+				if (in_array($child->nodeName, $this->divToPElements)) {
+					$result = true;
+				} else {
+					// If any of the hasSingleChildBlockElement calls return true, return true then.
+					/** @var $child DOMElement */
+					$result = ($result || $child->hasSingleChildBlockElement());
+				}
+			}
+		}
+
+		return $result;
+	}
+
+	/**
+	 * Determines if a node has no content or it is just a bunch of dividing lines and/or whitespace.
+	 *
+	 * @return bool
+	 */
+	public function isElementWithoutContent()
+	{
+		return $this instanceof DOMElement &&
+			mb_strlen(preg_replace(NodeUtility::$regexps['onlyWhitespace'], '', $this->textContent)) === 0 &&
+			($this->childNodes->length === 0 ||
+				$this->childNodes->length === $this->getElementsByTagName('br')->length + $this->getElementsByTagName('hr')->length
+				/*
                  * Special PHP DOMDocument case: We also need to count how many DOMText we have inside the node.
                  * If there's an empty tag with an space inside and a BR (for example "<p> <br/></p>) counting only BRs and
                  * HRs will will say that the example has 2 nodes, instead of one. This happens because in DOMDocument,
@@ -480,108 +480,108 @@  discard block
 block discarded – undo
                  * are dealing with (And at this point we know they are empty or are just whitespace, because of the
                  * mb_strlen in this chain of checks).
                  */
-                + count(array_filter(iterator_to_array($this->childNodes), function ($child) {
-                    return $child instanceof DOMText;
-                }))
-
-            );
-    }
-
-    /**
-     * Determine if a node qualifies as phrasing content.
-     * https://developer.mozilla.org/en-US/docs/Web/Guide/HTML/Content_categories#Phrasing_content.
-     *
-     * @return bool
-     */
-    public function isPhrasingContent()
-    {
-        return $this->nodeType === XML_TEXT_NODE || in_array($this->nodeName, $this->phrasing_elems) !== false ||
-            (!is_null($this->childNodes) &&
-                ($this->nodeName === 'a' || $this->nodeName === 'del' || $this->nodeName === 'ins') &&
-                array_reduce(iterator_to_array($this->childNodes), function ($carry, $node) {
-                    return $node->isPhrasingContent() && $carry;
-                }, true)
-            );
-    }
-
-    /**
-     * In the original JS project they check if the node has the style display=none, which unfortunately
-     * in our case we have no way of knowing that. So we just check for the attribute hidden or "display: none".
-     *
-     * Might be a good idea to check for classes or other attributes like 'aria-hidden'
-     *
-     * @return bool
-     */
-    public function isProbablyVisible()
-    {
-        return !preg_match('/display:( )?none/', $this->getAttribute('style')) && !$this->hasAttribute('hidden');
-    }
-
-    /**
-     * @return bool
-     */
-    public function isWhitespace()
-    {
-        return ($this->nodeType === XML_TEXT_NODE && mb_strlen(trim($this->textContent)) === 0) ||
-            ($this->nodeType === XML_ELEMENT_NODE && $this->nodeName === 'br');
-    }
-
-    /**
-     * This is a hack that overcomes the issue of node shifting when scanning and removing nodes.
-     *
-     * In the JS version of getElementsByTagName, if you remove a node it will not appear during the
-     * foreach. This does not happen in PHP DOMDocument, because if you remove a node, it will still appear but as an
-     * orphan node and will give an exception if you try to do anything with it.
-     *
-     * Shifting also occurs when converting parent nodes (like a P to a DIV), which in that case the found nodes are
-     * removed from the foreach "pool" but the internal index of the foreach is not aware and skips over nodes that
-     * never looped over. (index is at position 5, 2 nodes are removed, next one should be node 3, but the foreach tries
-     * to access node 6)
-     *
-     * This function solves this by searching for the nodes on every loop and keeping track of the count differences.
-     * Because on every loop we call getElementsByTagName again, this could cause a performance impact and should be
-     * used only when the results of the search are going to be used to remove the nodes.
-     *
-     * @param string $tag
-     *
-     * @return \Generator
-     */
-    public function shiftingAwareGetElementsByTagName($tag)
-    {
-        /** @var $nodes DOMNodeList */
-        $nodes = $this->getElementsByTagName($tag);
-        $count = $nodes->length;
-
-        for ($i = 0; $i < $count; $i = max(++$i, 0)) {
-            yield $nodes->item($i);
-
-            // Search for all the nodes again
-            $nodes = $this->getElementsByTagName($tag);
-
-            // Subtract the amount of nodes removed from the current index
-            $i -= $count - $nodes->length;
-
-            // Subtract the amount of nodes removed from the current count
-            $count -= ($count - $nodes->length);
-        }
-    }
-
-    /**
-     * Mimics JS's firstElementChild property. PHP only has firstChild which could be any type of DOMNode. Use this
-     * function to get the first one that is an DOMElement node.
-     *
-     * @return \DOMElement|null
-     */
-    public function getFirstElementChild()
-    {
-        if ($this->childNodes instanceof \Traversable) {
-            foreach ($this->childNodes as $node) {
-                if ($node instanceof \DOMElement) {
-                    return $node;
-                }
-            }
-        }
-
-        return null;
-    }
+				+ count(array_filter(iterator_to_array($this->childNodes), function ($child) {
+					return $child instanceof DOMText;
+				}))
+
+			);
+	}
+
+	/**
+	 * Determine if a node qualifies as phrasing content.
+	 * https://developer.mozilla.org/en-US/docs/Web/Guide/HTML/Content_categories#Phrasing_content.
+	 *
+	 * @return bool
+	 */
+	public function isPhrasingContent()
+	{
+		return $this->nodeType === XML_TEXT_NODE || in_array($this->nodeName, $this->phrasing_elems) !== false ||
+			(!is_null($this->childNodes) &&
+				($this->nodeName === 'a' || $this->nodeName === 'del' || $this->nodeName === 'ins') &&
+				array_reduce(iterator_to_array($this->childNodes), function ($carry, $node) {
+					return $node->isPhrasingContent() && $carry;
+				}, true)
+			);
+	}
+
+	/**
+	 * In the original JS project they check if the node has the style display=none, which unfortunately
+	 * in our case we have no way of knowing that. So we just check for the attribute hidden or "display: none".
+	 *
+	 * Might be a good idea to check for classes or other attributes like 'aria-hidden'
+	 *
+	 * @return bool
+	 */
+	public function isProbablyVisible()
+	{
+		return !preg_match('/display:( )?none/', $this->getAttribute('style')) && !$this->hasAttribute('hidden');
+	}
+
+	/**
+	 * @return bool
+	 */
+	public function isWhitespace()
+	{
+		return ($this->nodeType === XML_TEXT_NODE && mb_strlen(trim($this->textContent)) === 0) ||
+			($this->nodeType === XML_ELEMENT_NODE && $this->nodeName === 'br');
+	}
+
+	/**
+	 * This is a hack that overcomes the issue of node shifting when scanning and removing nodes.
+	 *
+	 * In the JS version of getElementsByTagName, if you remove a node it will not appear during the
+	 * foreach. This does not happen in PHP DOMDocument, because if you remove a node, it will still appear but as an
+	 * orphan node and will give an exception if you try to do anything with it.
+	 *
+	 * Shifting also occurs when converting parent nodes (like a P to a DIV), which in that case the found nodes are
+	 * removed from the foreach "pool" but the internal index of the foreach is not aware and skips over nodes that
+	 * never looped over. (index is at position 5, 2 nodes are removed, next one should be node 3, but the foreach tries
+	 * to access node 6)
+	 *
+	 * This function solves this by searching for the nodes on every loop and keeping track of the count differences.
+	 * Because on every loop we call getElementsByTagName again, this could cause a performance impact and should be
+	 * used only when the results of the search are going to be used to remove the nodes.
+	 *
+	 * @param string $tag
+	 *
+	 * @return \Generator
+	 */
+	public function shiftingAwareGetElementsByTagName($tag)
+	{
+		/** @var $nodes DOMNodeList */
+		$nodes = $this->getElementsByTagName($tag);
+		$count = $nodes->length;
+
+		for ($i = 0; $i < $count; $i = max(++$i, 0)) {
+			yield $nodes->item($i);
+
+			// Search for all the nodes again
+			$nodes = $this->getElementsByTagName($tag);
+
+			// Subtract the amount of nodes removed from the current index
+			$i -= $count - $nodes->length;
+
+			// Subtract the amount of nodes removed from the current count
+			$count -= ($count - $nodes->length);
+		}
+	}
+
+	/**
+	 * Mimics JS's firstElementChild property. PHP only has firstChild which could be any type of DOMNode. Use this
+	 * function to get the first one that is an DOMElement node.
+	 *
+	 * @return \DOMElement|null
+	 */
+	public function getFirstElementChild()
+	{
+		if ($this->childNodes instanceof \Traversable) {
+			foreach ($this->childNodes as $node) {
+				if ($node instanceof \DOMElement) {
+					return $node;
+				}
+			}
+		}
+
+		return null;
+	}
 }

Please login to merge, or discard this patch.

		@@ -6,5 +6,5 @@
		block discarded – undo
6	6
7	7	class DOMEntityReference extends \DOMEntityReference
8	8	{
9		- use NodeTrait;
	9	+ use NodeTrait;
10	10	}

		@@ -6,5 +6,5 @@
		block discarded – undo
6	6
7	7	class DOMNotation extends \DOMNotation
8	8	{
9		- use NodeTrait;
	9	+ use NodeTrait;
10	10	}

		@@ -6,5 +6,5 @@
		block discarded – undo
6	6
7	7	class DOMComment extends \DOMComment
8	8	{
9		- use NodeTrait;
	9	+ use NodeTrait;
10	10	}

		@@ -6,5 +6,5 @@
		block discarded – undo
6	6
7	7	class DOMDocumentFragment extends \DOMDocumentFragment
8	8	{
9		- use NodeTrait;
	9	+ use NodeTrait;
10	10	}

		@@ -14,69 +14,69 @@
		block discarded – undo
14	14	*/
15	15	class DOMNodeList implements \Countable, \IteratorAggregate
16	16	{
17		- /**
18		- * @var array
19		- */
20		- protected $items = [];
	17	+ /**
	18	+ * @var array
	19	+ */
	20	+ protected $items = [];
21	21
22		- /**
23		- * @var int
24		- */
25		- protected $length = 0;
	22	+ /**
	23	+ * @var int
	24	+ */
	25	+ protected $length = 0;
26	26
27		- /**
28		- * To allow access to length in the same way that DOMNodeList allows.
29		- *
30		- * {@inheritdoc}
31		- */
32		- public function __get($name)
33		- {
34		- switch ($name) {
35		- case 'length':
36		- return $this->length;
37		- default:
38		- trigger_error(sprintf('Undefined property: %s::%s', static::class, $name));
39		- }
40		- }
	27	+ /**
	28	+ * To allow access to length in the same way that DOMNodeList allows.
	29	+ *
	30	+ * {@inheritdoc}
	31	+ */
	32	+ public function __get($name)
	33	+ {
	34	+ switch ($name) {
	35	+ case 'length':
	36	+ return $this->length;
	37	+ default:
	38	+ trigger_error(sprintf('Undefined property: %s::%s', static::class, $name));
	39	+ }
	40	+ }
41	41
42		- /**
43		- * @param DOMNode\|DOMElement\|DOMComment $node
44		- *
45		- * @return DOMNodeList
46		- */
47		- public function add($node)
48		- {
49		- $this->items[] = $node;
50		- $this->length++;
	42	+ /**
	43	+ * @param DOMNode\|DOMElement\|DOMComment $node
	44	+ *
	45	+ * @return DOMNodeList
	46	+ */
	47	+ public function add($node)
	48	+ {
	49	+ $this->items[] = $node;
	50	+ $this->length++;
51	51
52		- return $this;
53		- }
	52	+ return $this;
	53	+ }
54	54
55		- /**
56		- * @param int $offset
57		- *
58		- * @return DOMNode\|DOMElement\|DOMComment
59		- */
60		- public function item(int $offset)
61		- {
62		- return $this->items[$offset];
63		- }
	55	+ /**
	56	+ * @param int $offset
	57	+ *
	58	+ * @return DOMNode\|DOMElement\|DOMComment
	59	+ */
	60	+ public function item(int $offset)
	61	+ {
	62	+ return $this->items[$offset];
	63	+ }
64	64
65		- /**
66		- * @return int\|void
67		- */
68		- public function count(): int
69		- {
70		- return $this->length;
71		- }
	65	+ /**
	66	+ * @return int\|void
	67	+ */
	68	+ public function count(): int
	69	+ {
	70	+ return $this->length;
	71	+ }
72	72
73		- /**
74		- * To make it compatible with iterator_to_array() function.
75		- *
76		- * {@inheritdoc}
77		- */
78		- public function getIterator(): \ArrayIterator
79		- {
80		- return new \ArrayIterator($this->items);
81		- }
	73	+ /**
	74	+ * To make it compatible with iterator_to_array() function.
	75	+ *
	76	+ * {@inheritdoc}
	77	+ */
	78	+ public function getIterator(): \ArrayIterator
	79	+ {
	80	+ return new \ArrayIterator($this->items);
	81	+ }
82	82	}

		@@ -6,25 +6,25 @@
		block discarded – undo
6	6
7	7	class DOMDocument extends \DOMDocument
8	8	{
9		- use NodeTrait;
	9	+ use NodeTrait;
10	10
11		- public function __construct($version, $encoding)
12		- {
13		- parent::__construct($version, $encoding);
	11	+ public function __construct($version, $encoding)
	12	+ {
	13	+ parent::__construct($version, $encoding);
14	14
15		- $this->registerNodeClass('DOMAttr', DOMAttr::class);
16		- $this->registerNodeClass('DOMCdataSection', DOMCdataSection::class);
17		- $this->registerNodeClass('DOMCharacterData', DOMCharacterData::class);
18		- $this->registerNodeClass('DOMComment', DOMComment::class);
19		- $this->registerNodeClass('DOMDocument', self::class);
20		- $this->registerNodeClass('DOMDocumentFragment', DOMDocumentFragment::class);
21		- $this->registerNodeClass('DOMDocumentType', DOMDocumentType::class);
22		- $this->registerNodeClass('DOMElement', DOMElement::class);
23		- $this->registerNodeClass('DOMEntity', DOMEntity::class);
24		- $this->registerNodeClass('DOMEntityReference', DOMEntityReference::class);
25		- $this->registerNodeClass('DOMNode', DOMNode::class);
26		- $this->registerNodeClass('DOMNotation', DOMNotation::class);
27		- $this->registerNodeClass('DOMProcessingInstruction', DOMProcessingInstruction::class);
28		- $this->registerNodeClass('DOMText', DOMText::class);
29		- }
	15	+ $this->registerNodeClass('DOMAttr', DOMAttr::class);
	16	+ $this->registerNodeClass('DOMCdataSection', DOMCdataSection::class);
	17	+ $this->registerNodeClass('DOMCharacterData', DOMCharacterData::class);
	18	+ $this->registerNodeClass('DOMComment', DOMComment::class);
	19	+ $this->registerNodeClass('DOMDocument', self::class);
	20	+ $this->registerNodeClass('DOMDocumentFragment', DOMDocumentFragment::class);
	21	+ $this->registerNodeClass('DOMDocumentType', DOMDocumentType::class);
	22	+ $this->registerNodeClass('DOMElement', DOMElement::class);
	23	+ $this->registerNodeClass('DOMEntity', DOMEntity::class);
	24	+ $this->registerNodeClass('DOMEntityReference', DOMEntityReference::class);
	25	+ $this->registerNodeClass('DOMNode', DOMNode::class);
	26	+ $this->registerNodeClass('DOMNotation', DOMNotation::class);
	27	+ $this->registerNodeClass('DOMProcessingInstruction', DOMProcessingInstruction::class);
	28	+ $this->registerNodeClass('DOMText', DOMText::class);
	29	+ }
30	30	}

		@@ -6,5 +6,5 @@
		block discarded – undo
6	6
7	7	class DOMEntity extends \DOMEntity
8	8	{
9		- use NodeTrait;
	9	+ use NodeTrait;
10	10	}

		@@ -12,126 +12,126 @@ discard block
		block discarded – undo
12	12	*/
13	13	class NodeUtility
14	14	{
15		- /**
16		- * Collection of regexps to check the node usability.
17		- *
18		- * @var array
19		- */
20		- public static $regexps = [
21		- 'unlikelyCandidates' => '/-ad-\|banner\|breadcrumbs\|combx\|comment\|community\|cover-wrap\|disqus\|extra\|foot\|header\|legends\|menu\|related\|remark\|replies\|rss\|shoutbox\|sidebar\|skyscraper\|social\|sponsor\|supplemental\|ad-break\|agegate\|pagination\|pager\|popup\|yom-remote/i',
22		- 'okMaybeItsACandidate' => '/and\|article\|body\|column\|main\|shadow/i',
23		- 'extraneous' => '/print\|archive\|comment\|discuss\|e[\-]?mail\|share\|reply\|all\|login\|sign\|single\|utility/i',
24		- 'byline' => '/byline\|author\|dateline\|writtenby\|p-author/i',
25		- 'replaceFonts' => '/<(\/?)font[^>]*>/gi',
26		- 'normalize' => '/\s{2,}/',
27		- 'videos' => '/\/\/(www\.)?((dailymotion\|youtube\|youtube-nocookie\|player\.vimeo\|v\.qq)\.com\|(archive\|upload\.wikimedia)\.org\|player\.twitch\.tv)/i',
28		- 'nextLink' => '/(next\|weiter\|continue\|>([^\\|]\|$)\|»([^\\|]\|$))/i',
29		- 'prevLink' => '/(prev\|earl\|old\|new\|<\|«)/i',
30		- 'whitespace' => '/^\s*$/',
31		- 'hasContent' => '/\S$/',
32		- 'positive' => '/article\|body\|content\|entry\|hentry\|h-entry\|main\|page\|pagination\|post\|text\|blog\|story/i',
33		- 'negative' => '/hidden\|^hid$\| hid$\| hid \|^hid \|banner\|combx\|comment\|com-\|contact\|foot\|footer\|footnote\|masthead\|media\|meta\|outbrain\|promo\|related\|scroll\|share\|shoutbox\|sidebar\|skyscraper\|sponsor\|shopping\|tags\|tool\|widget/i',
34		- // \x{00A0} is the unicode version of
35		- 'onlyWhitespace' => '/\x{00A0}\|\s+/u'
36		- ];
37		-
38		- /**
39		- * Imported from the Element class on league\html-to-markdown.
40		- *
41		- * @param $node
42		- *
43		- * @return DOMElement
44		- */
45		- public static function nextElement($node)
46		- {
47		- $next = $node;
48		- while ($next
49		- && $next->nodeType !== XML_ELEMENT_NODE
50		- && $next->isWhitespace()) {
51		- $next = $next->nextSibling;
52		- }
53		-
54		- return $next;
55		- }
56		-
57		- /**
58		- * Changes the node tag name. Since tagName on DOMElement is a read only value, this must be done creating a new
59		- * element with the new tag name and importing it to the main DOMDocument.
60		- *
61		- * @param DOMNode $node
62		- * @param string $value
63		- * @param bool $importAttributes
64		- *
65		- * @return DOMNode
66		- */
67		- public static function setNodeTag($node, $value, $importAttributes = true)
68		- {
69		- $new = new DOMDocument('1.0', 'utf-8');
70		- $new->appendChild($new->createElement($value));
71		-
72		- $children = $node->childNodes;
73		- /** @var $children \DOMNodeList $i */
74		- for ($i = 0; $i < $children->length; $i++) {
75		- $import = $new->importNode($children->item($i), true);
76		- $new->firstChild->appendChild($import);
77		- }
78		-
79		- if ($importAttributes) {
80		- // Import attributes from the original node.
81		- foreach ($node->attributes as $attribute) {
82		- $new->firstChild->setAttribute($attribute->nodeName, $attribute->nodeValue);
83		- }
84		- }
85		-
86		- // The import must be done on the firstChild of $new, since $new is a DOMDocument and not a DOMElement.
87		- $import = $node->ownerDocument->importNode($new->firstChild, true);
88		- $node->parentNode->replaceChild($import, $node);
89		-
90		- return $import;
91		- }
92		-
93		- /**
94		- * Removes the current node and returns the next node to be parsed (child, sibling or parent).
95		- *
96		- * @param DOMNode $node
97		- *
98		- * @return DOMNode
99		- */
100		- public static function removeAndGetNext($node)
101		- {
102		- $nextNode = self::getNextNode($node, true);
103		- $node->parentNode->removeChild($node);
104		-
105		- return $nextNode;
106		- }
107		-
108		- /**
109		- * Remove the selected node.
110		- *
111		- * @param $node DOMElement
112		- *
113		- * @return void
114		- **/
115		- public static function removeNode($node)
116		- {
117		- $parent = $node->parentNode;
118		- if ($parent) {
119		- $parent->removeChild($node);
120		- }
121		- }
122		-
123		- /**
124		- * Returns the next node. First checks for children (if the flag allows it), then for siblings, and finally
125		- * for parents.
126		- *
127		- * @param DOMNode $originalNode
128		- * @param bool $ignoreSelfAndKids
129		- *
130		- * @return DOMNode
131		- */
132		- public static function getNextNode($originalNode, $ignoreSelfAndKids = false)
133		- {
134		- /*
	15	+ /**
	16	+ * Collection of regexps to check the node usability.
	17	+ *
	18	+ * @var array
	19	+ */
	20	+ public static $regexps = [
	21	+ 'unlikelyCandidates' => '/-ad-\|banner\|breadcrumbs\|combx\|comment\|community\|cover-wrap\|disqus\|extra\|foot\|header\|legends\|menu\|related\|remark\|replies\|rss\|shoutbox\|sidebar\|skyscraper\|social\|sponsor\|supplemental\|ad-break\|agegate\|pagination\|pager\|popup\|yom-remote/i',
	22	+ 'okMaybeItsACandidate' => '/and\|article\|body\|column\|main\|shadow/i',
	23	+ 'extraneous' => '/print\|archive\|comment\|discuss\|e[\-]?mail\|share\|reply\|all\|login\|sign\|single\|utility/i',
	24	+ 'byline' => '/byline\|author\|dateline\|writtenby\|p-author/i',
	25	+ 'replaceFonts' => '/<(\/?)font[^>]*>/gi',
	26	+ 'normalize' => '/\s{2,}/',
	27	+ 'videos' => '/\/\/(www\.)?((dailymotion\|youtube\|youtube-nocookie\|player\.vimeo\|v\.qq)\.com\|(archive\|upload\.wikimedia)\.org\|player\.twitch\.tv)/i',
	28	+ 'nextLink' => '/(next\|weiter\|continue\|>([^\\|]\|$)\|»([^\\|]\|$))/i',
	29	+ 'prevLink' => '/(prev\|earl\|old\|new\|<\|«)/i',
	30	+ 'whitespace' => '/^\s*$/',
	31	+ 'hasContent' => '/\S$/',
	32	+ 'positive' => '/article\|body\|content\|entry\|hentry\|h-entry\|main\|page\|pagination\|post\|text\|blog\|story/i',
	33	+ 'negative' => '/hidden\|^hid$\| hid$\| hid \|^hid \|banner\|combx\|comment\|com-\|contact\|foot\|footer\|footnote\|masthead\|media\|meta\|outbrain\|promo\|related\|scroll\|share\|shoutbox\|sidebar\|skyscraper\|sponsor\|shopping\|tags\|tool\|widget/i',
	34	+ // \x{00A0} is the unicode version of
	35	+ 'onlyWhitespace' => '/\x{00A0}\|\s+/u'
	36	+ ];
	37	+
	38	+ /**
	39	+ * Imported from the Element class on league\html-to-markdown.
	40	+ *
	41	+ * @param $node
	42	+ *
	43	+ * @return DOMElement
	44	+ */
	45	+ public static function nextElement($node)
	46	+ {
	47	+ $next = $node;
	48	+ while ($next
	49	+ && $next->nodeType !== XML_ELEMENT_NODE
	50	+ && $next->isWhitespace()) {
	51	+ $next = $next->nextSibling;
	52	+ }
	53	+
	54	+ return $next;
	55	+ }
	56	+
	57	+ /**
	58	+ * Changes the node tag name. Since tagName on DOMElement is a read only value, this must be done creating a new
	59	+ * element with the new tag name and importing it to the main DOMDocument.
	60	+ *
	61	+ * @param DOMNode $node
	62	+ * @param string $value
	63	+ * @param bool $importAttributes
	64	+ *
	65	+ * @return DOMNode
	66	+ */
	67	+ public static function setNodeTag($node, $value, $importAttributes = true)
	68	+ {
	69	+ $new = new DOMDocument('1.0', 'utf-8');
	70	+ $new->appendChild($new->createElement($value));
	71	+
	72	+ $children = $node->childNodes;
	73	+ /** @var $children \DOMNodeList $i */
	74	+ for ($i = 0; $i < $children->length; $i++) {
	75	+ $import = $new->importNode($children->item($i), true);
	76	+ $new->firstChild->appendChild($import);
	77	+ }
	78	+
	79	+ if ($importAttributes) {
	80	+ // Import attributes from the original node.
	81	+ foreach ($node->attributes as $attribute) {
	82	+ $new->firstChild->setAttribute($attribute->nodeName, $attribute->nodeValue);
	83	+ }
	84	+ }
	85	+
	86	+ // The import must be done on the firstChild of $new, since $new is a DOMDocument and not a DOMElement.
	87	+ $import = $node->ownerDocument->importNode($new->firstChild, true);
	88	+ $node->parentNode->replaceChild($import, $node);
	89	+
	90	+ return $import;
	91	+ }
	92	+
	93	+ /**
	94	+ * Removes the current node and returns the next node to be parsed (child, sibling or parent).
	95	+ *
	96	+ * @param DOMNode $node
	97	+ *
	98	+ * @return DOMNode
	99	+ */
	100	+ public static function removeAndGetNext($node)
	101	+ {
	102	+ $nextNode = self::getNextNode($node, true);
	103	+ $node->parentNode->removeChild($node);
	104	+
	105	+ return $nextNode;
	106	+ }
	107	+
	108	+ /**
	109	+ * Remove the selected node.
	110	+ *
	111	+ * @param $node DOMElement
	112	+ *
	113	+ * @return void
	114	+ **/
	115	+ public static function removeNode($node)
	116	+ {
	117	+ $parent = $node->parentNode;
	118	+ if ($parent) {
	119	+ $parent->removeChild($node);
	120	+ }
	121	+ }
	122	+
	123	+ /**
	124	+ * Returns the next node. First checks for children (if the flag allows it), then for siblings, and finally
	125	+ * for parents.
	126	+ *
	127	+ * @param DOMNode $originalNode
	128	+ * @param bool $ignoreSelfAndKids
	129	+ *
	130	+ * @return DOMNode
	131	+ */
	132	+ public static function getNextNode($originalNode, $ignoreSelfAndKids = false)
	133	+ {
	134	+ /*
135	135	* Traverse the DOM from node to node, starting at the node passed in.
136	136	* Pass true for the second parameter to indicate this node itself
137	137	* (and its kids) are going away, and we want the next node over.
		@@ -139,42 +139,42 @@ discard block
		block discarded – undo
139	139	* Calling this in a loop will traverse the DOM depth-first.
140	140	*/
141	141
142		- // First check for kids if those aren't being ignored
143		- if (!$ignoreSelfAndKids && $originalNode->firstChild) {
144		- return $originalNode->firstChild;
145		- }
146		-
147		- // Then for siblings...
148		- if ($originalNode->nextSibling) {
149		- return $originalNode->nextSibling;
150		- }
151		-
152		- // And finally, move up the parent chain and find a sibling
153		- // (because this is depth-first traversal, we will have already
154		- // seen the parent nodes themselves).
155		- do {
156		- $originalNode = $originalNode->parentNode;
157		- } while ($originalNode && !$originalNode->nextSibling);
158		-
159		- return ($originalNode) ? $originalNode->nextSibling : $originalNode;
160		- }
161		-
162		- /**
163		- * Remove all empty DOMNodes from DOMNodeLists.
164		- *
165		- * @param \DOMNodeList $list
166		- *
167		- * @return DOMNodeList
168		- */
169		- public static function filterTextNodes(\DOMNodeList $list)
170		- {
171		- $newList = new DOMNodeList();
172		- foreach ($list as $node) {
173		- if ($node->nodeType !== XML_TEXT_NODE \|\| mb_strlen(trim($node->nodeValue))) {
174		- $newList->add($node);
175		- }
176		- }
177		-
178		- return $newList;
179		- }
	142	+ // First check for kids if those aren't being ignored
	143	+ if (!$ignoreSelfAndKids && $originalNode->firstChild) {
	144	+ return $originalNode->firstChild;
	145	+ }
	146	+
	147	+ // Then for siblings...
	148	+ if ($originalNode->nextSibling) {
	149	+ return $originalNode->nextSibling;
	150	+ }
	151	+
	152	+ // And finally, move up the parent chain and find a sibling
	153	+ // (because this is depth-first traversal, we will have already
	154	+ // seen the parent nodes themselves).
	155	+ do {
	156	+ $originalNode = $originalNode->parentNode;
	157	+ } while ($originalNode && !$originalNode->nextSibling);
	158	+
	159	+ return ($originalNode) ? $originalNode->nextSibling : $originalNode;
	160	+ }
	161	+
	162	+ /**
	163	+ * Remove all empty DOMNodes from DOMNodeLists.
	164	+ *
	165	+ * @param \DOMNodeList $list
	166	+ *
	167	+ * @return DOMNodeList
	168	+ */
	169	+ public static function filterTextNodes(\DOMNodeList $list)
	170	+ {
	171	+ $newList = new DOMNodeList();
	172	+ foreach ($list as $node) {
	173	+ if ($node->nodeType !== XML_TEXT_NODE \|\| mb_strlen(trim($node->nodeValue))) {
	174	+ $newList->add($node);
	175	+ }
	176	+ }
	177	+
	178	+ return $newList;
	179	+ }
180	180	}

codysnider / tt-rss

Push — master ( 5a5c41...fade3b )

Status

Category

Indentation +1 added lines, -1 removed lines patch added patch discarded remove patch

Indentation +1 added lines, -1 removed lines patch added patch discarded remove patch

Indentation +1 added lines, -1 removed lines patch added patch discarded remove patch

Indentation +1 added lines, -1 removed lines patch added patch discarded remove patch

Indentation +58 added lines, -58 removed lines patch added patch discarded remove patch

Indentation +19 added lines, -19 removed lines patch added patch discarded remove patch

Indentation +1 added lines, -1 removed lines patch added patch discarded remove patch

Indentation +158 added lines, -158 removed lines patch added patch discarded remove patch

Indentation +553 added lines, -553 removed lines patch added patch discarded remove patch