@@ -535,10 +535,10 @@ |
||
| 535 | 535 | '/(?<start>.*)<(?<element_start>[a-z]+)(?<element_start_addon> [^>]*)?>(?<value>.*?)<\/(?<element_end>\2)>(?<end>.*)/sui', |
| 536 | 536 | static function ($matches) { |
| 537 | 537 | return $matches['start'] . |
| 538 | - '°lt_simple_html_dom__voku_°' . $matches['element_start'] . $matches['element_start_addon'] . '°gt_simple_html_dom__voku_°' . |
|
| 539 | - $matches['value'] . |
|
| 540 | - '°lt/_simple_html_dom__voku_°' . $matches['element_end'] . '°gt_simple_html_dom__voku_°' . |
|
| 541 | - $matches['end']; |
|
| 538 | + '°lt_simple_html_dom__voku_°' . $matches['element_start'] . $matches['element_start_addon'] . '°gt_simple_html_dom__voku_°' . |
|
| 539 | + $matches['value'] . |
|
| 540 | + '°lt/_simple_html_dom__voku_°' . $matches['element_end'] . '°gt_simple_html_dom__voku_°' . |
|
| 541 | + $matches['end']; |
|
| 542 | 542 | }, |
| 543 | 543 | $html |
| 544 | 544 | ); |
@@ -146,7 +146,7 @@ discard block |
||
| 146 | 146 | return \call_user_func_array([$this, self::$functionAliases[$name]], $arguments); |
| 147 | 147 | } |
| 148 | 148 | |
| 149 | - throw new \BadMethodCallException('Method does not exist: ' . $name); |
|
| 149 | + throw new \BadMethodCallException('Method does not exist: '.$name); |
|
| 150 | 150 | } |
| 151 | 151 | |
| 152 | 152 | /** |
@@ -336,7 +336,7 @@ discard block |
||
| 336 | 336 | || |
| 337 | 337 | $this->keepBrokenHtml |
| 338 | 338 | ) { |
| 339 | - $html = '<' . self::$domHtmlWrapperHelper . '>' . $html . '</' . self::$domHtmlWrapperHelper . '>'; |
|
| 339 | + $html = '<'.self::$domHtmlWrapperHelper.'>'.$html.'</'.self::$domHtmlWrapperHelper.'>'; |
|
| 340 | 340 | } |
| 341 | 341 | |
| 342 | 342 | $html = self::replaceToPreserveHtmlEntities($html); |
@@ -358,7 +358,7 @@ discard block |
||
| 358 | 358 | /** @noinspection StringFragmentMisplacedInspection */ |
| 359 | 359 | if (\stripos('<?xml', $html) !== 0) { |
| 360 | 360 | $xmlHackUsed = true; |
| 361 | - $html = '<?xml encoding="' . $this->getEncoding() . '" ?>' . $html; |
|
| 361 | + $html = '<?xml encoding="'.$this->getEncoding().'" ?>'.$html; |
|
| 362 | 362 | } |
| 363 | 363 | |
| 364 | 364 | $this->document->loadHTML($html, $optionsXml); |
@@ -891,11 +891,11 @@ discard block |
||
| 891 | 891 | |
| 892 | 892 | $html = (string) \preg_replace_callback( |
| 893 | 893 | '/(?<start>.*)<(?<element_start>[a-z]+)(?<element_start_addon> [^>]*)?>(?<value>.*?)<\/(?<element_end>\2)>(?<end>.*)/sui', |
| 894 | - static function ($matches) { |
|
| 895 | - return $matches['start'] . |
|
| 896 | - '°lt_simple_html_dom__voku_°' . $matches['element_start'] . $matches['element_start_addon'] . '°gt_simple_html_dom__voku_°' . |
|
| 897 | - $matches['value'] . |
|
| 898 | - '°lt/_simple_html_dom__voku_°' . $matches['element_end'] . '°gt_simple_html_dom__voku_°' . |
|
| 894 | + static function($matches) { |
|
| 895 | + return $matches['start']. |
|
| 896 | + '°lt_simple_html_dom__voku_°'.$matches['element_start'].$matches['element_start_addon'].'°gt_simple_html_dom__voku_°'. |
|
| 897 | + $matches['value']. |
|
| 898 | + '°lt/_simple_html_dom__voku_°'.$matches['element_end'].'°gt_simple_html_dom__voku_°'. |
|
| 899 | 899 | $matches['end']; |
| 900 | 900 | }, |
| 901 | 901 | $html |
@@ -907,7 +907,7 @@ discard block |
||
| 907 | 907 | |
| 908 | 908 | $html = (string) \preg_replace_callback( |
| 909 | 909 | '/(?<start>[^<]*)?(?<broken>(?:(?:<\/\w+(?:\s+\w+=\\"[^\"]+\\")*+)(?:[^<]+)>)+)(?<end>.*)/u', |
| 910 | - static function ($matches) { |
|
| 910 | + static function($matches) { |
|
| 911 | 911 | $matches['broken'] = \str_replace( |
| 912 | 912 | ['°lt/_simple_html_dom__voku_°', '°lt_simple_html_dom__voku_°', '°gt_simple_html_dom__voku_°'], |
| 913 | 913 | ['</', '<', '>'], |
@@ -915,9 +915,9 @@ discard block |
||
| 915 | 915 | ); |
| 916 | 916 | |
| 917 | 917 | self::$domBrokenReplaceHelper['orig'][] = $matches['broken']; |
| 918 | - self::$domBrokenReplaceHelper['tmp'][] = $matchesHash = self::$domHtmlBrokenHtmlHelper . \crc32($matches['broken']); |
|
| 918 | + self::$domBrokenReplaceHelper['tmp'][] = $matchesHash = self::$domHtmlBrokenHtmlHelper.\crc32($matches['broken']); |
|
| 919 | 919 | |
| 920 | - return $matches['start'] . $matchesHash . $matches['end']; |
|
| 920 | + return $matches['start'].$matchesHash.$matches['end']; |
|
| 921 | 921 | }, |
| 922 | 922 | $html |
| 923 | 923 | ); |
@@ -940,7 +940,7 @@ discard block |
||
| 940 | 940 | // regEx for e.g.: [<script id="elements-image-1" type="text/html">...</script>] |
| 941 | 941 | $html = (string) \preg_replace_callback( |
| 942 | 942 | '/(?<start>((?:<script) [^>]*type=(?:["\'])?(?:text\/html|text\/x-custom-template|text\/x-handlebars-template)+(?:[^>]*)>))(?<innerContent>.*)(?<end><\/script>)/isU', |
| 943 | - function ($matches) { |
|
| 943 | + function($matches) { |
|
| 944 | 944 | |
| 945 | 945 | // Check for logic in special script tags, like [<% _.each(tierPrices, function(item, key) { %>], |
| 946 | 946 | // because often this looks like non valid html in the template itself. |
@@ -950,18 +950,18 @@ discard block |
||
| 950 | 950 | $matches['innerContent'] = \str_replace('<\/', '</', $matches['innerContent']); |
| 951 | 951 | |
| 952 | 952 | self::$domBrokenReplaceHelper['orig'][] = $matches['innerContent']; |
| 953 | - self::$domBrokenReplaceHelper['tmp'][] = $matchesHash = '' . self::$domHtmlBrokenHtmlHelper . '' . \crc32($matches['innerContent']); |
|
| 953 | + self::$domBrokenReplaceHelper['tmp'][] = $matchesHash = ''.self::$domHtmlBrokenHtmlHelper.''.\crc32($matches['innerContent']); |
|
| 954 | 954 | |
| 955 | - return $matches['start'] . $matchesHash . $matches['end']; |
|
| 955 | + return $matches['start'].$matchesHash.$matches['end']; |
|
| 956 | 956 | } |
| 957 | 957 | } |
| 958 | 958 | |
| 959 | 959 | // remove the html5 fallback |
| 960 | 960 | $matches[0] = \str_replace('<\/', '</', $matches[0]); |
| 961 | 961 | |
| 962 | - $specialNonScript = '<' . self::$domHtmlSpecialScriptHelper . \substr($matches[0], \strlen('<script')); |
|
| 962 | + $specialNonScript = '<'.self::$domHtmlSpecialScriptHelper.\substr($matches[0], \strlen('<script')); |
|
| 963 | 963 | |
| 964 | - return \substr($specialNonScript, 0, -\strlen('</script>')) . '</' . self::$domHtmlSpecialScriptHelper . '>'; |
|
| 964 | + return \substr($specialNonScript, 0, -\strlen('</script>')).'</'.self::$domHtmlSpecialScriptHelper.'>'; |
|
| 965 | 965 | }, |
| 966 | 966 | $html |
| 967 | 967 | ); |
@@ -417,8 +417,8 @@ discard block |
||
| 417 | 417 | $tmpStr = $this->normalizeStringForComparision($string); |
| 418 | 418 | if ($tmpDomString !== $tmpStr) { |
| 419 | 419 | throw new \RuntimeException( |
| 420 | - 'Not valid HTML fragment!' . "\n" . |
|
| 421 | - $tmpDomString . "\n" . |
|
| 420 | + 'Not valid HTML fragment!'."\n". |
|
| 421 | + $tmpDomString."\n". |
|
| 422 | 422 | $tmpStr |
| 423 | 423 | ); |
| 424 | 424 | } |
@@ -490,8 +490,8 @@ discard block |
||
| 490 | 490 | $tmpStr = $this->normalizeStringForComparision($string); |
| 491 | 491 | if ($tmpDomOuterTextString !== $tmpStr) { |
| 492 | 492 | throw new \RuntimeException( |
| 493 | - 'Not valid HTML fragment!' . "\n" |
|
| 494 | - . $tmpDomOuterTextString . "\n" . |
|
| 493 | + 'Not valid HTML fragment!'."\n" |
|
| 494 | + . $tmpDomOuterTextString."\n". |
|
| 495 | 495 | $tmpStr |
| 496 | 496 | ); |
| 497 | 497 | } |
@@ -444,7 +444,7 @@ discard block |
||
| 444 | 444 | /** |
| 445 | 445 | * Returns the first child of node. |
| 446 | 446 | * |
| 447 | - * @return SimpleHtmlDomInterface|null |
|
| 447 | + * @return null|SimpleHtmlDom |
|
| 448 | 448 | */ |
| 449 | 449 | public function firstChild() |
| 450 | 450 | { |
@@ -590,7 +590,7 @@ discard block |
||
| 590 | 590 | /** |
| 591 | 591 | * Returns the last child of node. |
| 592 | 592 | * |
| 593 | - * @return SimpleHtmlDomInterface|null |
|
| 593 | + * @return null|SimpleHtmlDom |
|
| 594 | 594 | */ |
| 595 | 595 | public function lastChild() |
| 596 | 596 | { |
@@ -607,7 +607,7 @@ discard block |
||
| 607 | 607 | /** |
| 608 | 608 | * Returns the next sibling of node. |
| 609 | 609 | * |
| 610 | - * @return SimpleHtmlDomInterface|null |
|
| 610 | + * @return null|SimpleHtmlDom |
|
| 611 | 611 | */ |
| 612 | 612 | public function nextSibling() |
| 613 | 613 | { |
@@ -624,7 +624,7 @@ discard block |
||
| 624 | 624 | /** |
| 625 | 625 | * Returns the next non-whitespace sibling of node. |
| 626 | 626 | * |
| 627 | - * @return SimpleHtmlDomInterface|null |
|
| 627 | + * @return null|SimpleHtmlDom |
|
| 628 | 628 | */ |
| 629 | 629 | public function nextNonWhitespaceSibling() |
| 630 | 630 | { |
@@ -656,7 +656,7 @@ discard block |
||
| 656 | 656 | /** |
| 657 | 657 | * Returns the previous sibling of node. |
| 658 | 658 | * |
| 659 | - * @return SimpleHtmlDomInterface|null |
|
| 659 | + * @return null|SimpleHtmlDom |
|
| 660 | 660 | */ |
| 661 | 661 | public function previousSibling() |
| 662 | 662 | { |
@@ -417,8 +417,8 @@ discard block |
||
| 417 | 417 | $tmpStr = $this->normalizeStringForComparision($string); |
| 418 | 418 | if ($tmpDomString !== $tmpStr) { |
| 419 | 419 | throw new \RuntimeException( |
| 420 | - 'Not valid HTML fragment!' . "\n" . |
|
| 421 | - $tmpDomString . "\n" . |
|
| 420 | + 'Not valid HTML fragment!'."\n". |
|
| 421 | + $tmpDomString."\n". |
|
| 422 | 422 | $tmpStr |
| 423 | 423 | ); |
| 424 | 424 | } |
@@ -490,8 +490,8 @@ discard block |
||
| 490 | 490 | $tmpStr = $this->normalizeStringForComparision($string); |
| 491 | 491 | if ($tmpDomOuterTextString !== $tmpStr) { |
| 492 | 492 | throw new \RuntimeException( |
| 493 | - 'Not valid HTML fragment!' . "\n" |
|
| 494 | - . $tmpDomOuterTextString . "\n" . |
|
| 493 | + 'Not valid HTML fragment!'."\n" |
|
| 494 | + . $tmpDomOuterTextString."\n". |
|
| 495 | 495 | $tmpStr |
| 496 | 496 | ); |
| 497 | 497 | } |
@@ -418,7 +418,7 @@ discard block |
||
| 418 | 418 | /** |
| 419 | 419 | * Returns the first child of node. |
| 420 | 420 | * |
| 421 | - * @return SimpleXmlDomInterface|null |
|
| 421 | + * @return null|SimpleXmlDom |
|
| 422 | 422 | */ |
| 423 | 423 | public function firstChild() |
| 424 | 424 | { |
@@ -576,7 +576,7 @@ discard block |
||
| 576 | 576 | /** |
| 577 | 577 | * Returns the last child of node. |
| 578 | 578 | * |
| 579 | - * @return SimpleXmlDomInterface|null |
|
| 579 | + * @return null|SimpleXmlDom |
|
| 580 | 580 | */ |
| 581 | 581 | public function lastChild() |
| 582 | 582 | { |
@@ -593,7 +593,7 @@ discard block |
||
| 593 | 593 | /** |
| 594 | 594 | * Returns the next sibling of node. |
| 595 | 595 | * |
| 596 | - * @return SimpleXmlDomInterface|null |
|
| 596 | + * @return null|SimpleXmlDom |
|
| 597 | 597 | */ |
| 598 | 598 | public function nextSibling() |
| 599 | 599 | { |
@@ -610,7 +610,7 @@ discard block |
||
| 610 | 610 | /** |
| 611 | 611 | * Returns the next non-whitespace sibling of node. |
| 612 | 612 | * |
| 613 | - * @return SimpleXmlDomInterface|null |
|
| 613 | + * @return null|SimpleXmlDom |
|
| 614 | 614 | */ |
| 615 | 615 | public function nextNonWhitespaceSibling() |
| 616 | 616 | { |
@@ -642,7 +642,7 @@ discard block |
||
| 642 | 642 | /** |
| 643 | 643 | * Returns the previous sibling of node. |
| 644 | 644 | * |
| 645 | - * @return SimpleXmlDomInterface|null |
|
| 645 | + * @return null|SimpleXmlDom |
|
| 646 | 646 | */ |
| 647 | 647 | public function previousSibling() |
| 648 | 648 | { |
@@ -151,7 +151,7 @@ |
||
| 151 | 151 | /** @noinspection StringFragmentMisplacedInspection */ |
| 152 | 152 | if (\stripos('<?xml', $xml) !== 0) { |
| 153 | 153 | $xmlHackUsed = true; |
| 154 | - $xml = '<?xml encoding="' . $this->getEncoding() . '" ?>' . $xml; |
|
| 154 | + $xml = '<?xml encoding="'.$this->getEncoding().'" ?>'.$xml; |
|
| 155 | 155 | } |
| 156 | 156 | |
| 157 | 157 | $this->document->loadXML($xml, $optionsXml); |
@@ -83,7 +83,7 @@ discard block |
||
| 83 | 83 | return \call_user_func_array([$this, self::$functionAliases[$name]], $arguments); |
| 84 | 84 | } |
| 85 | 85 | |
| 86 | - throw new \BadMethodCallException('Method does not exist: ' . $name); |
|
| 86 | + throw new \BadMethodCallException('Method does not exist: '.$name); |
|
| 87 | 87 | } |
| 88 | 88 | |
| 89 | 89 | /** |
@@ -389,12 +389,12 @@ discard block |
||
| 389 | 389 | $regExSpecialScript = '/<(script)(?<attr>[^>]*)>(?<content>.*)<\/\1>/isU'; |
| 390 | 390 | $htmlTmp = \preg_replace_callback( |
| 391 | 391 | $regExSpecialScript, |
| 392 | - static function ($scripts) { |
|
| 392 | + static function($scripts) { |
|
| 393 | 393 | if (empty($scripts['content'])) { |
| 394 | 394 | return $scripts[0]; |
| 395 | 395 | } |
| 396 | 396 | |
| 397 | - return '<script' . $scripts['attr'] . '>' . \str_replace('</', '<\/', $scripts['content']) . '</script>'; |
|
| 397 | + return '<script'.$scripts['attr'].'>'.\str_replace('</', '<\/', $scripts['content']).'</script>'; |
|
| 398 | 398 | }, |
| 399 | 399 | $html |
| 400 | 400 | ); |
@@ -423,14 +423,14 @@ discard block |
||
| 423 | 423 | self::$domReplaceHelper['orig'] |
| 424 | 424 | ); |
| 425 | 425 | |
| 426 | - $DOM_REPLACE__HELPER_CACHE['tmp']['html_wrapper__start'] = '<' . self::$domHtmlWrapperHelper . '>'; |
|
| 427 | - $DOM_REPLACE__HELPER_CACHE['tmp']['html_wrapper__end'] = '</' . self::$domHtmlWrapperHelper . '>'; |
|
| 426 | + $DOM_REPLACE__HELPER_CACHE['tmp']['html_wrapper__start'] = '<'.self::$domHtmlWrapperHelper.'>'; |
|
| 427 | + $DOM_REPLACE__HELPER_CACHE['tmp']['html_wrapper__end'] = '</'.self::$domHtmlWrapperHelper.'>'; |
|
| 428 | 428 | |
| 429 | 429 | $DOM_REPLACE__HELPER_CACHE['orig']['html_wrapper__start'] = ''; |
| 430 | 430 | $DOM_REPLACE__HELPER_CACHE['orig']['html_wrapper__end'] = ''; |
| 431 | 431 | |
| 432 | - $DOM_REPLACE__HELPER_CACHE['tmp']['html_special_script__start'] = '<' . self::$domHtmlSpecialScriptHelper; |
|
| 433 | - $DOM_REPLACE__HELPER_CACHE['tmp']['html_special_script__end'] = '</' . self::$domHtmlSpecialScriptHelper . '>'; |
|
| 432 | + $DOM_REPLACE__HELPER_CACHE['tmp']['html_special_script__start'] = '<'.self::$domHtmlSpecialScriptHelper; |
|
| 433 | + $DOM_REPLACE__HELPER_CACHE['tmp']['html_special_script__end'] = '</'.self::$domHtmlSpecialScriptHelper.'>'; |
|
| 434 | 434 | |
| 435 | 435 | $DOM_REPLACE__HELPER_CACHE['orig']['html_special_script__start'] = '<script'; |
| 436 | 436 | $DOM_REPLACE__HELPER_CACHE['orig']['html_special_script__end'] = '</script>'; |
@@ -65,7 +65,7 @@ |
||
| 65 | 65 | return (string) $this; |
| 66 | 66 | } |
| 67 | 67 | |
| 68 | - throw new \InvalidArgumentException('Undefined property: $' . $name); |
|
| 68 | + throw new \InvalidArgumentException('Undefined property: $'.$name); |
|
| 69 | 69 | } |
| 70 | 70 | |
| 71 | 71 | /** |
@@ -41,5 +41,5 @@ |
||
| 41 | 41 | $document = new \voku\helper\HtmlDomParser($html); |
| 42 | 42 | |
| 43 | 43 | foreach (find_contains($document, '.lall', 'foo') as $child_dom) { |
| 44 | - echo $child_dom->html() . "\n"; |
|
| 44 | + echo $child_dom->html()."\n"; |
|
| 45 | 45 | } |
@@ -24,5 +24,5 @@ |
||
| 24 | 24 | $data = scraping_imdb('http://imdb.com/title/tt0335266/'); |
| 25 | 25 | |
| 26 | 26 | foreach ($data as $k => $v) { |
| 27 | - echo '<strong>' . $k . ' </strong>' . $v . '<br>'; |
|
| 27 | + echo '<strong>'.$k.' </strong>'.$v.'<br>'; |
|
| 28 | 28 | } |
@@ -34,6 +34,6 @@ |
||
| 34 | 34 | |
| 35 | 35 | foreach ($data as $v) { |
| 36 | 36 | foreach ($v as $k_inner => $v_inner) { |
| 37 | - echo '<strong>' . $k_inner . ':</strong> ' . $v_inner . '<br><br>'; |
|
| 37 | + echo '<strong>'.$k_inner.':</strong> '.$v_inner.'<br><br>'; |
|
| 38 | 38 | } |
| 39 | 39 | } |