Complex classes like TemplateInspector often do a lot of different things. To break such a class down, we need to identify a cohesive component within that class. A common approach to finding such a component is to look for fields/methods that share the same prefixes or suffixes. You can also have a look at the cohesion graph to spot any unconnected or weakly connected components.
Once you have determined the fields that belong together, you can apply the Extract Class refactoring. If the component makes sense as a subclass, Extract Subclass is also a candidate and is often faster.
While breaking up the class, it is a good idea to analyze how other classes use TemplateInspector and, based on these observations, to apply Extract Interface as well.
| 1 | <?php |
||
| 32 | class TemplateInspector |
||
| 33 | { |
||
| 34 | /** |
||
| 35 | * XSL namespace |
||
| 36 | */ |
||
| 37 | const XMLNS_XSL = 'http://www.w3.org/1999/XSL/Transform'; |
||
| 38 | |||
| 39 | /** |
||
| 40 | * @var string[] allowChild bitfield for each branch |
||
| 41 | */ |
||
| 42 | protected $allowChildBitfields = []; |
||
| 43 | |||
| 44 | /** |
||
| 45 | * @var bool Whether elements are allowed as children |
||
| 46 | */ |
||
| 47 | protected $allowsChildElements; |
||
| 48 | |||
| 49 | /** |
||
| 50 | * @var bool Whether text nodes are allowed as children |
||
| 51 | */ |
||
| 52 | protected $allowsText; |
||
| 53 | |||
| 54 | /** |
||
| 55 | * @var array[] Array of array of DOMElement instances |
||
| 56 | */ |
||
| 57 | protected $branches; |
||
| 58 | |||
| 59 | /** |
||
| 60 | * @var string OR-ed bitfield representing all of the categories used by this template |
||
| 61 | */ |
||
| 62 | protected $contentBitfield = "\0"; |
||
| 63 | |||
| 64 | /** |
||
| 65 | * @var string denyDescendant bitfield |
||
| 66 | */ |
||
| 67 | protected $denyDescendantBitfield = "\0"; |
||
| 68 | |||
| 69 | /** |
||
| 70 | * @var DOMDocument Document containing the template |
||
| 71 | */ |
||
| 72 | protected $dom; |
||
| 73 | |||
| 74 | /** |
||
| 75 | * @var bool Whether this template contains any HTML elements |
||
| 76 | */ |
||
| 77 | protected $hasElements = false; |
||
| 78 | |||
| 79 | /** |
||
| 80 | * @var bool Whether this template renders non-whitespace text nodes at its root |
||
| 81 | */ |
||
| 82 | protected $hasRootText; |
||
| 83 | |||
| 84 | /** |
||
| 85 | * @var bool Whether this template should be considered a block-level element |
||
| 86 | */ |
||
| 87 | protected $isBlock = false; |
||
| 88 | |||
| 89 | /** |
||
| 90 | * @var bool Whether the template uses the "empty" content model |
||
| 91 | */ |
||
| 92 | protected $isEmpty; |
||
| 93 | |||
| 94 | /** |
||
| 95 | * @var bool Whether this template adds to the list of active formatting elements |
||
| 96 | */ |
||
| 97 | protected $isFormattingElement; |
||
| 98 | |||
| 99 | /** |
||
| 100 | * @var bool Whether this template lets content through via an xsl:apply-templates element |
||
| 101 | */ |
||
| 102 | protected $isPassthrough = false; |
||
| 103 | |||
| 104 | /** |
||
| 105 | * @var bool Whether all branches use the transparent content model |
||
| 106 | */ |
||
| 107 | protected $isTransparent = false; |
||
| 108 | |||
| 109 | /** |
||
| 110 | * @var bool Whether all branches have an ancestor that is a void element |
||
| 111 | */ |
||
| 112 | protected $isVoid; |
||
| 113 | |||
| 114 | /** |
||
| 115 | * @var array Names of every last HTML element that precedes an <xsl:apply-templates/> node |
||
| 116 | */ |
||
| 117 | protected $leafNodes = []; |
||
| 118 | |||
| 119 | /** |
||
| 120 | * @var bool Whether any branch has an element that preserves new lines by default (e.g. <pre>) |
||
| 121 | */ |
||
| 122 | protected $preservesNewLines = false; |
||
| 123 | |||
| 124 | /** |
||
| 125 | * @var array Bitfield of the first HTML element of every branch |
||
| 126 | */ |
||
| 127 | protected $rootBitfields = []; |
||
| 128 | |||
| 129 | /** |
||
| 130 | * @var array Names of every HTML element that has no HTML parent |
||
| 131 | */ |
||
| 132 | protected $rootNodes = []; |
||
| 133 | |||
| 134 | /** |
||
| 135 | * @var DOMXPath XPath engine associated with $this->dom |
||
| 136 | */ |
||
| 137 | protected $xpath; |
||
| 138 | |||
| 139 | /** |
||
| 140 | * Constructor |
||
| 141 | * |
||
| 142 | * @param string $template Template content |
||
| 143 | */ |
||
| 144 | public function __construct($template) |
||
| 145 | { |
||
| 146 | $this->dom = TemplateHelper::loadTemplate($template); |
||
| 147 | $this->xpath = new DOMXPath($this->dom); |
||
| 148 | |||
| 149 | $this->analyseRootNodes(); |
||
| 150 | $this->analyseBranches(); |
||
| 151 | $this->analyseContent(); |
||
| 152 | } |
||
| 153 | |||
| 154 | /** |
||
| 155 | * Return whether this template allows a given child |
||
| 156 | * |
||
| 157 | * @param TemplateInspector $child |
||
| 158 | * @return bool |
||
| 159 | */ |
||
| 160 | public function allowsChild(TemplateInspector $child) |
||
| 161 | { |
||
| 162 | // Sometimes, a template can technically be allowed as a child but denied as a descendant |
||
| 163 | if (!$this->allowsDescendant($child)) |
||
| 164 | { |
||
| 165 | return false; |
||
| 166 | } |
||
| 167 | |||
| 168 | foreach ($child->rootBitfields as $rootBitfield) |
||
| 169 | { |
||
| 170 | foreach ($this->allowChildBitfields as $allowChildBitfield) |
||
| 171 | { |
||
| 172 | if (!self::match($rootBitfield, $allowChildBitfield)) |
||
| 173 | { |
||
| 174 | return false; |
||
| 175 | } |
||
| 176 | } |
||
| 177 | } |
||
| 178 | |||
| 179 | return ($this->allowsText || !$child->hasRootText); |
||
| 180 | } |
||
| 181 | |||
| 182 | /** |
||
| 183 | * Return whether this template allows a given descendant |
||
| 184 | * |
||
| 185 | * @param TemplateInspector $descendant |
||
| 186 | * @return bool |
||
| 187 | */ |
||
| 188 | public function allowsDescendant(TemplateInspector $descendant) |
||
| 189 | { |
||
| 190 | // Test whether the descendant is explicitly disallowed |
||
| 191 | if (self::match($descendant->contentBitfield, $this->denyDescendantBitfield)) |
||
| 192 | { |
||
| 193 | return false; |
||
| 194 | } |
||
| 195 | |||
| 196 | // Test whether the descendant contains any elements and we disallow elements |
||
| 197 | return ($this->allowsChildElements || !$descendant->hasElements); |
||
| 198 | } |
||
| 199 | |||
| 200 | /** |
||
| 201 | * Return whether this template allows elements as children |
||
| 202 | * |
||
| 203 | * @return bool |
||
| 204 | */ |
||
| 205 | public function allowsChildElements() |
||
| 209 | |||
| 210 | /** |
||
| 211 | * Return whether this template allows text nodes as children |
||
| 212 | * |
||
| 213 | * @return bool |
||
| 214 | */ |
||
| 215 | public function allowsText() |
||
| 219 | |||
| 220 | /** |
||
| 221 | * Return whether this template automatically closes given parent template |
||
| 222 | * |
||
| 223 | * @param TemplateInspector $parent |
||
| 224 | * @return bool |
||
| 225 | */ |
||
| 226 | public function closesParent(TemplateInspector $parent) |
||
| 248 | |||
| 249 | /** |
||
| 250 | * Evaluate an XPath expression |
||
| 251 | * |
||
| 252 | * @param string $expr XPath expression |
||
| 253 | * @param DOMElement $node Context node |
||
| 254 | * @return mixed |
||
| 255 | */ |
||
| 256 | public function evaluate($expr, DOMElement $node = null) |
||
| 257 | { |
||
| 258 | return $this->xpath->evaluate($expr, $node); |
||
| 259 | } |
||
| 260 | |||
| 261 | /** |
||
| 262 | * Return whether this template should be considered a block-level element |
||
| 263 | * |
||
| 264 | * @return bool |
||
| 265 | */ |
||
| 266 | public function isBlock() |
||
| 270 | |||
| 271 | /** |
||
| 272 | * Return whether this template adds to the list of active formatting elements |
||
| 273 | * |
||
| 274 | * @return bool |
||
| 275 | */ |
||
| 276 | public function isFormattingElement() |
||
| 280 | |||
| 281 | /** |
||
| 282 | * Return whether this template uses the "empty" content model |
||
| 283 | * |
||
| 284 | * @return bool |
||
| 285 | */ |
||
| 286 | public function isEmpty() |
||
| 290 | |||
| 291 | /** |
||
| 292 | * Return whether this template lets content through via an xsl:apply-templates element |
||
| 293 | * |
||
| 294 | * @return bool |
||
| 295 | */ |
||
| 296 | public function isPassthrough() |
||
| 300 | |||
| 301 | /** |
||
| 302 | * Return whether this template uses the "transparent" content model |
||
| 303 | * |
||
| 304 | * @return bool |
||
| 305 | */ |
||
| 306 | public function isTransparent() |
||
| 310 | |||
| 311 | /** |
||
| 312 | * Return whether all branches have an ancestor that is a void element |
||
| 313 | * |
||
| 314 | * @return bool |
||
| 315 | */ |
||
| 316 | public function isVoid() |
||
| 320 | |||
| 321 | /** |
||
| 322 | * Return whether this template preserves the whitespace in its descendants |
||
| 323 | * |
||
| 324 | * @return bool |
||
| 325 | */ |
||
| 326 | public function preservesNewLines() |
||
| 330 | |||
| 331 | /** |
||
| 332 | * Analyses the content of the whole template and sets $this->contentBitfield accordingly |
||
| 333 | */ |
||
| 334 | protected function analyseContent() |
||
| 347 | |||
| 348 | /** |
||
| 349 | * Records the HTML elements (and their bitfield) rendered at the root of the template |
||
| 350 | */ |
||
| 351 | protected function analyseRootNodes() |
||
| 386 | |||
| 387 | /** |
||
| 388 | * Analyses each branch that leads to an <xsl:apply-templates/> tag |
||
| 389 | */ |
||
| 390 | protected function analyseBranches() |
||
| 461 | |||
| 462 | /** |
||
| 463 | * Test whether any branch of this template has an element that has given property |
||
| 464 | * |
||
| 465 | * @param string $propName |
||
| 466 | * @return bool |
||
| 467 | */ |
||
| 468 | protected function anyBranchHasProperty($propName) |
||
| 483 | |||
| 484 | /** |
||
| 485 | * Compute the allowChildBitfields and denyDescendantBitfield properties |
||
| 486 | * |
||
| 487 | * @return void |
||
| 488 | */ |
||
| 489 | protected function computeBitfields() |
||
| 526 | |||
| 527 | /** |
||
| 528 | * Compute the allowsChildElements property |
||
| 529 | * |
||
| 530 | * A template allows child Elements if it has at least one xsl:apply-templates and none of its |
||
| 531 | * ancestors have the text-only ("to") property |
||
| 532 | * |
||
| 533 | * @return void |
||
| 534 | */ |
||
| 535 | protected function computeAllowsChildElements() |
||
| 539 | |||
| 540 | /** |
||
| 541 | * Compute the allowsText property |
||
| 542 | * |
||
| 543 | * A template is said to allow text if none of the leaf elements disallow text |
||
| 544 | * |
||
| 545 | * @return void |
||
| 546 | */ |
||
| 547 | protected function computeAllowsText() |
||
| 561 | |||
| 562 | /** |
||
| 563 | * Compute the isFormattingElement property |
||
| 564 | * |
||
| 565 | * A template is said to be a formatting element if all (non-zero) of its branches are entirely |
||
| 566 | * composed of formatting elements |
||
| 567 | * |
||
| 568 | * @return void |
||
| 569 | */ |
||
| 570 | protected function computeFormattingElement() |
||
| 586 | |||
| 587 | /** |
||
| 588 | * Compute the isEmpty property |
||
| 589 | * |
||
| 590 | * A template is said to be empty if it has no xsl:apply-templates elements or if there is an empty |
||
| 591 | * element ancestor to an xsl:apply-templates element |
||
| 592 | * |
||
| 593 | * @return void |
||
| 594 | */ |
||
| 595 | protected function computeIsEmpty() |
||
| 599 | |||
| 600 | /** |
||
| 601 | * Compute the isTransparent property |
||
| 602 | * |
||
| 603 | * A template is said to be transparent if it has at least one branch and no non-transparent |
||
| 604 | * elements in its path |
||
| 605 | * |
||
| 606 | * @return void |
||
| 607 | */ |
||
| 608 | protected function computeIsTransparent() |
||
| 624 | |||
| 625 | /** |
||
| 626 | * Compute the isVoid property |
||
| 627 | * |
||
| 628 | * A template is said to be void if it has no xsl:apply-templates elements or if there is a void |
||
| 629 | * element ancestor to an xsl:apply-templates element |
||
| 630 | * |
||
| 631 | * @return void |
||
| 632 | */ |
||
| 633 | protected function computeIsVoid() |
||
| 637 | |||
| 638 | /** |
||
| 639 | * Test whether given element is a block-level element |
||
| 640 | * |
||
| 641 | * @param DOMElement $element |
||
| 642 | * @return bool |
||
| 643 | */ |
||
| 644 | protected function elementIsBlock(DOMElement $element) |
||
| 658 | |||
| 659 | /** |
||
| 660 | * Retrieve and return the inline style assigned to given element |
||
| 661 | * |
||
| 662 | * @param DOMElement $node Context node |
||
| 663 | * @return string |
||
| 664 | */ |
||
| 665 | protected function getStyle(DOMElement $node) |
||
| 679 | |||
| 680 | /** |
||
| 681 | * Test whether given node is a span element used for formatting |
||
| 682 | * |
||
| 683 | * Will return TRUE if the node is a span element with a class attribute and/or a style attribute |
||
| 684 | * and no other attributes |
||
| 685 | * |
||
| 686 | * @param DOMElement $node |
||
| 687 | * @return boolean |
||
| 688 | */ |
||
| 689 | protected function isFormattingSpan(DOMElement $node) |
||
| 711 | |||
| 712 | /** |
||
| 713 | * Store the names of every leaf node |
||
| 714 | * |
||
| 715 | * A leaf node is defined as the closest non-XSL ancestor to an xsl:apply-templates element |
||
| 716 | * |
||
| 717 | * @return void |
||
| 718 | */ |
||
| 719 | protected function storeLeafNodes() |
||
| 726 | |||
| 727 | /** |
||
| 728 | * "What is this?" you might ask. This is basically a compressed version of the HTML5 content |
||
| 729 | * models and rules, with some liberties taken. |
||
| 730 | * |
||
| 731 | * For each element, up to three bitfields are defined: "c", "ac" and "dd". Bitfields are stored |
||
| 732 | * as raw bytes, formatted using the octal notation to keep the sources ASCII. |
||
| 733 | * |
||
| 734 | * "c" represents the categories the element belongs to. The categories are comprised of HTML5 |
||
| 735 | * content models (such as "phrasing content" or "interactive content") plus a few special |
||
| 736 | * categories created to cover the parts of the specs that refer to "a group of X and Y |
||
| 737 | * elements" rather than a specific content model. |
||
| 738 | * |
||
| 739 | * "ac" represents the categories that are allowed as children of given element. |
||
| 740 | * |
||
| 741 | * "dd" represents the categories that must not appear as a descendant of given element. |
||
| 742 | * |
||
| 743 | * Sometimes, HTML5 specifies some restrictions on when an element can accept certain children, |
||
| 744 | * or what categories the element belongs to. For example, an <img> element is only part of the |
||
| 745 | * "interactive content" category if it has a "usemap" attribute. Those restrictions are |
||
| 746 | * expressed as an XPath expression and stored using the concatenation of the key of the bitfield |
||
| 747 | * plus the bit number of the category. For instance, if "interactive content" got assigned to |
||
| 748 | * bit 2, the definition of the <img> element will contain a key "c2" with value "@usemap". |
||
| 749 | * |
||
| 750 | * Additionally, other flags are set: |
||
| 751 | * |
||
| 752 | * "t" indicates that the element uses the "transparent" content model. |
||
| 753 | * "e" indicates that the element uses the "empty" content model. |
||
| 754 | * "v" indicates that the element is a void element. |
||
| 755 | * "nt" indicates that the element does not accept text nodes. (no text) |
||
| 756 | * "to" indicates that the element should only contain text. (text-only) |
||
| 757 | * "fe" indicates that the element is a formatting element. It will automatically be reopened |
||
| 758 | * when closed by an end tag of a different name. |
||
| 759 | * "b" indicates that the element is not phrasing content, which makes it likely to act like |
||
| 760 | * a block element. |
||
| 761 | * |
||
| 762 | * Finally, HTML5 defines "optional end tag" rules, where one element automatically closes its |
||
| 763 | * predecessor. Those are used to generate closeParent rules and are stored in the "cp" key. |
||
| 764 | * |
||
| 765 | * @var array |
||
| 766 | * @see /scripts/patchTemplateInspector.php |
||
| 767 | */ |
||
| 768 | protected static $htmlElements = [ |
||
| 769 | 'a'=>['c'=>"\17\0\0\0\0\1",'c3'=>'@href','ac'=>"\0",'dd'=>"\10\0\0\0\0\1",'t'=>1,'fe'=>1], |
||
| 770 | 'abbr'=>['c'=>"\7",'ac'=>"\4",'dd'=>"\0"], |
||
| 771 | 'address'=>['c'=>"\3\40",'ac'=>"\1",'dd'=>"\0\45",'b'=>1,'cp'=>['p']], |
||
| 772 | 'article'=>['c'=>"\3\4",'ac'=>"\1",'dd'=>"\0",'b'=>1,'cp'=>['p']], |
||
| 773 | 'aside'=>['c'=>"\3\4",'ac'=>"\1",'dd'=>"\0\0\0\0\10",'b'=>1,'cp'=>['p']], |
||
| 774 | 'audio'=>['c'=>"\57",'c3'=>'@controls','c1'=>'@controls','ac'=>"\0\0\0\104",'ac26'=>'not(@src)','dd'=>"\0\0\0\0\0\2",'dd41'=>'@src','t'=>1], |
||
| 775 | 'b'=>['c'=>"\7",'ac'=>"\4",'dd'=>"\0",'fe'=>1], |
||
| 776 | 'base'=>['c'=>"\20",'ac'=>"\0",'dd'=>"\0",'nt'=>1,'e'=>1,'v'=>1,'b'=>1], |
||
| 777 | 'bdi'=>['c'=>"\7",'ac'=>"\4",'dd'=>"\0"], |
||
| 778 | 'bdo'=>['c'=>"\7",'ac'=>"\4",'dd'=>"\0"], |
||
| 779 | 'blockquote'=>['c'=>"\203",'ac'=>"\1",'dd'=>"\0",'b'=>1,'cp'=>['p']], |
||
| 780 | 'body'=>['c'=>"\200\0\4",'ac'=>"\1",'dd'=>"\0",'b'=>1], |
||
| 781 | 'br'=>['c'=>"\5",'ac'=>"\0",'dd'=>"\0",'nt'=>1,'e'=>1,'v'=>1], |
||
| 782 | 'button'=>['c'=>"\117",'ac'=>"\4",'dd'=>"\10"], |
||
| 783 | 'canvas'=>['c'=>"\47",'ac'=>"\0",'dd'=>"\0",'t'=>1], |
||
| 784 | 'caption'=>['c'=>"\0\2",'ac'=>"\1",'dd'=>"\0\0\0\200",'b'=>1], |
||
| 785 | 'cite'=>['c'=>"\7",'ac'=>"\4",'dd'=>"\0"], |
||
| 786 | 'code'=>['c'=>"\7",'ac'=>"\4",'dd'=>"\0",'fe'=>1], |
||
| 787 | 'col'=>['c'=>"\0\0\20",'ac'=>"\0",'dd'=>"\0",'nt'=>1,'e'=>1,'v'=>1,'b'=>1], |
||
| 788 | 'colgroup'=>['c'=>"\0\2",'ac'=>"\0\0\20",'ac20'=>'not(@span)','dd'=>"\0",'nt'=>1,'e'=>1,'e0'=>'@span','b'=>1], |
||
| 789 | 'data'=>['c'=>"\7",'ac'=>"\4",'dd'=>"\0"], |
||
| 790 | 'datalist'=>['c'=>"\5",'ac'=>"\4\200\0\10",'dd'=>"\0"], |
||
| 791 | 'dd'=>['c'=>"\0\0\200",'ac'=>"\1",'dd'=>"\0",'b'=>1,'cp'=>['dd','dt']], |
||
| 792 | 'del'=>['c'=>"\5",'ac'=>"\0",'dd'=>"\0",'t'=>1], |
||
| 793 | 'details'=>['c'=>"\213",'ac'=>"\1\0\0\2",'dd'=>"\0",'b'=>1,'cp'=>['p']], |
||
| 794 | 'dfn'=>['c'=>"\7\0\0\0\40",'ac'=>"\4",'dd'=>"\0\0\0\0\40"], |
||
| 795 | 'div'=>['c'=>"\3",'ac'=>"\1",'dd'=>"\0",'b'=>1,'cp'=>['p']], |
||
| 796 | 'dl'=>['c'=>"\3",'c1'=>'dt and dd','ac'=>"\0\200\200",'dd'=>"\0",'nt'=>1,'b'=>1,'cp'=>['p']], |
||
| 797 | 'dt'=>['c'=>"\0\0\200",'ac'=>"\1",'dd'=>"\0\5\0\40",'b'=>1,'cp'=>['dd','dt']], |
||
| 798 | 'em'=>['c'=>"\7",'ac'=>"\4",'dd'=>"\0",'fe'=>1], |
||
| 799 | 'embed'=>['c'=>"\57",'ac'=>"\0",'dd'=>"\0",'nt'=>1,'e'=>1,'v'=>1], |
||
| 800 | 'fieldset'=>['c'=>"\303",'ac'=>"\1\0\0\20",'dd'=>"\0",'b'=>1,'cp'=>['p']], |
||
| 801 | 'figcaption'=>['c'=>"\0\0\0\0\0\4",'ac'=>"\1",'dd'=>"\0",'b'=>1,'cp'=>['p']], |
||
| 802 | 'figure'=>['c'=>"\203",'ac'=>"\1\0\0\0\0\4",'dd'=>"\0",'b'=>1,'cp'=>['p']], |
||
| 803 | 'footer'=>['c'=>"\3\40",'ac'=>"\1",'dd'=>"\0\0\0\0\10",'b'=>1,'cp'=>['p']], |
||
| 804 | 'form'=>['c'=>"\3\0\0\0\20",'ac'=>"\1",'dd'=>"\0\0\0\0\20",'b'=>1,'cp'=>['p']], |
||
| 805 | 'h1'=>['c'=>"\3\1",'ac'=>"\4",'dd'=>"\0",'b'=>1,'cp'=>['p']], |
||
| 806 | 'h2'=>['c'=>"\3\1",'ac'=>"\4",'dd'=>"\0",'b'=>1,'cp'=>['p']], |
||
| 807 | 'h3'=>['c'=>"\3\1",'ac'=>"\4",'dd'=>"\0",'b'=>1,'cp'=>['p']], |
||
| 808 | 'h4'=>['c'=>"\3\1",'ac'=>"\4",'dd'=>"\0",'b'=>1,'cp'=>['p']], |
||
| 809 | 'h5'=>['c'=>"\3\1",'ac'=>"\4",'dd'=>"\0",'b'=>1,'cp'=>['p']], |
||
| 810 | 'h6'=>['c'=>"\3\1",'ac'=>"\4",'dd'=>"\0",'b'=>1,'cp'=>['p']], |
||
| 811 | 'head'=>['c'=>"\0\0\4",'ac'=>"\20",'dd'=>"\0",'nt'=>1,'b'=>1], |
||
| 812 | 'header'=>['c'=>"\3\40\0\40",'ac'=>"\1",'dd'=>"\0\0\0\0\10",'b'=>1,'cp'=>['p']], |
||
| 813 | 'hr'=>['c'=>"\1\100",'ac'=>"\0",'dd'=>"\0",'nt'=>1,'e'=>1,'v'=>1,'b'=>1,'cp'=>['p']], |
||
| 814 | 'html'=>['c'=>"\0",'ac'=>"\0\0\4",'dd'=>"\0",'nt'=>1,'b'=>1], |
||
| 815 | 'i'=>['c'=>"\7",'ac'=>"\4",'dd'=>"\0",'fe'=>1], |
||
| 816 | 'iframe'=>['c'=>"\57",'ac'=>"\4",'dd'=>"\0"], |
||
| 817 | 'img'=>['c'=>"\57\20\10",'c3'=>'@usemap','ac'=>"\0",'dd'=>"\0",'nt'=>1,'e'=>1,'v'=>1], |
||
| 818 | 'input'=>['c'=>"\17\20",'c3'=>'@type!="hidden"','c12'=>'@type!="hidden" or @type="hidden"','c1'=>'@type!="hidden"','ac'=>"\0",'dd'=>"\0",'nt'=>1,'e'=>1,'v'=>1], |
||
| 819 | 'ins'=>['c'=>"\7",'ac'=>"\0",'dd'=>"\0",'t'=>1], |
||
| 820 | 'kbd'=>['c'=>"\7",'ac'=>"\4",'dd'=>"\0"], |
||
| 821 | 'keygen'=>['c'=>"\117",'ac'=>"\0",'dd'=>"\0",'nt'=>1,'e'=>1,'v'=>1], |
||
| 822 | 'label'=>['c'=>"\17\20\0\0\4",'ac'=>"\4",'dd'=>"\0\0\1\0\4"], |
||
| 823 | 'legend'=>['c'=>"\0\0\0\20",'ac'=>"\4",'dd'=>"\0",'b'=>1], |
||
| 824 | 'li'=>['c'=>"\0\0\0\0\200",'ac'=>"\1",'dd'=>"\0",'b'=>1,'cp'=>['li']], |
||
| 825 | 'link'=>['c'=>"\20",'ac'=>"\0",'dd'=>"\0",'nt'=>1,'e'=>1,'v'=>1,'b'=>1], |
||
| 826 | 'main'=>['c'=>"\3\0\0\0\10",'ac'=>"\1",'dd'=>"\0",'b'=>1,'cp'=>['p']], |
||
| 827 | 'mark'=>['c'=>"\7",'ac'=>"\4",'dd'=>"\0"], |
||
| 828 | 'media element'=>['c'=>"\0\0\0\0\0\2",'ac'=>"\0",'dd'=>"\0",'nt'=>1,'b'=>1], |
||
| 829 | 'menu'=>['c'=>"\1\100",'ac'=>"\0\300",'dd'=>"\0",'nt'=>1,'b'=>1,'cp'=>['p']], |
||
| 830 | 'menuitem'=>['c'=>"\0\100",'ac'=>"\0",'dd'=>"\0",'nt'=>1,'e'=>1,'v'=>1,'b'=>1], |
||
| 831 | 'meta'=>['c'=>"\20",'ac'=>"\0",'dd'=>"\0",'nt'=>1,'e'=>1,'v'=>1,'b'=>1], |
||
| 832 | 'meter'=>['c'=>"\7\0\1\0\2",'ac'=>"\4",'dd'=>"\0\0\0\0\2"], |
||
| 833 | 'nav'=>['c'=>"\3\4",'ac'=>"\1",'dd'=>"\0\0\0\0\10",'b'=>1,'cp'=>['p']], |
||
| 834 | 'noscript'=>['c'=>"\25",'ac'=>"\0",'dd'=>"\0",'nt'=>1], |
||
| 835 | 'object'=>['c'=>"\147",'ac'=>"\0\0\0\0\1",'dd'=>"\0",'t'=>1], |
||
| 836 | 'ol'=>['c'=>"\3",'c1'=>'li','ac'=>"\0\200\0\0\200",'dd'=>"\0",'nt'=>1,'b'=>1,'cp'=>['p']], |
||
| 837 | 'optgroup'=>['c'=>"\0\0\2",'ac'=>"\0\200\0\10",'dd'=>"\0",'nt'=>1,'b'=>1,'cp'=>['optgroup','option']], |
||
| 838 | 'option'=>['c'=>"\0\0\2\10",'ac'=>"\0",'dd'=>"\0",'b'=>1,'cp'=>['option']], |
||
| 839 | 'output'=>['c'=>"\107",'ac'=>"\4",'dd'=>"\0"], |
||
| 840 | 'p'=>['c'=>"\3",'ac'=>"\4",'dd'=>"\0",'b'=>1,'cp'=>['p']], |
||
| 841 | 'param'=>['c'=>"\0\0\0\0\1",'ac'=>"\0",'dd'=>"\0",'nt'=>1,'e'=>1,'v'=>1,'b'=>1], |
||
| 842 | 'picture'=>['c'=>"\45",'ac'=>"\0\200\10",'dd'=>"\0",'nt'=>1], |
||
| 843 | 'pre'=>['c'=>"\3",'ac'=>"\4",'dd'=>"\0",'pre'=>1,'b'=>1,'cp'=>['p']], |
||
| 844 | 'progress'=>['c'=>"\7\0\1\1",'ac'=>"\4",'dd'=>"\0\0\0\1"], |
||
| 845 | 'q'=>['c'=>"\7",'ac'=>"\4",'dd'=>"\0"], |
||
| 846 | 'rb'=>['c'=>"\0\10",'ac'=>"\4",'dd'=>"\0",'b'=>1], |
||
| 847 | 'rp'=>['c'=>"\0\10\100",'ac'=>"\4",'dd'=>"\0",'b'=>1,'cp'=>['rp','rt']], |
||
| 848 | 'rt'=>['c'=>"\0\10\100",'ac'=>"\4",'dd'=>"\0",'b'=>1,'cp'=>['rp','rt']], |
||
| 849 | 'rtc'=>['c'=>"\0\10",'ac'=>"\4\0\100",'dd'=>"\0",'b'=>1], |
||
| 850 | 'ruby'=>['c'=>"\7",'ac'=>"\4\10",'dd'=>"\0"], |
||
| 851 | 's'=>['c'=>"\7",'ac'=>"\4",'dd'=>"\0",'fe'=>1], |
||
| 852 | 'samp'=>['c'=>"\7",'ac'=>"\4",'dd'=>"\0"], |
||
| 853 | 'script'=>['c'=>"\25\200",'ac'=>"\0",'dd'=>"\0",'to'=>1], |
||
| 854 | 'section'=>['c'=>"\3\4",'ac'=>"\1",'dd'=>"\0",'b'=>1,'cp'=>['p']], |
||
| 855 | 'select'=>['c'=>"\117",'ac'=>"\0\200\2",'dd'=>"\0",'nt'=>1], |
||
| 856 | 'small'=>['c'=>"\7",'ac'=>"\4",'dd'=>"\0",'fe'=>1], |
||
| 857 | 'source'=>['c'=>"\0\0\10\4",'ac'=>"\0",'dd'=>"\0",'nt'=>1,'e'=>1,'v'=>1,'b'=>1], |
||
| 858 | 'span'=>['c'=>"\7",'ac'=>"\4",'dd'=>"\0"], |
||
| 859 | 'strong'=>['c'=>"\7",'ac'=>"\4",'dd'=>"\0",'fe'=>1], |
||
| 860 | 'style'=>['c'=>"\20",'ac'=>"\0",'dd'=>"\0",'to'=>1,'b'=>1], |
||
| 861 | 'sub'=>['c'=>"\7",'ac'=>"\4",'dd'=>"\0"], |
||
| 862 | 'summary'=>['c'=>"\0\0\0\2",'ac'=>"\4\1",'dd'=>"\0",'b'=>1], |
||
| 863 | 'sup'=>['c'=>"\7",'ac'=>"\4",'dd'=>"\0"], |
||
| 864 | 'table'=>['c'=>"\3\0\0\200",'ac'=>"\0\202",'dd'=>"\0",'nt'=>1,'b'=>1,'cp'=>['p']], |
||
| 865 | 'tbody'=>['c'=>"\0\2",'ac'=>"\0\200\0\0\100",'dd'=>"\0",'nt'=>1,'b'=>1,'cp'=>['tbody','td','tfoot','th','thead','tr']], |
||
| 866 | 'td'=>['c'=>"\200\0\40",'ac'=>"\1",'dd'=>"\0",'b'=>1,'cp'=>['td','th']], |
||
| 867 | 'template'=>['c'=>"\25\200\20",'ac'=>"\0",'dd'=>"\0",'nt'=>1], |
||
| 868 | 'textarea'=>['c'=>"\117",'ac'=>"\0",'dd'=>"\0",'pre'=>1,'to'=>1], |
||
| 869 | 'tfoot'=>['c'=>"\0\2",'ac'=>"\0\200\0\0\100",'dd'=>"\0",'nt'=>1,'b'=>1,'cp'=>['tbody','td','th','thead','tr']], |
||
| 870 | 'th'=>['c'=>"\0\0\40",'ac'=>"\1",'dd'=>"\0\5\0\40",'b'=>1,'cp'=>['td','th']], |
||
| 871 | 'thead'=>['c'=>"\0\2",'ac'=>"\0\200\0\0\100",'dd'=>"\0",'nt'=>1,'b'=>1], |
||
| 872 | 'time'=>['c'=>"\7",'ac'=>"\4",'ac2'=>'@datetime','dd'=>"\0"], |
||
| 873 | 'title'=>['c'=>"\20",'ac'=>"\0",'dd'=>"\0",'to'=>1,'b'=>1], |
||
| 874 | 'tr'=>['c'=>"\0\2\0\0\100",'ac'=>"\0\200\40",'dd'=>"\0",'nt'=>1,'b'=>1,'cp'=>['td','th','tr']], |
||
| 875 | 'track'=>['c'=>"\0\0\0\100",'ac'=>"\0",'dd'=>"\0",'nt'=>1,'e'=>1,'v'=>1,'b'=>1], |
||
| 876 | 'u'=>['c'=>"\7",'ac'=>"\4",'dd'=>"\0",'fe'=>1], |
||
| 877 | 'ul'=>['c'=>"\3",'c1'=>'li','ac'=>"\0\200\0\0\200",'dd'=>"\0",'nt'=>1,'b'=>1,'cp'=>['p']], |
||
| 878 | 'var'=>['c'=>"\7",'ac'=>"\4",'dd'=>"\0"], |
||
| 879 | 'video'=>['c'=>"\57",'c3'=>'@controls','ac'=>"\0\0\0\104",'ac26'=>'not(@src)','dd'=>"\0\0\0\0\0\2",'dd41'=>'@src','t'=>1], |
||
| 880 | 'wbr'=>['c'=>"\5",'ac'=>"\0",'dd'=>"\0",'nt'=>1,'e'=>1,'v'=>1] |
||
| 881 | ]; |
||
| 882 | |||
| 883 | /** |
||
| 884 | * Get the bitfield value for a given element in a given context |
||
| 885 | * |
||
| 886 | * @param DOMElement $element Context node |
||
| 887 | * @param string $k Bitfield name: either 'c', 'ac' or 'dd' |
||
| 888 | * @return string |
||
| 889 | */ |
||
| 890 | protected function getBitfield(DOMElement $element, $k) |
||
| 933 | |||
| 934 | /** |
||
| 935 | * Test whether given element has given property in context |
||
| 936 | * |
||
| 937 | * @param string $elName Element name |
||
| 938 | * @param string $propName Property name, see self::$htmlElements |
||
| 939 | * @param DOMElement $node Context node |
||
| 940 | * @return bool |
||
| 941 | */ |
||
| 942 | protected function hasProperty($elName, $propName, DOMElement $node) |
||
| 956 | |||
| 957 | /** |
||
| 958 | * Test whether two bitfields have any bits in common |
||
| 959 | * |
||
| 960 | * @param string $bitfield1 |
||
| 961 | * @param string $bitfield2 |
||
| 962 | * @return bool |
||
| 963 | */ |
||
| 964 | protected static function match($bitfield1, $bitfield2) |
||
| 968 | } |