@@ -15,17 +15,17 @@ discard block |
||
| 15 | 15 | * |
| 16 | 16 | * @return array |
| 17 | 17 | */ |
| 18 | - public static function parse( $html ) { |
|
| 19 | - $toBeEscaped = Strings::isAnEscapedHTML( $html ); |
|
| 18 | + public static function parse($html) { |
|
| 19 | + $toBeEscaped = Strings::isAnEscapedHTML($html); |
|
| 20 | 20 | |
| 21 | - if ( $toBeEscaped ) { |
|
| 22 | - $html = Strings::htmlspecialchars_decode( $html ); |
|
| 21 | + if ($toBeEscaped) { |
|
| 22 | + $html = Strings::htmlspecialchars_decode($html); |
|
| 23 | 23 | } |
| 24 | 24 | |
| 25 | - $html = self::protectNotClosedHtmlTags( $html ); |
|
| 26 | - $html = self::protectNotHtmlLessThanSymbols( $html ); |
|
| 25 | + $html = self::protectNotClosedHtmlTags($html); |
|
| 26 | + $html = self::protectNotHtmlLessThanSymbols($html); |
|
| 27 | 27 | |
| 28 | - return self::extractHtmlNode( $html, $toBeEscaped ); |
|
| 28 | + return self::extractHtmlNode($html, $toBeEscaped); |
|
| 29 | 29 | } |
| 30 | 30 | |
| 31 | 31 | /** |
@@ -43,41 +43,41 @@ discard block |
||
| 43 | 43 | * |
| 44 | 44 | * @return string |
| 45 | 45 | */ |
| 46 | - private static function protectNotHtmlLessThanSymbols( $html ) { |
|
| 47 | - preg_match_all( '/<|>/iu', $html, $matches, PREG_OFFSET_CAPTURE ); |
|
| 46 | + private static function protectNotHtmlLessThanSymbols($html) { |
|
| 47 | + preg_match_all('/<|>/iu', $html, $matches, PREG_OFFSET_CAPTURE); |
|
| 48 | 48 | |
| 49 | 49 | $delta = 0; |
| 50 | 50 | $realNextOffset = 0; |
| 51 | 51 | $next = null; |
| 52 | 52 | |
| 53 | - foreach ( $matches[ 0 ] as $key => $match ) { |
|
| 53 | + foreach ($matches[0] as $key => $match) { |
|
| 54 | 54 | |
| 55 | - $current = $matches[ 0 ][ $key ][ 0 ]; |
|
| 55 | + $current = $matches[0][$key][0]; |
|
| 56 | 56 | |
| 57 | - if ( isset( $matches[ 0 ][ $key + 1 ][ 0 ] ) ) { |
|
| 58 | - $next = $matches[ 0 ][ $key + 1 ][ 0 ]; |
|
| 59 | - $nextOffset = $matches[ 0 ][ $key + 1 ][ 1 ]; |
|
| 60 | - $realNextOffset = ( $delta === 0 ) ? $nextOffset : ( $nextOffset + $delta ); |
|
| 57 | + if (isset($matches[0][$key + 1][0])) { |
|
| 58 | + $next = $matches[0][$key + 1][0]; |
|
| 59 | + $nextOffset = $matches[0][$key + 1][1]; |
|
| 60 | + $realNextOffset = ($delta === 0) ? $nextOffset : ($nextOffset + $delta); |
|
| 61 | 61 | } |
| 62 | 62 | |
| 63 | - $length = strlen( $match[ 0 ] ); |
|
| 64 | - $offset = $matches[ 0 ][ $key ][ 1 ]; |
|
| 65 | - $realOffset = ( $delta === 0 ) ? $offset : ( $offset + $delta ); |
|
| 63 | + $length = strlen($match[0]); |
|
| 64 | + $offset = $matches[0][$key][1]; |
|
| 65 | + $realOffset = ($delta === 0) ? $offset : ($offset + $delta); |
|
| 66 | 66 | |
| 67 | - if ( $current === '<' && isset( $next ) ) { |
|
| 67 | + if ($current === '<' && isset($next)) { |
|
| 68 | 68 | |
| 69 | 69 | // 1. if next is > or |
| 70 | 70 | // 2. next is < and is not html tag (like < >) |
| 71 | - $insideAngularTags = substr( $html, $realOffset, ( $realNextOffset - $realOffset + 1 ) ); |
|
| 71 | + $insideAngularTags = substr($html, $realOffset, ($realNextOffset - $realOffset + 1)); |
|
| 72 | 72 | |
| 73 | - if ( $next !== '>' || !Strings::isHtmlString( $insideAngularTags ) ) { |
|
| 74 | - $html = substr_replace( $html, self::LT_PLACEHOLDER, $realOffset, $length ); |
|
| 75 | - $delta = $delta + strlen( self::LT_PLACEHOLDER ) - $length; |
|
| 73 | + if ($next !== '>' || !Strings::isHtmlString($insideAngularTags)) { |
|
| 74 | + $html = substr_replace($html, self::LT_PLACEHOLDER, $realOffset, $length); |
|
| 75 | + $delta = $delta + strlen(self::LT_PLACEHOLDER) - $length; |
|
| 76 | 76 | } |
| 77 | 77 | } |
| 78 | 78 | } |
| 79 | 79 | |
| 80 | - return !is_array( $html ) ? $html : implode( $html ); |
|
| 80 | + return !is_array($html) ? $html : implode($html); |
|
| 81 | 81 | } |
| 82 | 82 | |
| 83 | 83 | /** |
@@ -95,29 +95,29 @@ discard block |
||
| 95 | 95 | * |
| 96 | 96 | * @return string |
| 97 | 97 | */ |
| 98 | - private static function protectNotClosedHtmlTags( $html ) { |
|
| 99 | - preg_match_all( '/<|>/iu', $html, $matches, PREG_OFFSET_CAPTURE ); |
|
| 98 | + private static function protectNotClosedHtmlTags($html) { |
|
| 99 | + preg_match_all('/<|>/iu', $html, $matches, PREG_OFFSET_CAPTURE); |
|
| 100 | 100 | |
| 101 | 101 | $tags = []; |
| 102 | 102 | $offsets = []; |
| 103 | 103 | $originalLengths = []; |
| 104 | 104 | |
| 105 | 105 | // 1. Map all tags |
| 106 | - foreach ( $matches[ 0 ] as $key => $match ) { |
|
| 107 | - $current = $matches[ 0 ][ $key ][ 0 ]; |
|
| 108 | - $currentOffset = $matches[ 0 ][ $key ][ 1 ]; |
|
| 106 | + foreach ($matches[0] as $key => $match) { |
|
| 107 | + $current = $matches[0][$key][0]; |
|
| 108 | + $currentOffset = $matches[0][$key][1]; |
|
| 109 | 109 | |
| 110 | 110 | // check every string inside angular brackets (< and >) |
| 111 | - if ( $current === '<' && isset( $matches[ 0 ][ $key + 1 ][ 0 ] ) && $matches[ 0 ][ $key + 1 ][ 0 ] === '>' ) { |
|
| 112 | - $nextOffset = $matches[ 0 ][ $key + 1 ][ 1 ]; |
|
| 113 | - $tag = substr( $html, ( $currentOffset + 1 ), ( $nextOffset - $currentOffset - 1 ) ); |
|
| 114 | - $trimmedTag = trim( $tag ); |
|
| 111 | + if ($current === '<' && isset($matches[0][$key + 1][0]) && $matches[0][$key + 1][0] === '>') { |
|
| 112 | + $nextOffset = $matches[0][$key + 1][1]; |
|
| 113 | + $tag = substr($html, ($currentOffset + 1), ($nextOffset - $currentOffset - 1)); |
|
| 114 | + $trimmedTag = trim($tag); |
|
| 115 | 115 | |
| 116 | 116 | // if the tag is self closed do nothing |
| 117 | - if ( Strings::lastChar( $tag ) !== '/' ) { |
|
| 117 | + if (Strings::lastChar($tag) !== '/') { |
|
| 118 | 118 | $tags[] = $trimmedTag; |
| 119 | 119 | $offsets[] = $currentOffset; |
| 120 | - $originalLengths[] = strlen( $tag ) + 2; // add 2 to length because there are < and > |
|
| 120 | + $originalLengths[] = strlen($tag) + 2; // add 2 to length because there are < and > |
|
| 121 | 121 | } |
| 122 | 122 | } |
| 123 | 123 | } |
@@ -125,47 +125,47 @@ discard block |
||
| 125 | 125 | // 2. Removing closed tags |
| 126 | 126 | $indexes = []; |
| 127 | 127 | |
| 128 | - if ( count( $tags ) > 0 ) { |
|
| 129 | - foreach ( $tags as $index => $tag ) { |
|
| 128 | + if (count($tags) > 0) { |
|
| 129 | + foreach ($tags as $index => $tag) { |
|
| 130 | 130 | |
| 131 | - if ( Strings::contains( '/', $tag ) ) { |
|
| 131 | + if (Strings::contains('/', $tag)) { |
|
| 132 | 132 | $complementaryTag = $tag; |
| 133 | 133 | } else { |
| 134 | - $complementaryTag = '/' . explode( ' ', $tag )[ 0 ]; |
|
| 134 | + $complementaryTag = '/' . explode(' ', $tag)[0]; |
|
| 135 | 135 | } |
| 136 | 136 | |
| 137 | - $complementaryTagIndex = array_search( $complementaryTag, $tags ); |
|
| 137 | + $complementaryTagIndex = array_search($complementaryTag, $tags); |
|
| 138 | 138 | |
| 139 | - if ( false !== $complementaryTagIndex ) { |
|
| 139 | + if (false !== $complementaryTagIndex) { |
|
| 140 | 140 | $indexes[] = $index; |
| 141 | 141 | $indexes[] = $complementaryTagIndex; |
| 142 | 142 | } |
| 143 | 143 | } |
| 144 | 144 | } |
| 145 | 145 | |
| 146 | - $indexes = array_unique( $indexes ); |
|
| 147 | - foreach ( $indexes as $index ) { |
|
| 148 | - unset( $tags[ $index ] ); |
|
| 146 | + $indexes = array_unique($indexes); |
|
| 147 | + foreach ($indexes as $index) { |
|
| 148 | + unset($tags[$index]); |
|
| 149 | 149 | } |
| 150 | 150 | |
| 151 | 151 | // 3. Loop not closed tags |
| 152 | 152 | $delta = 0; |
| 153 | 153 | |
| 154 | - if ( count( $tags ) ) { |
|
| 155 | - foreach ( $tags as $index => $tag ) { |
|
| 154 | + if (count($tags)) { |
|
| 155 | + foreach ($tags as $index => $tag) { |
|
| 156 | 156 | |
| 157 | - $length = $originalLengths[ $index ]; |
|
| 158 | - $offset = $offsets[ $index ]; |
|
| 159 | - $realOffset = ( $delta === 0 ) ? $offset : ( $offset + $delta ); |
|
| 157 | + $length = $originalLengths[$index]; |
|
| 158 | + $offset = $offsets[$index]; |
|
| 159 | + $realOffset = ($delta === 0) ? $offset : ($offset + $delta); |
|
| 160 | 160 | |
| 161 | 161 | $replacement = self::LT_PLACEHOLDER . $tag . self::GT_PLACEHOLDER; |
| 162 | 162 | |
| 163 | - $html = substr_replace( $html, $replacement, $realOffset, $length ); |
|
| 164 | - $delta = $delta + strlen( $replacement ) - $length; |
|
| 163 | + $html = substr_replace($html, $replacement, $realOffset, $length); |
|
| 164 | + $delta = $delta + strlen($replacement) - $length; |
|
| 165 | 165 | } |
| 166 | 166 | } |
| 167 | 167 | |
| 168 | - return !is_array( $html ) ? $html : implode( $html ); |
|
| 168 | + return !is_array($html) ? $html : implode($html); |
|
| 169 | 169 | } |
| 170 | 170 | |
| 171 | 171 | /** |
@@ -174,55 +174,55 @@ discard block |
||
| 174 | 174 | * |
| 175 | 175 | * @return array |
| 176 | 176 | */ |
| 177 | - private static function extractHtmlNode( $html, $toBeEscaped = false ) { |
|
| 177 | + private static function extractHtmlNode($html, $toBeEscaped = false) { |
|
| 178 | 178 | $pattern = "/<([a-zA-Z0-9._-]+)([^>]|[^<]*?)(([\s]*\/>)|" . |
| 179 | 179 | "(>((([^<]*?|<\!\-\-.*?\-\->)|(?R))*)<\/\\1[\s]*>))/sm"; |
| 180 | - preg_match_all( $pattern, $html, $matches, PREG_OFFSET_CAPTURE ); |
|
| 180 | + preg_match_all($pattern, $html, $matches, PREG_OFFSET_CAPTURE); |
|
| 181 | 181 | |
| 182 | 182 | $elements = []; |
| 183 | 183 | |
| 184 | - foreach ( $matches[ 0 ] as $key => $match ) { |
|
| 184 | + foreach ($matches[0] as $key => $match) { |
|
| 185 | 185 | |
| 186 | - $attributes = isset( $matches[ 2 ][ $key ][ 0 ] ) ? self::getAttributes( $matches[ 2 ][ $key ][ 0 ] ) : []; |
|
| 187 | - $base64Decoded = ( isset( $attributes[ 'equiv-text' ] ) ) ? base64_decode( str_replace( "base64:", "", $attributes[ 'equiv-text' ] ) ) : null; |
|
| 188 | - $tagName = $matches[ 1 ][ $key ][ 0 ]; |
|
| 189 | - $text = !empty( $matches[ 6 ][ $key ][ 0 ] ) ? $matches[ 6 ][ $key ][ 0 ] : ""; |
|
| 186 | + $attributes = isset($matches[2][$key][0]) ? self::getAttributes($matches[2][$key][0]) : []; |
|
| 187 | + $base64Decoded = (isset($attributes['equiv-text'])) ? base64_decode(str_replace("base64:", "", $attributes['equiv-text'])) : null; |
|
| 188 | + $tagName = $matches[1][$key][0]; |
|
| 189 | + $text = !empty($matches[6][$key][0]) ? $matches[6][$key][0] : ""; |
|
| 190 | 190 | $originalText = $text; |
| 191 | - $strippedText = strip_tags( $text ); |
|
| 191 | + $strippedText = strip_tags($text); |
|
| 192 | 192 | |
| 193 | 193 | // get start and end tags |
| 194 | - $explodedNode = explode( self::ORIGINAL_TEXT_PLACEHOLDER, str_replace( $originalText, self::ORIGINAL_TEXT_PLACEHOLDER, $match[ 0 ] ) ); |
|
| 194 | + $explodedNode = explode(self::ORIGINAL_TEXT_PLACEHOLDER, str_replace($originalText, self::ORIGINAL_TEXT_PLACEHOLDER, $match[0])); |
|
| 195 | 195 | |
| 196 | - $start = ( isset( $explodedNode[ 0 ] ) ) ? $explodedNode[ 0 ] : ""; |
|
| 197 | - $end = ( isset( $explodedNode[ 1 ] ) ) ? $explodedNode[ 1 ] : ""; |
|
| 196 | + $start = (isset($explodedNode[0])) ? $explodedNode[0] : ""; |
|
| 197 | + $end = (isset($explodedNode[1])) ? $explodedNode[1] : ""; |
|
| 198 | 198 | |
| 199 | 199 | // inner_html |
| 200 | - $inner_html = self::getInnerHtml( $matches, $key, $toBeEscaped ); |
|
| 200 | + $inner_html = self::getInnerHtml($matches, $key, $toBeEscaped); |
|
| 201 | 201 | |
| 202 | 202 | // node |
| 203 | - $node = self::rebuildNode( $originalText, $toBeEscaped, $start, $end ); |
|
| 203 | + $node = self::rebuildNode($originalText, $toBeEscaped, $start, $end); |
|
| 204 | 204 | |
| 205 | 205 | // terminator |
| 206 | - $terminator = ( $toBeEscaped ) ? '>' : '>'; |
|
| 206 | + $terminator = ($toBeEscaped) ? '>' : '>'; |
|
| 207 | 207 | |
| 208 | 208 | // self closed |
| 209 | - $selfClosed = Strings::contains( '/>', trim( $start ) ); |
|
| 209 | + $selfClosed = Strings::contains('/>', trim($start)); |
|
| 210 | 210 | |
| 211 | 211 | $elements[] = (object)[ |
| 212 | - 'node' => self::restoreLessThanAndGreaterThanSymbols( $node ), |
|
| 213 | - 'start' => self::restoreLessThanAndGreaterThanSymbols( $start ), |
|
| 214 | - 'end' => self::restoreLessThanAndGreaterThanSymbols( $end ), |
|
| 212 | + 'node' => self::restoreLessThanAndGreaterThanSymbols($node), |
|
| 213 | + 'start' => self::restoreLessThanAndGreaterThanSymbols($start), |
|
| 214 | + 'end' => self::restoreLessThanAndGreaterThanSymbols($end), |
|
| 215 | 215 | 'terminator' => $terminator, |
| 216 | - 'offset' => $match[ 1 ], |
|
| 216 | + 'offset' => $match[1], |
|
| 217 | 217 | 'tagname' => $tagName, |
| 218 | 218 | 'attributes' => $attributes, |
| 219 | 219 | 'base64_decoded' => $base64Decoded, |
| 220 | 220 | 'self_closed' => $selfClosed, |
| 221 | - 'omittag' => ( $matches[ 4 ][ $key ][ 1 ] > -1 ), // boolean |
|
| 221 | + 'omittag' => ($matches[4][$key][1] > -1), // boolean |
|
| 222 | 222 | 'inner_html' => $inner_html, |
| 223 | - 'has_children' => is_array( $inner_html ), |
|
| 224 | - 'original_text' => ( $toBeEscaped ) ? self::restoreLessThanAndGreaterThanSymbols( Strings::escapeOnlyHTMLTags( $originalText ) ) : self::restoreLessThanAndGreaterThanSymbols( $originalText ), |
|
| 225 | - 'stripped_text' => self::restoreLessThanAndGreaterThanSymbols( $strippedText ), |
|
| 223 | + 'has_children' => is_array($inner_html), |
|
| 224 | + 'original_text' => ($toBeEscaped) ? self::restoreLessThanAndGreaterThanSymbols(Strings::escapeOnlyHTMLTags($originalText)) : self::restoreLessThanAndGreaterThanSymbols($originalText), |
|
| 225 | + 'stripped_text' => self::restoreLessThanAndGreaterThanSymbols($strippedText), |
|
| 226 | 226 | ]; |
| 227 | 227 | } |
| 228 | 228 | |
@@ -234,8 +234,8 @@ discard block |
||
| 234 | 234 | * |
| 235 | 235 | * @return string|string[] |
| 236 | 236 | */ |
| 237 | - private static function restoreLessThanAndGreaterThanSymbols( $text ) { |
|
| 238 | - return str_replace( [ self::LT_PLACEHOLDER, self::GT_PLACEHOLDER ], [ '<', '>' ], $text ); |
|
| 237 | + private static function restoreLessThanAndGreaterThanSymbols($text) { |
|
| 238 | + return str_replace([self::LT_PLACEHOLDER, self::GT_PLACEHOLDER], ['<', '>'], $text); |
|
| 239 | 239 | } |
| 240 | 240 | |
| 241 | 241 | /** |
@@ -246,17 +246,17 @@ discard block |
||
| 246 | 246 | * |
| 247 | 247 | * @return string |
| 248 | 248 | */ |
| 249 | - private static function rebuildNode( $originalText, $toBeEscaped, $start = null, $end = null ) { |
|
| 249 | + private static function rebuildNode($originalText, $toBeEscaped, $start = null, $end = null) { |
|
| 250 | 250 | $node = ''; |
| 251 | 251 | |
| 252 | - if ( !empty( $start ) ) { |
|
| 253 | - $node .= ( $toBeEscaped ) ? Strings::escapeOnlyHTMLTags( $start ) : $start; |
|
| 252 | + if (!empty($start)) { |
|
| 253 | + $node .= ($toBeEscaped) ? Strings::escapeOnlyHTMLTags($start) : $start; |
|
| 254 | 254 | } |
| 255 | 255 | |
| 256 | - $node .= ( $toBeEscaped ) ? Strings::escapeOnlyHTMLTags( $originalText ) : $originalText; |
|
| 256 | + $node .= ($toBeEscaped) ? Strings::escapeOnlyHTMLTags($originalText) : $originalText; |
|
| 257 | 257 | |
| 258 | - if ( !empty( $end ) ) { |
|
| 259 | - $node .= ( $toBeEscaped ) ? Strings::escapeOnlyHTMLTags( $end ) : $end; |
|
| 258 | + if (!empty($end)) { |
|
| 259 | + $node .= ($toBeEscaped) ? Strings::escapeOnlyHTMLTags($end) : $end; |
|
| 260 | 260 | } |
| 261 | 261 | |
| 262 | 262 | return $node; |
@@ -267,16 +267,16 @@ discard block |
||
| 267 | 267 | * |
| 268 | 268 | * @return mixed |
| 269 | 269 | */ |
| 270 | - public static function getAttributes( $content ) { |
|
| 270 | + public static function getAttributes($content) { |
|
| 271 | 271 | $pattern = '/(.*?)=("|\'|\\\")(.*?)("|\'|\\\"|\\\')/'; |
| 272 | 272 | |
| 273 | - preg_match_all( $pattern, $content, $matches, PREG_OFFSET_CAPTURE ); |
|
| 273 | + preg_match_all($pattern, $content, $matches, PREG_OFFSET_CAPTURE); |
|
| 274 | 274 | |
| 275 | 275 | $attributes = []; |
| 276 | 276 | |
| 277 | - if ( isset( $matches[ 1 ] ) && count( $matches[ 1 ] ) > 0 ) { |
|
| 278 | - foreach ( $matches[ 1 ] as $key => $match ) { |
|
| 279 | - $attributes[ trim( $match[ 0 ] ) ] = $matches[ 3 ][ $key ][ 0 ]; |
|
| 277 | + if (isset($matches[1]) && count($matches[1]) > 0) { |
|
| 278 | + foreach ($matches[1] as $key => $match) { |
|
| 279 | + $attributes[trim($match[0])] = $matches[3][$key][0]; |
|
| 280 | 280 | } |
| 281 | 281 | } |
| 282 | 282 | |
@@ -291,11 +291,11 @@ discard block |
||
| 291 | 291 | * |
| 292 | 292 | * @return array|mixed|string |
| 293 | 293 | */ |
| 294 | - private static function getInnerHtml( $matches, $key, $toBeEscaped = false ) { |
|
| 295 | - if ( isset( $matches[ 6 ][ $key ][ 0 ] ) ) { |
|
| 296 | - $node = self::extractHtmlNode( $matches[ 6 ][ $key ][ 0 ], $toBeEscaped ); |
|
| 294 | + private static function getInnerHtml($matches, $key, $toBeEscaped = false) { |
|
| 295 | + if (isset($matches[6][$key][0])) { |
|
| 296 | + $node = self::extractHtmlNode($matches[6][$key][0], $toBeEscaped); |
|
| 297 | 297 | |
| 298 | - return ( !empty( $node ) ) ? $node : $matches[ 6 ][ $key ][ 0 ]; |
|
| 298 | + return (!empty($node)) ? $node : $matches[6][$key][0]; |
|
| 299 | 299 | } |
| 300 | 300 | |
| 301 | 301 | return null; |
@@ -7404,7 +7404,7 @@ |
||
| 7404 | 7404 | ' |
@@ -7402,7 +7402,7 @@ |
||
| 7402 | 7402 | ' |
@@ -16,7 +16,7 @@ discard block |
||
| 16 | 16 | * |
| 17 | 17 | * @param array $map |
| 18 | 18 | */ |
| 19 | - public function __construct( array $map = null ) { |
|
| 19 | + public function __construct(array $map = null) { |
|
| 20 | 20 | $this->map = $map; |
| 21 | 21 | } |
| 22 | 22 | |
@@ -31,38 +31,38 @@ discard block |
||
| 31 | 31 | * |
| 32 | 32 | * @return string |
| 33 | 33 | */ |
| 34 | - public function replace( $string ) { |
|
| 34 | + public function replace($string) { |
|
| 35 | 35 | // if map is empty |
| 36 | 36 | // or the string has not a dataRef attribute |
| 37 | 37 | // return string as is |
| 38 | - if ( empty( $this->map ) || !$this->hasAnyDataRefAttribute( $string ) ) { |
|
| 38 | + if (empty($this->map) || !$this->hasAnyDataRefAttribute($string)) { |
|
| 39 | 39 | return $string; |
| 40 | 40 | } |
| 41 | 41 | |
| 42 | 42 | // (recursively) clean string from equiv-text eventually present |
| 43 | - $string = $this->cleanFromEquivText( $string ); |
|
| 43 | + $string = $this->cleanFromEquivText($string); |
|
| 44 | 44 | |
| 45 | - $html = HtmlParser::parse( $string ); |
|
| 45 | + $html = HtmlParser::parse($string); |
|
| 46 | 46 | |
| 47 | 47 | // 1. Replace <ph>|<sc>|<ec> tags |
| 48 | - foreach ( $html as $node ) { |
|
| 49 | - $string = $this->recursiveAddEquivTextToPhTag( $node, $string ); |
|
| 48 | + foreach ($html as $node) { |
|
| 49 | + $string = $this->recursiveAddEquivTextToPhTag($node, $string); |
|
| 50 | 50 | } |
| 51 | 51 | |
| 52 | 52 | // 2. Replace <pc> tags |
| 53 | - $toBeEscaped = Strings::isAnEscapedHTML( $string ); |
|
| 53 | + $toBeEscaped = Strings::isAnEscapedHTML($string); |
|
| 54 | 54 | |
| 55 | - if ( $this->stringContainsPcTags( $string, $toBeEscaped ) ) { |
|
| 55 | + if ($this->stringContainsPcTags($string, $toBeEscaped)) { |
|
| 56 | 56 | |
| 57 | 57 | // replace self-closed <pc /> |
| 58 | - $string = $this->replaceSelfClosedPcTags( $string, $toBeEscaped ); |
|
| 58 | + $string = $this->replaceSelfClosedPcTags($string, $toBeEscaped); |
|
| 59 | 59 | |
| 60 | 60 | // create a dataRefEnd map |
| 61 | 61 | // (needed for correct handling of </pc> closing tags) |
| 62 | - $dataRefEndMap = $this->buildDataRefEndMap( $html ); |
|
| 63 | - $string = $this->replaceOpeningPcTags( $string, $toBeEscaped ); |
|
| 64 | - $string = $this->replaceClosingPcTags( $string, $toBeEscaped, $dataRefEndMap ); |
|
| 65 | - $string = ( $toBeEscaped ) ? Strings::escapeOnlyHTMLTags( $string ) : $string; |
|
| 62 | + $dataRefEndMap = $this->buildDataRefEndMap($html); |
|
| 63 | + $string = $this->replaceOpeningPcTags($string, $toBeEscaped); |
|
| 64 | + $string = $this->replaceClosingPcTags($string, $toBeEscaped, $dataRefEndMap); |
|
| 65 | + $string = ($toBeEscaped) ? Strings::escapeOnlyHTMLTags($string) : $string; |
|
| 66 | 66 | } |
| 67 | 67 | |
| 68 | 68 | return $string; |
@@ -73,17 +73,17 @@ discard block |
||
| 73 | 73 | * |
| 74 | 74 | * @return bool |
| 75 | 75 | */ |
| 76 | - private function hasAnyDataRefAttribute( $string ) { |
|
| 76 | + private function hasAnyDataRefAttribute($string) { |
|
| 77 | 77 | $dataRefTags = [ |
| 78 | 78 | 'dataRef', |
| 79 | 79 | 'dataRefStart', |
| 80 | 80 | 'dataRefEnd', |
| 81 | 81 | ]; |
| 82 | 82 | |
| 83 | - foreach ( $dataRefTags as $tag ) { |
|
| 84 | - preg_match( '/ ' . $tag . '=[\\\\"](.*?)[\\\\"]/', $string, $matches ); |
|
| 83 | + foreach ($dataRefTags as $tag) { |
|
| 84 | + preg_match('/ ' . $tag . '=[\\\\"](.*?)[\\\\"]/', $string, $matches); |
|
| 85 | 85 | |
| 86 | - if ( count( $matches ) > 0 ) { |
|
| 86 | + if (count($matches) > 0) { |
|
| 87 | 87 | return true; |
| 88 | 88 | } |
| 89 | 89 | } |
@@ -94,11 +94,11 @@ discard block |
||
| 94 | 94 | * |
| 95 | 95 | * @return string |
| 96 | 96 | */ |
| 97 | - private function cleanFromEquivText( $string ) { |
|
| 98 | - $html = HtmlParser::parse( $string ); |
|
| 97 | + private function cleanFromEquivText($string) { |
|
| 98 | + $html = HtmlParser::parse($string); |
|
| 99 | 99 | |
| 100 | - foreach ( $html as $node ) { |
|
| 101 | - $string = $this->recursiveCleanFromEquivText( $node, $string ); |
|
| 100 | + foreach ($html as $node) { |
|
| 101 | + $string = $this->recursiveCleanFromEquivText($node, $string); |
|
| 102 | 102 | } |
| 103 | 103 | |
| 104 | 104 | return $string; |
@@ -117,57 +117,57 @@ discard block |
||
| 117 | 117 | * |
| 118 | 118 | * @return string |
| 119 | 119 | */ |
| 120 | - private function recursiveAddEquivTextToPhTag( $node, $string ) { |
|
| 121 | - if ( $node->has_children ) { |
|
| 122 | - foreach ( $node->inner_html as $childNode ) { |
|
| 123 | - $string = $this->recursiveAddEquivTextToPhTag( $childNode, $string ); |
|
| 120 | + private function recursiveAddEquivTextToPhTag($node, $string) { |
|
| 121 | + if ($node->has_children) { |
|
| 122 | + foreach ($node->inner_html as $childNode) { |
|
| 123 | + $string = $this->recursiveAddEquivTextToPhTag($childNode, $string); |
|
| 124 | 124 | } |
| 125 | 125 | } else { |
| 126 | - if ( $node->tagname === 'ph' || $node->tagname === 'sc' || $node->tagname === 'ec' ) { |
|
| 127 | - if ( !isset( $node->attributes[ 'dataRef' ] ) ) { |
|
| 126 | + if ($node->tagname === 'ph' || $node->tagname === 'sc' || $node->tagname === 'ec') { |
|
| 127 | + if (!isset($node->attributes['dataRef'])) { |
|
| 128 | 128 | return $string; |
| 129 | 129 | } |
| 130 | 130 | |
| 131 | - $a = $node->node; // complete match. Eg: <ph id="source1" dataRef="source1"/> |
|
| 132 | - $b = $node->attributes[ 'dataRef' ]; // map identifier. Eg: source1 |
|
| 131 | + $a = $node->node; // complete match. Eg: <ph id="source1" dataRef="source1"/> |
|
| 132 | + $b = $node->attributes['dataRef']; // map identifier. Eg: source1 |
|
| 133 | 133 | |
| 134 | 134 | |
| 135 | 135 | // if isset a value in the map calculate base64 encoded value |
| 136 | 136 | // otherwise skip |
| 137 | - if ( !in_array( $b, array_keys( $this->map ) ) ) { |
|
| 137 | + if (!in_array($b, array_keys($this->map))) { |
|
| 138 | 138 | return $string; |
| 139 | 139 | } |
| 140 | 140 | |
| 141 | 141 | // check if is null, in this case convert it to NULL string |
| 142 | - if ( is_null( $this->map[ $b ] ) ) { |
|
| 143 | - $this->map[ $b ] = 'NULL'; |
|
| 142 | + if (is_null($this->map[$b])) { |
|
| 143 | + $this->map[$b] = 'NULL'; |
|
| 144 | 144 | } |
| 145 | 145 | |
| 146 | - $value = $this->map[ $b ]; |
|
| 147 | - $base64EncodedValue = base64_encode( $value ); |
|
| 146 | + $value = $this->map[$b]; |
|
| 147 | + $base64EncodedValue = base64_encode($value); |
|
| 148 | 148 | |
| 149 | - if ( empty( $base64EncodedValue ) || $base64EncodedValue === '' ) { |
|
| 149 | + if (empty($base64EncodedValue) || $base64EncodedValue === '') { |
|
| 150 | 150 | return $string; |
| 151 | 151 | } |
| 152 | 152 | |
| 153 | 153 | // if there is no id copy it from dataRef |
| 154 | - $id = ( !isset( $node->attributes[ 'id' ] ) ) ? ' id="' . $b . '" removeId="true"' : ''; |
|
| 154 | + $id = (!isset($node->attributes['id'])) ? ' id="' . $b . '" removeId="true"' : ''; |
|
| 155 | 155 | |
| 156 | 156 | // introduce dataType for <ec>/<sc> tag handling |
| 157 | - $dataType = ( $this->isAEcOrScTag( $node ) ) ? ' dataType="' . $node->tagname . '"' : ''; |
|
| 157 | + $dataType = ($this->isAEcOrScTag($node)) ? ' dataType="' . $node->tagname . '"' : ''; |
|
| 158 | 158 | |
| 159 | 159 | // replacement |
| 160 | - $d = str_replace( '/', $id . $dataType . ' equiv-text="base64:' . $base64EncodedValue . '"/', $a ); |
|
| 161 | - $a = str_replace( [ '<', '>', '>', '<' ], '', $a ); |
|
| 162 | - $d = str_replace( [ '<', '>', '>', '<' ], '', $d ); |
|
| 160 | + $d = str_replace('/', $id . $dataType . ' equiv-text="base64:' . $base64EncodedValue . '"/', $a); |
|
| 161 | + $a = str_replace(['<', '>', '>', '<'], '', $a); |
|
| 162 | + $d = str_replace(['<', '>', '>', '<'], '', $d); |
|
| 163 | 163 | |
| 164 | 164 | // convert <ec>/<sc> into <ph> |
| 165 | - if ( $this->isAEcOrScTag( $node ) ) { |
|
| 166 | - $d = 'ph' . substr( $d, 2 ); |
|
| 167 | - $d = trim( $d ); |
|
| 165 | + if ($this->isAEcOrScTag($node)) { |
|
| 166 | + $d = 'ph' . substr($d, 2); |
|
| 167 | + $d = trim($d); |
|
| 168 | 168 | } |
| 169 | 169 | |
| 170 | - return str_replace( $a, $d, $string ); |
|
| 170 | + return str_replace($a, $d, $string); |
|
| 171 | 171 | } |
| 172 | 172 | } |
| 173 | 173 | |
@@ -180,11 +180,11 @@ discard block |
||
| 180 | 180 | * |
| 181 | 181 | * @return bool |
| 182 | 182 | */ |
| 183 | - private function stringContainsPcTags( $string, $toBeEscaped ) { |
|
| 184 | - $regex = ( $toBeEscaped ) ? '/<pc (.*?)>/iu' : '/<pc (.*?)>/iu'; |
|
| 185 | - preg_match_all( $regex, $string, $openingPcMatches ); |
|
| 183 | + private function stringContainsPcTags($string, $toBeEscaped) { |
|
| 184 | + $regex = ($toBeEscaped) ? '/<pc (.*?)>/iu' : '/<pc (.*?)>/iu'; |
|
| 185 | + preg_match_all($regex, $string, $openingPcMatches); |
|
| 186 | 186 | |
| 187 | - return ( isset( $openingPcMatches[ 0 ] ) && count( $openingPcMatches[ 0 ] ) > 0 ); |
|
| 187 | + return (isset($openingPcMatches[0]) && count($openingPcMatches[0]) > 0); |
|
| 188 | 188 | } |
| 189 | 189 | |
| 190 | 190 | /** |
@@ -193,28 +193,28 @@ discard block |
||
| 193 | 193 | * |
| 194 | 194 | * @return mixed |
| 195 | 195 | */ |
| 196 | - private function replaceSelfClosedPcTags( $string, $toBeEscaped ) { |
|
| 197 | - if ( $toBeEscaped ) { |
|
| 198 | - $string = str_replace( [ '<', '>' ], [ '<', '>' ], $string ); |
|
| 196 | + private function replaceSelfClosedPcTags($string, $toBeEscaped) { |
|
| 197 | + if ($toBeEscaped) { |
|
| 198 | + $string = str_replace(['<', '>'], ['<', '>'], $string); |
|
| 199 | 199 | } |
| 200 | 200 | |
| 201 | 201 | $regex = '/<pc[^>]+?\/>/iu'; |
| 202 | - preg_match_all( $regex, $string, $selfClosedPcMatches ); |
|
| 202 | + preg_match_all($regex, $string, $selfClosedPcMatches); |
|
| 203 | 203 | |
| 204 | - foreach ( $selfClosedPcMatches[ 0 ] as $match ) { |
|
| 204 | + foreach ($selfClosedPcMatches[0] as $match) { |
|
| 205 | 205 | |
| 206 | - $html = HtmlParser::parse( $match ); |
|
| 207 | - $node = $html[ 0 ]; |
|
| 206 | + $html = HtmlParser::parse($match); |
|
| 207 | + $node = $html[0]; |
|
| 208 | 208 | $attributes = $node->attributes; |
| 209 | 209 | |
| 210 | - if ( isset( $attributes[ 'dataRefStart' ] ) && array_key_exists( $node->attributes[ 'dataRefStart' ], $this->map ) ) { |
|
| 211 | - $replacement = '<ph id="' . $attributes[ 'id' ] . '" dataType="pcSelf" originalData="' . base64_encode( $match ) . '" dataRef="' . $attributes[ 'dataRefStart' ] . '" equiv-text="base64:' . base64_encode( $this->map[ $node->attributes[ 'dataRefStart' ] ] ) . '"/>'; |
|
| 212 | - $string = str_replace( $match, $replacement, $string ); |
|
| 210 | + if (isset($attributes['dataRefStart']) && array_key_exists($node->attributes['dataRefStart'], $this->map)) { |
|
| 211 | + $replacement = '<ph id="' . $attributes['id'] . '" dataType="pcSelf" originalData="' . base64_encode($match) . '" dataRef="' . $attributes['dataRefStart'] . '" equiv-text="base64:' . base64_encode($this->map[$node->attributes['dataRefStart']]) . '"/>'; |
|
| 212 | + $string = str_replace($match, $replacement, $string); |
|
| 213 | 213 | } |
| 214 | 214 | } |
| 215 | 215 | |
| 216 | - if ( $toBeEscaped ) { |
|
| 217 | - $string = str_replace( [ '<', '>' ], [ '<', '>' ], $string ); |
|
| 216 | + if ($toBeEscaped) { |
|
| 217 | + $string = str_replace(['<', '>'], ['<', '>'], $string); |
|
| 218 | 218 | } |
| 219 | 219 | |
| 220 | 220 | return $string; |
@@ -228,12 +228,12 @@ discard block |
||
| 228 | 228 | * |
| 229 | 229 | * @return array |
| 230 | 230 | */ |
| 231 | - private function buildDataRefEndMap( $html ) { |
|
| 231 | + private function buildDataRefEndMap($html) { |
|
| 232 | 232 | $dataRefEndMap = []; |
| 233 | 233 | |
| 234 | - foreach ( $html as $index => $node ) { |
|
| 235 | - if ( $node->tagname === 'pc' ) { |
|
| 236 | - $this->extractDataRefMapRecursively( $node, $dataRefEndMap ); |
|
| 234 | + foreach ($html as $index => $node) { |
|
| 235 | + if ($node->tagname === 'pc') { |
|
| 236 | + $this->extractDataRefMapRecursively($node, $dataRefEndMap); |
|
| 237 | 237 | } |
| 238 | 238 | } |
| 239 | 239 | |
@@ -246,25 +246,25 @@ discard block |
||
| 246 | 246 | * @param object $node |
| 247 | 247 | * @param $dataRefEndMap |
| 248 | 248 | */ |
| 249 | - private function extractDataRefMapRecursively( $node, &$dataRefEndMap ) { |
|
| 250 | - if ( $this->nodeContainsNestedPcTags( $node ) ) { |
|
| 251 | - foreach ( $node->inner_html as $nestedNode ) { |
|
| 252 | - $this->extractDataRefMapRecursively( $nestedNode, $dataRefEndMap ); |
|
| 249 | + private function extractDataRefMapRecursively($node, &$dataRefEndMap) { |
|
| 250 | + if ($this->nodeContainsNestedPcTags($node)) { |
|
| 251 | + foreach ($node->inner_html as $nestedNode) { |
|
| 252 | + $this->extractDataRefMapRecursively($nestedNode, $dataRefEndMap); |
|
| 253 | 253 | } |
| 254 | 254 | } |
| 255 | 255 | |
| 256 | 256 | // EXCLUDE self closed <pc/> |
| 257 | - if ( $node->tagname === 'pc' && $node->self_closed === false ) { |
|
| 258 | - if ( isset( $node->attributes[ 'dataRefEnd' ] ) ) { |
|
| 259 | - $dataRefEnd = $node->attributes[ 'dataRefEnd' ]; |
|
| 260 | - } elseif ( isset( $node->attributes[ 'dataRefStart' ] ) ) { |
|
| 261 | - $dataRefEnd = $node->attributes[ 'dataRefStart' ]; |
|
| 257 | + if ($node->tagname === 'pc' && $node->self_closed === false) { |
|
| 258 | + if (isset($node->attributes['dataRefEnd'])) { |
|
| 259 | + $dataRefEnd = $node->attributes['dataRefEnd']; |
|
| 260 | + } elseif (isset($node->attributes['dataRefStart'])) { |
|
| 261 | + $dataRefEnd = $node->attributes['dataRefStart']; |
|
| 262 | 262 | } else { |
| 263 | 263 | $dataRefEnd = null; |
| 264 | 264 | } |
| 265 | 265 | |
| 266 | 266 | $dataRefEndMap[] = [ |
| 267 | - 'id' => isset( $node->attributes[ 'id' ] ) ? $node->attributes[ 'id' ] : null, |
|
| 267 | + 'id' => isset($node->attributes['id']) ? $node->attributes['id'] : null, |
|
| 268 | 268 | 'dataRefEnd' => $dataRefEnd, |
| 269 | 269 | ]; |
| 270 | 270 | } |
@@ -276,15 +276,15 @@ discard block |
||
| 276 | 276 | * |
| 277 | 277 | * @return string|string[] |
| 278 | 278 | */ |
| 279 | - private function recursiveCleanFromEquivText( $node, $string ) { |
|
| 280 | - if ( $node->has_children ) { |
|
| 281 | - foreach ( $node->inner_html as $childNode ) { |
|
| 282 | - $string = $this->recursiveCleanFromEquivText( $childNode, $string ); |
|
| 279 | + private function recursiveCleanFromEquivText($node, $string) { |
|
| 280 | + if ($node->has_children) { |
|
| 281 | + foreach ($node->inner_html as $childNode) { |
|
| 282 | + $string = $this->recursiveCleanFromEquivText($childNode, $string); |
|
| 283 | 283 | } |
| 284 | 284 | } else { |
| 285 | - if ( isset( $node->attributes[ 'dataRef' ] ) && array_key_exists( $node->attributes[ 'dataRef' ], $this->map ) ) { |
|
| 286 | - $cleaned = preg_replace( '/ equiv-text="(.*?)"/', '', $node->node ); |
|
| 287 | - $string = str_replace( $node->node, $cleaned, $string ); |
|
| 285 | + if (isset($node->attributes['dataRef']) && array_key_exists($node->attributes['dataRef'], $this->map)) { |
|
| 286 | + $cleaned = preg_replace('/ equiv-text="(.*?)"/', '', $node->node); |
|
| 287 | + $string = str_replace($node->node, $cleaned, $string); |
|
| 288 | 288 | } |
| 289 | 289 | } |
| 290 | 290 | |
@@ -299,35 +299,35 @@ discard block |
||
| 299 | 299 | * |
| 300 | 300 | * @return string |
| 301 | 301 | */ |
| 302 | - private function replaceOpeningPcTags( $string, $toBeEscaped ) { |
|
| 303 | - $regex = ( $toBeEscaped ) ? '/<pc (.*?)>/iu' : '/<pc (.*?)>/iu'; |
|
| 304 | - preg_match_all( $regex, $string, $openingPcMatches ); |
|
| 302 | + private function replaceOpeningPcTags($string, $toBeEscaped) { |
|
| 303 | + $regex = ($toBeEscaped) ? '/<pc (.*?)>/iu' : '/<pc (.*?)>/iu'; |
|
| 304 | + preg_match_all($regex, $string, $openingPcMatches); |
|
| 305 | 305 | |
| 306 | - foreach ( $openingPcMatches[ 0 ] as $index => $match ) { |
|
| 307 | - $attr = HtmlParser::getAttributes( $openingPcMatches[ 1 ][ $index ] ); |
|
| 306 | + foreach ($openingPcMatches[0] as $index => $match) { |
|
| 307 | + $attr = HtmlParser::getAttributes($openingPcMatches[1][$index]); |
|
| 308 | 308 | |
| 309 | 309 | // CASE 1 - Missing `dataRefStart` |
| 310 | - if ( isset( $attr[ 'dataRefEnd' ] ) && !isset( $attr[ 'dataRefStart' ] ) ) { |
|
| 311 | - $attr[ 'dataRefStart' ] = $attr[ 'dataRefEnd' ]; |
|
| 310 | + if (isset($attr['dataRefEnd']) && !isset($attr['dataRefStart'])) { |
|
| 311 | + $attr['dataRefStart'] = $attr['dataRefEnd']; |
|
| 312 | 312 | } |
| 313 | 313 | |
| 314 | 314 | // CASE 2 - Missing `dataRefEnd` |
| 315 | - if ( isset( $attr[ 'dataRefStart' ] ) && !isset( $attr[ 'dataRefEnd' ] ) ) { |
|
| 316 | - $attr[ 'dataRefEnd' ] = $attr[ 'dataRefStart' ]; |
|
| 315 | + if (isset($attr['dataRefStart']) && !isset($attr['dataRefEnd'])) { |
|
| 316 | + $attr['dataRefEnd'] = $attr['dataRefStart']; |
|
| 317 | 317 | } |
| 318 | 318 | |
| 319 | - if ( isset( $attr[ 'dataRefStart' ] ) ) { |
|
| 319 | + if (isset($attr['dataRefStart'])) { |
|
| 320 | 320 | $startOriginalData = $match; // opening <pc> |
| 321 | - $startValue = $this->map[ $attr[ 'dataRefStart' ] ] ? $this->map[ $attr[ 'dataRefStart' ] ] : 'NULL'; //handling null values in original data map |
|
| 322 | - $base64EncodedStartValue = base64_encode( $startValue ); |
|
| 323 | - $base64StartOriginalData = base64_encode( $startOriginalData ); |
|
| 321 | + $startValue = $this->map[$attr['dataRefStart']] ? $this->map[$attr['dataRefStart']] : 'NULL'; //handling null values in original data map |
|
| 322 | + $base64EncodedStartValue = base64_encode($startValue); |
|
| 323 | + $base64StartOriginalData = base64_encode($startOriginalData); |
|
| 324 | 324 | |
| 325 | 325 | // conversion for opening <pc> tag |
| 326 | - $openingPcConverted = '<ph ' . ( ( isset( $attr[ 'id' ] ) ) ? 'id="' . $attr[ 'id' ] . '_1"' : '' ) . ' dataType="pcStart" originalData="' . $base64StartOriginalData . '" dataRef="' |
|
| 327 | - . $attr[ 'dataRefStart' ] . '" equiv-text="base64:' |
|
| 326 | + $openingPcConverted = '<ph ' . ((isset($attr['id'])) ? 'id="' . $attr['id'] . '_1"' : '') . ' dataType="pcStart" originalData="' . $base64StartOriginalData . '" dataRef="' |
|
| 327 | + . $attr['dataRefStart'] . '" equiv-text="base64:' |
|
| 328 | 328 | . $base64EncodedStartValue . '"/>'; |
| 329 | 329 | |
| 330 | - $string = str_replace( $startOriginalData, $openingPcConverted, $string ); |
|
| 330 | + $string = str_replace($startOriginalData, $openingPcConverted, $string); |
|
| 331 | 331 | } |
| 332 | 332 | } |
| 333 | 333 | |
@@ -344,34 +344,34 @@ discard block |
||
| 344 | 344 | * |
| 345 | 345 | * @return string |
| 346 | 346 | */ |
| 347 | - private function replaceClosingPcTags( $string, $toBeEscaped, $dataRefEndMap = [] ) { |
|
| 348 | - $regex = ( $toBeEscaped ) ? '/<\/pc>/iu' : '/<\/pc>/iu'; |
|
| 349 | - preg_match_all( $regex, $string, $closingPcMatches, PREG_OFFSET_CAPTURE ); |
|
| 347 | + private function replaceClosingPcTags($string, $toBeEscaped, $dataRefEndMap = []) { |
|
| 348 | + $regex = ($toBeEscaped) ? '/<\/pc>/iu' : '/<\/pc>/iu'; |
|
| 349 | + preg_match_all($regex, $string, $closingPcMatches, PREG_OFFSET_CAPTURE); |
|
| 350 | 350 | $delta = 0; |
| 351 | 351 | |
| 352 | - foreach ( $closingPcMatches[ 0 ] as $index => $match ) { |
|
| 353 | - $offset = $match[ 1 ]; |
|
| 354 | - $length = strlen( $match[ 0 ] ); |
|
| 355 | - $attr = $dataRefEndMap[ $index ]; |
|
| 352 | + foreach ($closingPcMatches[0] as $index => $match) { |
|
| 353 | + $offset = $match[1]; |
|
| 354 | + $length = strlen($match[0]); |
|
| 355 | + $attr = $dataRefEndMap[$index]; |
|
| 356 | 356 | |
| 357 | - if ( !empty( $attr ) && isset( $attr[ 'dataRefEnd' ] ) ) { |
|
| 358 | - $endOriginalData = $match[ 0 ]; // </pc> |
|
| 359 | - $endValue = $this->map[ $attr[ 'dataRefEnd' ] ] ?: 'NULL'; |
|
| 360 | - $base64EncodedEndValue = base64_encode( $endValue ); |
|
| 361 | - $base64EndOriginalData = base64_encode( $endOriginalData ); |
|
| 357 | + if (!empty($attr) && isset($attr['dataRefEnd'])) { |
|
| 358 | + $endOriginalData = $match[0]; // </pc> |
|
| 359 | + $endValue = $this->map[$attr['dataRefEnd']] ?: 'NULL'; |
|
| 360 | + $base64EncodedEndValue = base64_encode($endValue); |
|
| 361 | + $base64EndOriginalData = base64_encode($endOriginalData); |
|
| 362 | 362 | |
| 363 | 363 | // conversion for closing <pc> tag |
| 364 | - $closingPcConverted = '<ph ' . ( ( isset( $attr[ 'id' ] ) ) ? 'id="' . $attr[ 'id' ] . '_2"' : '' ) . ' dataType="pcEnd" originalData="' . $base64EndOriginalData . '" dataRef="' |
|
| 365 | - . $attr[ 'dataRefEnd' ] . '" equiv-text="base64:' . $base64EncodedEndValue . '"/>'; |
|
| 364 | + $closingPcConverted = '<ph ' . ((isset($attr['id'])) ? 'id="' . $attr['id'] . '_2"' : '') . ' dataType="pcEnd" originalData="' . $base64EndOriginalData . '" dataRef="' |
|
| 365 | + . $attr['dataRefEnd'] . '" equiv-text="base64:' . $base64EncodedEndValue . '"/>'; |
|
| 366 | 366 | |
| 367 | - $realOffset = ( $delta === 0 ) ? $offset : ( $offset + $delta ); |
|
| 367 | + $realOffset = ($delta === 0) ? $offset : ($offset + $delta); |
|
| 368 | 368 | |
| 369 | - $string = substr_replace( $string, $closingPcConverted, $realOffset, $length ); |
|
| 370 | - $delta = $delta + strlen( $closingPcConverted ) - $length; |
|
| 369 | + $string = substr_replace($string, $closingPcConverted, $realOffset, $length); |
|
| 370 | + $delta = $delta + strlen($closingPcConverted) - $length; |
|
| 371 | 371 | } |
| 372 | 372 | } |
| 373 | 373 | |
| 374 | - return !is_array( $string ) ? $string : implode( $string ); |
|
| 374 | + return !is_array($string) ? $string : implode($string); |
|
| 375 | 375 | } |
| 376 | 376 | |
| 377 | 377 | /** |
@@ -379,13 +379,13 @@ discard block |
||
| 379 | 379 | * |
| 380 | 380 | * @return bool |
| 381 | 381 | */ |
| 382 | - private function nodeContainsNestedPcTags( $node ) { |
|
| 383 | - if ( !$node->has_children ) { |
|
| 382 | + private function nodeContainsNestedPcTags($node) { |
|
| 383 | + if (!$node->has_children) { |
|
| 384 | 384 | return false; |
| 385 | 385 | } |
| 386 | 386 | |
| 387 | - foreach ( $node->inner_html as $nestedNode ) { |
|
| 388 | - if ( $nestedNode->tagname === 'pc' && ( isset( $node->attributes[ 'dataRefEnd' ] ) || isset( $node->attributes[ 'dataRefStart' ] ) ) ) { |
|
| 387 | + foreach ($node->inner_html as $nestedNode) { |
|
| 388 | + if ($nestedNode->tagname === 'pc' && (isset($node->attributes['dataRefEnd']) || isset($node->attributes['dataRefStart']))) { |
|
| 389 | 389 | return true; |
| 390 | 390 | } |
| 391 | 391 | } |
@@ -398,18 +398,18 @@ discard block |
||
| 398 | 398 | * |
| 399 | 399 | * @return string |
| 400 | 400 | */ |
| 401 | - public function restore( $string ) { |
|
| 401 | + public function restore($string) { |
|
| 402 | 402 | // if map is empty return string as is |
| 403 | - if ( empty( $this->map ) ) { |
|
| 403 | + if (empty($this->map)) { |
|
| 404 | 404 | return $string; |
| 405 | 405 | } |
| 406 | 406 | |
| 407 | 407 | // remove any empty equiv-text="" attribute before parsing |
| 408 | - $string = str_replace( ' equiv-text=""', '', $string ); |
|
| 409 | - $html = HtmlParser::parse( $string ); |
|
| 408 | + $string = str_replace(' equiv-text=""', '', $string); |
|
| 409 | + $html = HtmlParser::parse($string); |
|
| 410 | 410 | |
| 411 | - foreach ( $html as $node ) { |
|
| 412 | - $string = $this->recursiveRemoveOriginalData( $node, $string ); |
|
| 411 | + foreach ($html as $node) { |
|
| 412 | + $string = $this->recursiveRemoveOriginalData($node, $string); |
|
| 413 | 413 | } |
| 414 | 414 | |
| 415 | 415 | return $string; |
@@ -421,76 +421,76 @@ discard block |
||
| 421 | 421 | * |
| 422 | 422 | * @return string|string[] |
| 423 | 423 | */ |
| 424 | - private function recursiveRemoveOriginalData( $node, $string ) { |
|
| 425 | - if ( $node->has_children ) { |
|
| 426 | - foreach ( $node->inner_html as $childNode ) { |
|
| 427 | - $string = $this->recursiveRemoveOriginalData( $childNode, $string ); |
|
| 424 | + private function recursiveRemoveOriginalData($node, $string) { |
|
| 425 | + if ($node->has_children) { |
|
| 426 | + foreach ($node->inner_html as $childNode) { |
|
| 427 | + $string = $this->recursiveRemoveOriginalData($childNode, $string); |
|
| 428 | 428 | } |
| 429 | 429 | } else { |
| 430 | 430 | |
| 431 | - if ( !isset( $node->attributes[ 'dataRef' ] ) ) { |
|
| 431 | + if (!isset($node->attributes['dataRef'])) { |
|
| 432 | 432 | return $string; |
| 433 | 433 | } |
| 434 | 434 | |
| 435 | - $a = $node->node; // complete match. Eg: <ph id="source1" dataRef="source1"/> |
|
| 436 | - $b = $node->attributes[ 'dataRef' ]; // map identifier. Eg: source1 |
|
| 437 | - $c = $node->terminator; // terminator: Eg: > |
|
| 435 | + $a = $node->node; // complete match. Eg: <ph id="source1" dataRef="source1"/> |
|
| 436 | + $b = $node->attributes['dataRef']; // map identifier. Eg: source1 |
|
| 437 | + $c = $node->terminator; // terminator: Eg: > |
|
| 438 | 438 | |
| 439 | 439 | // if the dataRef is a key of the map (even when its value is an empty string), |
| 440 | 440 | // the base64-encoded value is computed below; |
| 441 | 441 | // otherwise skip this node |
| 442 | - if ( !in_array( $b, array_keys( $this->map ) ) ) { |
|
| 442 | + if (!in_array($b, array_keys($this->map))) { |
|
| 443 | 443 | return $string; |
| 444 | 444 | } |
| 445 | 445 | |
| 446 | 446 | // check if is null, in this case convert it to NULL string |
| 447 | - if ( is_null( $this->map[ $b ] ) ) { |
|
| 448 | - $this->map[ $b ] = 'NULL'; |
|
| 447 | + if (is_null($this->map[$b])) { |
|
| 448 | + $this->map[$b] = 'NULL'; |
|
| 449 | 449 | } |
| 450 | 450 | |
| 451 | 451 | // remove id? |
| 452 | - $removeId = ( isset( $node->attributes[ 'removeId' ] ) && $node->attributes[ 'removeId' ] === "true" ) ? ' id="' . $b . '" removeId="true"' : ''; |
|
| 452 | + $removeId = (isset($node->attributes['removeId']) && $node->attributes['removeId'] === "true") ? ' id="' . $b . '" removeId="true"' : ''; |
|
| 453 | 453 | |
| 454 | 454 | // grab dataType attribute for <ec>/<sc> tag handling |
| 455 | - $dataType = ( $this->wasAEcOrScTag( $node ) ) ? ' dataType="' . $node->attributes[ 'dataType' ] . '"' : ''; |
|
| 455 | + $dataType = ($this->wasAEcOrScTag($node)) ? ' dataType="' . $node->attributes['dataType'] . '"' : ''; |
|
| 456 | 456 | |
| 457 | - $d = str_replace( $removeId . $dataType . ' equiv-text="base64:' . base64_encode( $this->map[ $b ] ) . '"/' . $c, '/' . $c, $a ); |
|
| 457 | + $d = str_replace($removeId . $dataType . ' equiv-text="base64:' . base64_encode($this->map[$b]) . '"/' . $c, '/' . $c, $a); |
|
| 458 | 458 | |
| 459 | 459 | // replace original <ec>/<sc> tag |
| 460 | - if ( $this->wasAEcOrScTag( $node ) ) { |
|
| 461 | - $d = $node->attributes[ 'dataType' ] . substr( $d, 3 ); |
|
| 462 | - $d = trim( $d ); |
|
| 460 | + if ($this->wasAEcOrScTag($node)) { |
|
| 461 | + $d = $node->attributes['dataType'] . substr($d, 3); |
|
| 462 | + $d = trim($d); |
|
| 463 | 463 | } |
| 464 | 464 | |
| 465 | 465 | // replace only content tag, no matter if the string is encoded or not |
| 466 | 466 | // in this way we can handle string with mixed tags (encoded and not-encoded) |
| 467 | 467 | // in the same string |
| 468 | - $a = $this->purgeTags( $a ); |
|
| 469 | - $d = $this->purgeTags( $d ); |
|
| 468 | + $a = $this->purgeTags($a); |
|
| 469 | + $d = $this->purgeTags($d); |
|
| 470 | 470 | |
| 471 | - $string = str_replace( $a, $d, $string ); |
|
| 471 | + $string = str_replace($a, $d, $string); |
|
| 472 | 472 | |
| 473 | 473 | // restoring <pc/> self-closed here |
| 474 | - if ( Strings::contains( 'dataType="pcSelf"', $d ) ) { |
|
| 475 | - preg_match( '/\s?originalData="(.*?)"\s?/', $d, $originalDataMatches ); |
|
| 474 | + if (Strings::contains('dataType="pcSelf"', $d)) { |
|
| 475 | + preg_match('/\s?originalData="(.*?)"\s?/', $d, $originalDataMatches); |
|
| 476 | 476 | |
| 477 | - if ( isset( $originalDataMatches[ 1 ] ) ) { |
|
| 478 | - $originalData = base64_decode( $originalDataMatches[ 1 ] ); |
|
| 479 | - $originalData = $this->purgeTags( $originalData ); |
|
| 480 | - $string = str_replace( $d, $originalData, $string ); |
|
| 477 | + if (isset($originalDataMatches[1])) { |
|
| 478 | + $originalData = base64_decode($originalDataMatches[1]); |
|
| 479 | + $originalData = $this->purgeTags($originalData); |
|
| 480 | + $string = str_replace($d, $originalData, $string); |
|
| 481 | 481 | } |
| 482 | 482 | } |
| 483 | 483 | |
| 484 | 484 | // restoring <pc> tags here |
| 485 | 485 | // if the <ph> tag has originalData and its dataType is pcStart or pcEnd, |
| 486 | 486 | // replace with original data |
| 487 | - if ( Strings::contains( 'dataType="pcStart"', $d ) || Strings::contains( 'dataType="pcEnd"', $d ) ) { |
|
| 488 | - preg_match( '/\s?originalData="(.*?)"\s?/', $d, $originalDataMatches ); |
|
| 487 | + if (Strings::contains('dataType="pcStart"', $d) || Strings::contains('dataType="pcEnd"', $d)) { |
|
| 488 | + preg_match('/\s?originalData="(.*?)"\s?/', $d, $originalDataMatches); |
|
| 489 | 489 | |
| 490 | - if ( isset( $originalDataMatches[ 1 ] ) ) { |
|
| 491 | - $originalData = base64_decode( $originalDataMatches[ 1 ] ); |
|
| 492 | - $originalData = $this->purgeTags( $originalData ); |
|
| 493 | - $string = str_replace( $d, $originalData, $string ); |
|
| 490 | + if (isset($originalDataMatches[1])) { |
|
| 491 | + $originalData = base64_decode($originalDataMatches[1]); |
|
| 492 | + $originalData = $this->purgeTags($originalData); |
|
| 493 | + $string = str_replace($d, $originalData, $string); |
|
| 494 | 494 | } |
| 495 | 495 | } |
| 496 | 496 | } |
@@ -503,8 +503,8 @@ discard block |
||
| 503 | 503 | * |
| 504 | 504 | * @return string |
| 505 | 505 | */ |
| 506 | - private function purgeTags( $string ) { |
|
| 507 | - return str_replace( [ '<', '>', '<', '>' ], '', $string ); |
|
| 506 | + private function purgeTags($string) { |
|
| 507 | + return str_replace(['<', '>', '<', '>'], '', $string); |
|
| 508 | 508 | } |
| 509 | 509 | |
| 510 | 510 | /** |
@@ -514,8 +514,8 @@ discard block |
||
| 514 | 514 | * |
| 515 | 515 | * @return bool |
| 516 | 516 | */ |
| 517 | - private function isAEcOrScTag( $node ) { |
|
| 518 | - return ( $node->tagname === 'ec' || $node->tagname === 'sc' ); |
|
| 517 | + private function isAEcOrScTag($node) { |
|
| 518 | + return ($node->tagname === 'ec' || $node->tagname === 'sc'); |
|
| 519 | 519 | } |
| 520 | 520 | |
| 521 | 521 | /** |
@@ -526,7 +526,7 @@ discard block |
||
| 526 | 526 | * |
| 527 | 527 | * @return bool |
| 528 | 528 | */ |
| 529 | - private function wasAEcOrScTag( $node ) { |
|
| 530 | - return ( isset( $node->attributes[ 'dataType' ] ) && ( $node->attributes[ 'dataType' ] === 'ec' || $node->attributes[ 'dataType' ] === 'sc' ) ); |
|
| 529 | + private function wasAEcOrScTag($node) { |
|
| 530 | + return (isset($node->attributes['dataType']) && ($node->attributes['dataType'] === 'ec' || $node->attributes['dataType'] === 'sc')); |
|
| 531 | 531 | } |
| 532 | 532 | } |