@@ -17,392 +17,392 @@ |
||
17 | 17 | */ |
18 | 18 | class CleanHtmlService implements SingletonInterface |
19 | 19 | { |
20 | - /** |
|
21 | - * Enable Debug comment in footer. |
|
22 | - * |
|
23 | - * @var bool |
|
24 | - */ |
|
25 | - protected $debugComment = false; |
|
26 | - |
|
27 | - /** |
|
28 | - * Format Type. |
|
29 | - * |
|
30 | - * @var int |
|
31 | - */ |
|
32 | - protected $formatType = 0; |
|
33 | - |
|
34 | - /** |
|
35 | - * Tab character. |
|
36 | - * |
|
37 | - * @var string |
|
38 | - */ |
|
39 | - protected $tab = "\t"; |
|
40 | - |
|
41 | - /** |
|
42 | - * Newline character. |
|
43 | - * |
|
44 | - * @var string |
|
45 | - */ |
|
46 | - protected $newline = "\n"; |
|
47 | - |
|
48 | - /** |
|
49 | - * Configured extra header comment. |
|
50 | - * |
|
51 | - * @var string |
|
52 | - */ |
|
53 | - protected $headerComment = ''; |
|
54 | - |
|
55 | - /** |
|
56 | - * Empty space char. |
|
57 | - * |
|
58 | - * @var string |
|
59 | - */ |
|
60 | - protected $emptySpaceChar = ' '; |
|
61 | - |
|
62 | - /** |
|
63 | - * Set variables based on given config. |
|
64 | - */ |
|
65 | - public function setVariables(array $config): void |
|
66 | - { |
|
67 | - if (!empty($config)) { |
|
68 | - if ($config['formatHtml'] && is_numeric($config['formatHtml'])) { |
|
69 | - $this->formatType = (int) $config['formatHtml']; |
|
70 | - } |
|
71 | - |
|
72 | - if ($config['formatHtml.']['tabSize'] && is_numeric($config['formatHtml.']['tabSize'])) { |
|
73 | - $this->tab = str_pad('', (int) $config['formatHtml.']['tabSize'], ' '); |
|
74 | - } |
|
75 | - |
|
76 | - if (isset($config['formatHtml.']['debugComment'])) { |
|
77 | - $this->debugComment = (bool) $config['formatHtml.']['debugComment']; |
|
78 | - } |
|
79 | - |
|
80 | - if (isset($config['headerComment'])) { |
|
81 | - $this->headerComment = $config['headerComment']; |
|
82 | - } |
|
83 | - |
|
84 | - if (isset($config['dropEmptySpaceChar']) && (bool) $config['dropEmptySpaceChar']) { |
|
85 | - $this->emptySpaceChar = ''; |
|
86 | - } |
|
87 | - } |
|
88 | - } |
|
89 | - |
|
90 | - /** |
|
91 | - * Clean given HTML with formatter. |
|
92 | - * |
|
93 | - * @return string |
|
94 | - */ |
|
95 | - public function clean(string $html, array $config = []) |
|
96 | - { |
|
97 | - if (!empty($config)) { |
|
98 | - $this->setVariables($config); |
|
99 | - } |
|
100 | - // convert line-breaks to UNIX |
|
101 | - $this->convNlOs($html); |
|
102 | - |
|
103 | - $manipulations = []; |
|
104 | - |
|
105 | - if (isset($config['removeGenerator']) && (bool) $config['removeGenerator']) { |
|
106 | - $manipulations['removeGenerator'] = GeneralUtility::makeInstance(RemoveGenerator::class); |
|
107 | - } |
|
108 | - |
|
109 | - if (isset($config['removeComments']) && (bool) $config['removeComments']) { |
|
110 | - $manipulations['removeComments'] = GeneralUtility::makeInstance(RemoveComments::class); |
|
111 | - } |
|
112 | - |
|
113 | - if (!empty($this->headerComment)) { |
|
114 | - $this->includeHeaderComment($html); |
|
115 | - } |
|
116 | - |
|
117 | - foreach ($manipulations as $key => $manipulation) { |
|
118 | - /** @var ManipulationInterface $manipulation */ |
|
119 | - $configuration = isset($config[$key.'.']) && \is_array($config[$key.'.']) ? $config[$key.'.'] : []; |
|
120 | - $html = $manipulation->manipulate($html, $configuration); |
|
121 | - } |
|
122 | - |
|
123 | - // cleanup HTML5 self-closing elements |
|
124 | - if (!isset($GLOBALS['TSFE']->config['config']['doctype']) |
|
125 | - || 'x' !== substr($GLOBALS['TSFE']->config['config']['doctype'], 0, 1)) { |
|
126 | - $html = preg_replace( |
|
127 | - '/<((?:area|base|br|col|embed|hr|img|input|link|meta|param|source|track|wbr)\s[^>\\\\]+?)\s?\/>/', |
|
128 | - '<$1>', |
|
129 | - $html |
|
130 | - ); |
|
131 | - } |
|
132 | - |
|
133 | - if ($this->formatType > 0) { |
|
134 | - $html = $this->formatHtml($html); |
|
135 | - } |
|
136 | - // remove white space after line ending |
|
137 | - $this->rTrimLines($html); |
|
138 | - |
|
139 | - // recover line-breaks |
|
140 | - if (Environment::isWindows()) { |
|
141 | - $html = str_replace($this->newline, "\r\n", $html); |
|
142 | - } |
|
143 | - |
|
144 | - return $html; |
|
145 | - } |
|
146 | - |
|
147 | - /** |
|
148 | - * Formats the (X)HTML code: |
|
149 | - * - taps according to the hirarchy of the tags |
|
150 | - * - removes empty spaces between tags |
|
151 | - * - removes linebreaks within tags (spares where necessary: pre, textarea, comments, ..) |
|
152 | - * choose from five options: |
|
153 | - * 0 => off |
|
154 | - * 1 => no line break at all (code in one line) |
|
155 | - * 2 => minimalistic line breaks (structure defining box-elements) |
|
156 | - * 3 => aesthetic line breaks (important box-elements) |
|
157 | - * 4 => logic line breaks (all box-elements) |
|
158 | - * 5 => max line breaks (all elements). |
|
159 | - */ |
|
160 | - protected function formatHtml(string $html):string |
|
161 | - { |
|
162 | - // Save original formated pre, textarea, comments, styles and scripts & replace them with markers |
|
163 | - preg_match_all( |
|
164 | - '/(?s)((<!--.*?-->)|(<[ \n\r]*pre[^>]*>.*?<[ \n\r]*\/pre[^>]*>)|(<[ \n\r]*textarea[^>]*>.*?<[ \n\r]*\/textarea[^>]*>)|(<[ \n\r]*style[^>]*>.*?<[ \n\r]*\/style[^>]*>)|(<[ \n\r]*script[^>]*>.*?<[ \n\r]*\/script[^>]*>))/im', |
|
165 | - $html, |
|
166 | - $matches |
|
167 | - ); |
|
168 | - $noFormat = $matches[0]; // do not format these block elements |
|
169 | - for ($i = 0; $i < \count($noFormat); ++$i) { |
|
170 | - $html = str_replace($noFormat[$i], "\n<!-- ELEMENT {$i} -->", $html); |
|
171 | - } |
|
172 | - |
|
173 | - // define box elements for formatting |
|
174 | - $trueBoxElements = 'address|blockquote|center|dir|div|dl|fieldset|form|h1|h2|h3|h4|h5|h6|hr|isindex|menu|noframes|noscript|ol|p|pre|table|ul|article|aside|details|figcaption|figure|footer|header|hgroup|menu|nav|section'; |
|
175 | - $functionalBoxElements = 'dd|dt|frameset|li|tbody|td|tfoot|th|thead|tr|colgroup'; |
|
176 | - $usableBoxElements = 'applet|button|del|iframe|ins|map|object|script'; |
|
177 | - $imagineBoxElements = 'html|body|head|meta|title|link|script|base|!--'; |
|
178 | - $allBoxLikeElements = '(?>'.$trueBoxElements.'|'.$functionalBoxElements.'|'.$usableBoxElements.'|'.$imagineBoxElements.')'; |
|
179 | - $esteticBoxLikeElements = '(?>html|head|body|meta name|title|div|table|h1|h2|h3|h4|h5|h6|p|form|pre|center|!--)'; |
|
180 | - $structureBoxLikeElements = '(?>html|head|body|div|!--)'; |
|
181 | - |
|
182 | - // split html into it's elements |
|
183 | - $htmlArrayTemp = preg_split( |
|
184 | - '/(<(?:[^<>]+(?:"[^"]*"|\'[^\']*\')?)+>)/', |
|
185 | - $html, |
|
186 | - -1, |
|
187 | - \PREG_SPLIT_DELIM_CAPTURE | \PREG_SPLIT_NO_EMPTY |
|
188 | - ); |
|
189 | - |
|
190 | - if (false === $htmlArrayTemp) { |
|
191 | - // Restore saved comments, styles and scripts |
|
192 | - for ($i = 0; $i < \count($noFormat); ++$i) { |
|
193 | - $html = str_replace("<!-- ELEMENT {$i} -->", $noFormat[$i], $html); |
|
194 | - } |
|
195 | - |
|
196 | - return $html; |
|
197 | - } |
|
198 | - // remove empty lines |
|
199 | - $htmlArray = ['']; |
|
200 | - $index = 1; |
|
201 | - for ($x = 0; $x < \count($htmlArrayTemp); ++$x) { |
|
202 | - $text = trim($htmlArrayTemp[$x]); |
|
203 | - $htmlArray[$index] = '' !== $text ? $htmlArrayTemp[$x] : $this->emptySpaceChar; |
|
204 | - ++$index; |
|
205 | - } |
|
206 | - |
|
207 | - // rebuild html |
|
208 | - $html = ''; |
|
209 | - $tabs = 0; |
|
210 | - for ($x = 0; $x < \count($htmlArray); ++$x) { |
|
211 | - $htmlArrayBefore = $htmlArray[$x - 1] ?? ''; |
|
212 | - $htmlArrayCurrent = $htmlArray[$x] ?? ''; |
|
213 | - |
|
214 | - // check if the element should stand in a new line |
|
215 | - $newline = false; |
|
216 | - if ('<?xml' == substr($htmlArrayBefore, 0, 5)) { |
|
217 | - $newline = true; |
|
218 | - } elseif (2 == $this->formatType && ( // minimalistic line break |
|
219 | - // this element has a line break before itself |
|
220 | - preg_match( |
|
221 | - '/<'.$structureBoxLikeElements.'(.*)>/Usi', |
|
222 | - $htmlArrayCurrent |
|
223 | - ) || preg_match( |
|
224 | - '/<'.$structureBoxLikeElements.'(.*) \/>/Usi', |
|
225 | - $htmlArrayCurrent |
|
226 | - ) // one element before is a element that has a line break after |
|
227 | - || preg_match( |
|
228 | - '/<\/'.$structureBoxLikeElements.'(.*)>/Usi', |
|
229 | - $htmlArrayBefore |
|
230 | - ) || '<!--' == substr( |
|
231 | - $htmlArrayBefore, |
|
232 | - 0, |
|
233 | - 4 |
|
234 | - ) || preg_match('/<'.$structureBoxLikeElements.'(.*) \/>/Usi', $htmlArrayBefore)) |
|
235 | - ) { |
|
236 | - $newline = true; |
|
237 | - } elseif (3 == $this->formatType && ( // aestetic line break |
|
238 | - // this element has a line break before itself |
|
239 | - preg_match( |
|
240 | - '/<'.$esteticBoxLikeElements.'(.*)>/Usi', |
|
241 | - $htmlArrayCurrent |
|
242 | - ) || preg_match( |
|
243 | - '/<'.$esteticBoxLikeElements.'(.*) \/>/Usi', |
|
244 | - $htmlArrayCurrent |
|
245 | - ) // one element before is a element that has a line break after |
|
246 | - || preg_match('/<\/'.$esteticBoxLikeElements.'(.*)>/Usi', $htmlArrayBefore) || '<!--' == substr( |
|
247 | - $htmlArrayBefore, |
|
248 | - 0, |
|
249 | - 4 |
|
250 | - ) || preg_match('/<'.$esteticBoxLikeElements.'(.*) \/>/Usi', $htmlArrayBefore)) |
|
251 | - ) { |
|
252 | - $newline = true; |
|
253 | - } elseif ($this->formatType >= 4 && ( // logical line break |
|
254 | - // this element has a line break before itself |
|
255 | - preg_match( |
|
256 | - '/<'.$allBoxLikeElements.'(.*)>/Usi', |
|
257 | - $htmlArrayCurrent |
|
258 | - ) || preg_match( |
|
259 | - '/<'.$allBoxLikeElements.'(.*) \/>/Usi', |
|
260 | - $htmlArrayCurrent |
|
261 | - ) // one element before is a element that has a line break after |
|
262 | - || preg_match('/<\/'.$allBoxLikeElements.'(.*)>/Usi', $htmlArrayBefore) || '<!--' == substr( |
|
263 | - $htmlArrayBefore, |
|
264 | - 0, |
|
265 | - 4 |
|
266 | - ) || preg_match('/<'.$allBoxLikeElements.'(.*) \/>/Usi', $htmlArrayBefore)) |
|
267 | - ) { |
|
268 | - $newline = true; |
|
269 | - } |
|
270 | - |
|
271 | - // count down a tab |
|
272 | - if ('</' == substr($htmlArrayCurrent, 0, 2)) { |
|
273 | - --$tabs; |
|
274 | - } |
|
275 | - |
|
276 | - // add tabs and line breaks in front of the current tag |
|
277 | - if ($newline) { |
|
278 | - $html .= $this->newline; |
|
279 | - for ($y = 0; $y < $tabs; ++$y) { |
|
280 | - $html .= $this->tab; |
|
281 | - } |
|
282 | - } |
|
283 | - |
|
284 | - // remove white spaces and line breaks and add current tag to the html-string |
|
285 | - if ('<![CDATA[' == substr($htmlArrayCurrent, 0, 9) // remove multiple white space in CDATA / XML |
|
286 | - || '<?xml' == substr($htmlArrayCurrent, 0, 5) |
|
287 | - ) { |
|
288 | - $html .= $this->killWhiteSpace($htmlArrayCurrent); |
|
289 | - } else { // remove all line breaks |
|
290 | - $html .= $this->killLineBreaks($htmlArrayCurrent); |
|
291 | - } |
|
292 | - |
|
293 | - // count up a tab |
|
294 | - if ('<' == substr($htmlArrayCurrent, 0, 1) && '/' != substr($htmlArrayCurrent, 1, 1)) { |
|
295 | - if (' ' !== substr($htmlArrayCurrent, 1, 1) |
|
296 | - && 'img' !== substr($htmlArrayCurrent, 1, 3) |
|
297 | - && 'source' !== substr($htmlArrayCurrent, 1, 6) |
|
298 | - && 'br' !== substr($htmlArrayCurrent, 1, 2) |
|
299 | - && 'hr' !== substr($htmlArrayCurrent, 1, 2) |
|
300 | - && 'input' !== substr($htmlArrayCurrent, 1, 5) |
|
301 | - && 'link' !== substr($htmlArrayCurrent, 1, 4) |
|
302 | - && 'meta' !== substr($htmlArrayCurrent, 1, 4) |
|
303 | - && 'col ' !== substr($htmlArrayCurrent, 1, 4) |
|
304 | - && 'frame' !== substr($htmlArrayCurrent, 1, 5) |
|
305 | - && 'isindex' !== substr($htmlArrayCurrent, 1, 7) |
|
306 | - && 'param' !== substr($htmlArrayCurrent, 1, 5) |
|
307 | - && 'area' !== substr($htmlArrayCurrent, 1, 4) |
|
308 | - && 'base' !== substr($htmlArrayCurrent, 1, 4) |
|
309 | - && '<!' !== substr($htmlArrayCurrent, 0, 2) |
|
310 | - && '<?xml' !== substr($htmlArrayCurrent, 0, 5) |
|
311 | - ) { |
|
312 | - ++$tabs; |
|
313 | - } |
|
314 | - } |
|
315 | - } |
|
316 | - |
|
317 | - // Remove empty lines |
|
318 | - if ($this->formatType > 1) { |
|
319 | - $this->removeEmptyLines($html); |
|
320 | - } |
|
321 | - |
|
322 | - // Restore saved comments, styles and scripts |
|
323 | - for ($i = 0; $i < \count($noFormat); ++$i) { |
|
324 | - $html = str_replace("<!-- ELEMENT {$i} -->", $noFormat[$i], $html); |
|
325 | - } |
|
326 | - |
|
327 | - // include debug comment at the end |
|
328 | - if (0 != $tabs && true === $this->debugComment) { |
|
329 | - $html .= "<!-- {$tabs} open elements found -->"; |
|
330 | - } |
|
331 | - |
|
332 | - return $html; |
|
333 | - } |
|
334 | - |
|
335 | - /** |
|
336 | - * Remove ALL line breaks and multiple white space. |
|
337 | - * |
|
338 | - * @param string $html |
|
339 | - * |
|
340 | - * @return string |
|
341 | - */ |
|
342 | - protected function killLineBreaks($html) |
|
343 | - { |
|
344 | - $html = str_replace($this->newline, '', $html); |
|
345 | - |
|
346 | - return preg_replace('/\s\s+/u', ' ', $html); |
|
347 | - // ? return preg_replace('/\n|\s+(\s)/u', '$1', $html); |
|
348 | - } |
|
349 | - |
|
350 | - /** |
|
351 | - * Remove multiple white space, keeps line breaks. |
|
352 | - */ |
|
353 | - protected function killWhiteSpace(string $html): string |
|
354 | - { |
|
355 | - $temp = explode($this->newline, $html); |
|
356 | - for ($i = 0; $i < \count($temp); ++$i) { |
|
357 | - if (!trim($temp[$i])) { |
|
358 | - unset($temp[$i]); |
|
359 | - continue; |
|
360 | - } |
|
361 | - |
|
362 | - $temp[$i] = trim($temp[$i]); |
|
363 | - $temp[$i] = preg_replace('/\s\s+/', ' ', $temp[$i]); |
|
364 | - } |
|
365 | - |
|
366 | - return implode($this->newline, $temp); |
|
367 | - } |
|
368 | - |
|
369 | - /** |
|
370 | - * Remove white space at the end of lines, keeps other white space and line breaks. |
|
371 | - */ |
|
372 | - protected function rTrimLines(string &$html): void |
|
373 | - { |
|
374 | - $html = preg_replace('/\s+$/m', '', $html); |
|
375 | - } |
|
376 | - |
|
377 | - /** |
|
378 | - * Convert newlines according to the current OS. |
|
379 | - */ |
|
380 | - protected function convNlOs(string &$html): void |
|
381 | - { |
|
382 | - $html = preg_replace("(\r\n|\r)", $this->newline, $html); |
|
383 | - } |
|
384 | - |
|
385 | - /** |
|
386 | - * Remove empty lines. |
|
387 | - */ |
|
388 | - protected function removeEmptyLines(string &$html): void |
|
389 | - { |
|
390 | - $temp = explode($this->newline, $html); |
|
391 | - $result = []; |
|
392 | - for ($i = 0; $i < \count($temp); ++$i) { |
|
393 | - if ('' == trim($temp[$i])) { |
|
394 | - continue; |
|
395 | - } |
|
396 | - $result[] = $temp[$i]; |
|
397 | - } |
|
398 | - $html = implode($this->newline, $result); |
|
399 | - } |
|
400 | - |
|
401 | - /** |
|
402 | - * Include configured header comment in HTML content block. |
|
403 | - */ |
|
404 | - public function includeHeaderComment(string &$html): void |
|
405 | - { |
|
406 | - $html = preg_replace('/^(-->)$/m', "\n\t".$this->headerComment."\n$1", $html); |
|
407 | - } |
|
20 | + /** |
|
21 | + * Enable Debug comment in footer. |
|
22 | + * |
|
23 | + * @var bool |
|
24 | + */ |
|
25 | + protected $debugComment = false; |
|
26 | + |
|
27 | + /** |
|
28 | + * Format Type. |
|
29 | + * |
|
30 | + * @var int |
|
31 | + */ |
|
32 | + protected $formatType = 0; |
|
33 | + |
|
34 | + /** |
|
35 | + * Tab character. |
|
36 | + * |
|
37 | + * @var string |
|
38 | + */ |
|
39 | + protected $tab = "\t"; |
|
40 | + |
|
41 | + /** |
|
42 | + * Newline character. |
|
43 | + * |
|
44 | + * @var string |
|
45 | + */ |
|
46 | + protected $newline = "\n"; |
|
47 | + |
|
48 | + /** |
|
49 | + * Configured extra header comment. |
|
50 | + * |
|
51 | + * @var string |
|
52 | + */ |
|
53 | + protected $headerComment = ''; |
|
54 | + |
|
55 | + /** |
|
56 | + * Empty space char. |
|
57 | + * |
|
58 | + * @var string |
|
59 | + */ |
|
60 | + protected $emptySpaceChar = ' '; |
|
61 | + |
|
62 | + /** |
|
63 | + * Set variables based on given config. |
|
64 | + */ |
|
65 | + public function setVariables(array $config): void |
|
66 | + { |
|
67 | + if (!empty($config)) { |
|
68 | + if ($config['formatHtml'] && is_numeric($config['formatHtml'])) { |
|
69 | + $this->formatType = (int) $config['formatHtml']; |
|
70 | + } |
|
71 | + |
|
72 | + if ($config['formatHtml.']['tabSize'] && is_numeric($config['formatHtml.']['tabSize'])) { |
|
73 | + $this->tab = str_pad('', (int) $config['formatHtml.']['tabSize'], ' '); |
|
74 | + } |
|
75 | + |
|
76 | + if (isset($config['formatHtml.']['debugComment'])) { |
|
77 | + $this->debugComment = (bool) $config['formatHtml.']['debugComment']; |
|
78 | + } |
|
79 | + |
|
80 | + if (isset($config['headerComment'])) { |
|
81 | + $this->headerComment = $config['headerComment']; |
|
82 | + } |
|
83 | + |
|
84 | + if (isset($config['dropEmptySpaceChar']) && (bool) $config['dropEmptySpaceChar']) { |
|
85 | + $this->emptySpaceChar = ''; |
|
86 | + } |
|
87 | + } |
|
88 | + } |
|
89 | + |
|
90 | + /** |
|
91 | + * Clean given HTML with formatter. |
|
92 | + * |
|
93 | + * @return string |
|
94 | + */ |
|
95 | + public function clean(string $html, array $config = []) |
|
96 | + { |
|
97 | + if (!empty($config)) { |
|
98 | + $this->setVariables($config); |
|
99 | + } |
|
100 | + // convert line-breaks to UNIX |
|
101 | + $this->convNlOs($html); |
|
102 | + |
|
103 | + $manipulations = []; |
|
104 | + |
|
105 | + if (isset($config['removeGenerator']) && (bool) $config['removeGenerator']) { |
|
106 | + $manipulations['removeGenerator'] = GeneralUtility::makeInstance(RemoveGenerator::class); |
|
107 | + } |
|
108 | + |
|
109 | + if (isset($config['removeComments']) && (bool) $config['removeComments']) { |
|
110 | + $manipulations['removeComments'] = GeneralUtility::makeInstance(RemoveComments::class); |
|
111 | + } |
|
112 | + |
|
113 | + if (!empty($this->headerComment)) { |
|
114 | + $this->includeHeaderComment($html); |
|
115 | + } |
|
116 | + |
|
117 | + foreach ($manipulations as $key => $manipulation) { |
|
118 | + /** @var ManipulationInterface $manipulation */ |
|
119 | + $configuration = isset($config[$key.'.']) && \is_array($config[$key.'.']) ? $config[$key.'.'] : []; |
|
120 | + $html = $manipulation->manipulate($html, $configuration); |
|
121 | + } |
|
122 | + |
|
123 | + // cleanup HTML5 self-closing elements |
|
124 | + if (!isset($GLOBALS['TSFE']->config['config']['doctype']) |
|
125 | + || 'x' !== substr($GLOBALS['TSFE']->config['config']['doctype'], 0, 1)) { |
|
126 | + $html = preg_replace( |
|
127 | + '/<((?:area|base|br|col|embed|hr|img|input|link|meta|param|source|track|wbr)\s[^>\\\\]+?)\s?\/>/', |
|
128 | + '<$1>', |
|
129 | + $html |
|
130 | + ); |
|
131 | + } |
|
132 | + |
|
133 | + if ($this->formatType > 0) { |
|
134 | + $html = $this->formatHtml($html); |
|
135 | + } |
|
136 | + // remove white space after line ending |
|
137 | + $this->rTrimLines($html); |
|
138 | + |
|
139 | + // recover line-breaks |
|
140 | + if (Environment::isWindows()) { |
|
141 | + $html = str_replace($this->newline, "\r\n", $html); |
|
142 | + } |
|
143 | + |
|
144 | + return $html; |
|
145 | + } |
|
146 | + |
|
147 | + /** |
|
148 | + * Formats the (X)HTML code: |
|
149 | + * - tabs according to the hierarchy of the tags |
|
150 | + * - removes empty spaces between tags |
|
151 | + * - removes linebreaks within tags (spares where necessary: pre, textarea, comments, ..) |
|
152 | + * choose from five options: |
|
153 | + * 0 => off |
|
154 | + * 1 => no line break at all (code in one line) |
|
155 | + * 2 => minimalistic line breaks (structure defining box-elements) |
|
156 | + * 3 => aesthetic line breaks (important box-elements) |
|
157 | + * 4 => logic line breaks (all box-elements) |
|
158 | + * 5 => max line breaks (all elements). |
|
159 | + */ |
|
160 | + protected function formatHtml(string $html):string |
|
161 | + { |
|
162 | + // Save original formatted pre, textarea, comments, styles and scripts & replace them with markers |
|
163 | + preg_match_all( |
|
164 | + '/(?s)((<!--.*?-->)|(<[ \n\r]*pre[^>]*>.*?<[ \n\r]*\/pre[^>]*>)|(<[ \n\r]*textarea[^>]*>.*?<[ \n\r]*\/textarea[^>]*>)|(<[ \n\r]*style[^>]*>.*?<[ \n\r]*\/style[^>]*>)|(<[ \n\r]*script[^>]*>.*?<[ \n\r]*\/script[^>]*>))/im', |
|
165 | + $html, |
|
166 | + $matches |
|
167 | + ); |
|
168 | + $noFormat = $matches[0]; // do not format these block elements |
|
169 | + for ($i = 0; $i < \count($noFormat); ++$i) { |
|
170 | + $html = str_replace($noFormat[$i], "\n<!-- ELEMENT {$i} -->", $html); |
|
171 | + } |
|
172 | + |
|
173 | + // define box elements for formatting |
|
174 | + $trueBoxElements = 'address|blockquote|center|dir|div|dl|fieldset|form|h1|h2|h3|h4|h5|h6|hr|isindex|menu|noframes|noscript|ol|p|pre|table|ul|article|aside|details|figcaption|figure|footer|header|hgroup|menu|nav|section'; |
|
175 | + $functionalBoxElements = 'dd|dt|frameset|li|tbody|td|tfoot|th|thead|tr|colgroup'; |
|
176 | + $usableBoxElements = 'applet|button|del|iframe|ins|map|object|script'; |
|
177 | + $imagineBoxElements = 'html|body|head|meta|title|link|script|base|!--'; |
|
178 | + $allBoxLikeElements = '(?>'.$trueBoxElements.'|'.$functionalBoxElements.'|'.$usableBoxElements.'|'.$imagineBoxElements.')'; |
|
179 | + $esteticBoxLikeElements = '(?>html|head|body|meta name|title|div|table|h1|h2|h3|h4|h5|h6|p|form|pre|center|!--)'; |
|
180 | + $structureBoxLikeElements = '(?>html|head|body|div|!--)'; |
|
181 | + |
|
182 | + // split html into its elements |
|
183 | + $htmlArrayTemp = preg_split( |
|
184 | + '/(<(?:[^<>]+(?:"[^"]*"|\'[^\']*\')?)+>)/', |
|
185 | + $html, |
|
186 | + -1, |
|
187 | + \PREG_SPLIT_DELIM_CAPTURE | \PREG_SPLIT_NO_EMPTY |
|
188 | + ); |
|
189 | + |
|
190 | + if (false === $htmlArrayTemp) { |
|
191 | + // Restore saved comments, styles and scripts |
|
192 | + for ($i = 0; $i < \count($noFormat); ++$i) { |
|
193 | + $html = str_replace("<!-- ELEMENT {$i} -->", $noFormat[$i], $html); |
|
194 | + } |
|
195 | + |
|
196 | + return $html; |
|
197 | + } |
|
198 | + // remove empty lines |
|
199 | + $htmlArray = ['']; |
|
200 | + $index = 1; |
|
201 | + for ($x = 0; $x < \count($htmlArrayTemp); ++$x) { |
|
202 | + $text = trim($htmlArrayTemp[$x]); |
|
203 | + $htmlArray[$index] = '' !== $text ? $htmlArrayTemp[$x] : $this->emptySpaceChar; |
|
204 | + ++$index; |
|
205 | + } |
|
206 | + |
|
207 | + // rebuild html |
|
208 | + $html = ''; |
|
209 | + $tabs = 0; |
|
210 | + for ($x = 0; $x < \count($htmlArray); ++$x) { |
|
211 | + $htmlArrayBefore = $htmlArray[$x - 1] ?? ''; |
|
212 | + $htmlArrayCurrent = $htmlArray[$x] ?? ''; |
|
213 | + |
|
214 | + // check if the element should stand in a new line |
|
215 | + $newline = false; |
|
216 | + if ('<?xml' == substr($htmlArrayBefore, 0, 5)) { |
|
217 | + $newline = true; |
|
218 | + } elseif (2 == $this->formatType && ( // minimalistic line break |
|
219 | + // this element has a line break before itself |
|
220 | + preg_match( |
|
221 | + '/<'.$structureBoxLikeElements.'(.*)>/Usi', |
|
222 | + $htmlArrayCurrent |
|
223 | + ) || preg_match( |
|
224 | + '/<'.$structureBoxLikeElements.'(.*) \/>/Usi', |
|
225 | + $htmlArrayCurrent |
|
226 | + ) // one element before is a element that has a line break after |
|
227 | + || preg_match( |
|
228 | + '/<\/'.$structureBoxLikeElements.'(.*)>/Usi', |
|
229 | + $htmlArrayBefore |
|
230 | + ) || '<!--' == substr( |
|
231 | + $htmlArrayBefore, |
|
232 | + 0, |
|
233 | + 4 |
|
234 | + ) || preg_match('/<'.$structureBoxLikeElements.'(.*) \/>/Usi', $htmlArrayBefore)) |
|
235 | + ) { |
|
236 | + $newline = true; |
|
237 | + } elseif (3 == $this->formatType && ( // aestetic line break |
|
238 | + // this element has a line break before itself |
|
239 | + preg_match( |
|
240 | + '/<'.$esteticBoxLikeElements.'(.*)>/Usi', |
|
241 | + $htmlArrayCurrent |
|
242 | + ) || preg_match( |
|
243 | + '/<'.$esteticBoxLikeElements.'(.*) \/>/Usi', |
|
244 | + $htmlArrayCurrent |
|
245 | + ) // one element before is a element that has a line break after |
|
246 | + || preg_match('/<\/'.$esteticBoxLikeElements.'(.*)>/Usi', $htmlArrayBefore) || '<!--' == substr( |
|
247 | + $htmlArrayBefore, |
|
248 | + 0, |
|
249 | + 4 |
|
250 | + ) || preg_match('/<'.$esteticBoxLikeElements.'(.*) \/>/Usi', $htmlArrayBefore)) |
|
251 | + ) { |
|
252 | + $newline = true; |
|
253 | + } elseif ($this->formatType >= 4 && ( // logical line break |
|
254 | + // this element has a line break before itself |
|
255 | + preg_match( |
|
256 | + '/<'.$allBoxLikeElements.'(.*)>/Usi', |
|
257 | + $htmlArrayCurrent |
|
258 | + ) || preg_match( |
|
259 | + '/<'.$allBoxLikeElements.'(.*) \/>/Usi', |
|
260 | + $htmlArrayCurrent |
|
261 | + ) // one element before is a element that has a line break after |
|
262 | + || preg_match('/<\/'.$allBoxLikeElements.'(.*)>/Usi', $htmlArrayBefore) || '<!--' == substr( |
|
263 | + $htmlArrayBefore, |
|
264 | + 0, |
|
265 | + 4 |
|
266 | + ) || preg_match('/<'.$allBoxLikeElements.'(.*) \/>/Usi', $htmlArrayBefore)) |
|
267 | + ) { |
|
268 | + $newline = true; |
|
269 | + } |
|
270 | + |
|
271 | + // count down a tab |
|
272 | + if ('</' == substr($htmlArrayCurrent, 0, 2)) { |
|
273 | + --$tabs; |
|
274 | + } |
|
275 | + |
|
276 | + // add tabs and line breaks in front of the current tag |
|
277 | + if ($newline) { |
|
278 | + $html .= $this->newline; |
|
279 | + for ($y = 0; $y < $tabs; ++$y) { |
|
280 | + $html .= $this->tab; |
|
281 | + } |
|
282 | + } |
|
283 | + |
|
284 | + // remove white spaces and line breaks and add current tag to the html-string |
|
285 | + if ('<![CDATA[' == substr($htmlArrayCurrent, 0, 9) // remove multiple white space in CDATA / XML |
|
286 | + || '<?xml' == substr($htmlArrayCurrent, 0, 5) |
|
287 | + ) { |
|
288 | + $html .= $this->killWhiteSpace($htmlArrayCurrent); |
|
289 | + } else { // remove all line breaks |
|
290 | + $html .= $this->killLineBreaks($htmlArrayCurrent); |
|
291 | + } |
|
292 | + |
|
293 | + // count up a tab |
|
294 | + if ('<' == substr($htmlArrayCurrent, 0, 1) && '/' != substr($htmlArrayCurrent, 1, 1)) { |
|
295 | + if (' ' !== substr($htmlArrayCurrent, 1, 1) |
|
296 | + && 'img' !== substr($htmlArrayCurrent, 1, 3) |
|
297 | + && 'source' !== substr($htmlArrayCurrent, 1, 6) |
|
298 | + && 'br' !== substr($htmlArrayCurrent, 1, 2) |
|
299 | + && 'hr' !== substr($htmlArrayCurrent, 1, 2) |
|
300 | + && 'input' !== substr($htmlArrayCurrent, 1, 5) |
|
301 | + && 'link' !== substr($htmlArrayCurrent, 1, 4) |
|
302 | + && 'meta' !== substr($htmlArrayCurrent, 1, 4) |
|
303 | + && 'col ' !== substr($htmlArrayCurrent, 1, 4) |
|
304 | + && 'frame' !== substr($htmlArrayCurrent, 1, 5) |
|
305 | + && 'isindex' !== substr($htmlArrayCurrent, 1, 7) |
|
306 | + && 'param' !== substr($htmlArrayCurrent, 1, 5) |
|
307 | + && 'area' !== substr($htmlArrayCurrent, 1, 4) |
|
308 | + && 'base' !== substr($htmlArrayCurrent, 1, 4) |
|
309 | + && '<!' !== substr($htmlArrayCurrent, 0, 2) |
|
310 | + && '<?xml' !== substr($htmlArrayCurrent, 0, 5) |
|
311 | + ) { |
|
312 | + ++$tabs; |
|
313 | + } |
|
314 | + } |
|
315 | + } |
|
316 | + |
|
317 | + // Remove empty lines |
|
318 | + if ($this->formatType > 1) { |
|
319 | + $this->removeEmptyLines($html); |
|
320 | + } |
|
321 | + |
|
322 | + // Restore saved comments, styles and scripts |
|
323 | + for ($i = 0; $i < \count($noFormat); ++$i) { |
|
324 | + $html = str_replace("<!-- ELEMENT {$i} -->", $noFormat[$i], $html); |
|
325 | + } |
|
326 | + |
|
327 | + // include debug comment at the end |
|
328 | + if (0 != $tabs && true === $this->debugComment) { |
|
329 | + $html .= "<!-- {$tabs} open elements found -->"; |
|
330 | + } |
|
331 | + |
|
332 | + return $html; |
|
333 | + } |
|
334 | + |
|
335 | + /** |
|
336 | + * Remove ALL line breaks and multiple white space. |
|
337 | + * |
|
338 | + * @param string $html |
|
339 | + * |
|
340 | + * @return string |
|
341 | + */ |
|
342 | + protected function killLineBreaks($html) |
|
343 | + { |
|
344 | + $html = str_replace($this->newline, '', $html); |
|
345 | + |
|
346 | + return preg_replace('/\s\s+/u', ' ', $html); |
|
347 | + // ? return preg_replace('/\n|\s+(\s)/u', '$1', $html); |
|
348 | + } |
|
349 | + |
|
350 | + /** |
|
351 | + * Remove multiple white space, keeps line breaks. |
|
352 | + */ |
|
353 | + protected function killWhiteSpace(string $html): string |
|
354 | + { |
|
355 | + $temp = explode($this->newline, $html); |
|
356 | + for ($i = 0; $i < \count($temp); ++$i) { |
|
357 | + if (!trim($temp[$i])) { |
|
358 | + unset($temp[$i]); |
|
359 | + continue; |
|
360 | + } |
|
361 | + |
|
362 | + $temp[$i] = trim($temp[$i]); |
|
363 | + $temp[$i] = preg_replace('/\s\s+/', ' ', $temp[$i]); |
|
364 | + } |
|
365 | + |
|
366 | + return implode($this->newline, $temp); |
|
367 | + } |
|
368 | + |
|
369 | + /** |
|
370 | + * Remove white space at the end of lines, keeps other white space and line breaks. |
|
371 | + */ |
|
372 | + protected function rTrimLines(string &$html): void |
|
373 | + { |
|
374 | + $html = preg_replace('/\s+$/m', '', $html); |
|
375 | + } |
|
376 | + |
|
377 | + /** |
|
378 | + * Convert CRLF and lone CR line breaks to the configured newline character. |
|
379 | + */ |
|
380 | + protected function convNlOs(string &$html): void |
|
381 | + { |
|
382 | + $html = preg_replace("(\r\n|\r)", $this->newline, $html); |
|
383 | + } |
|
384 | + |
|
385 | + /** |
|
386 | + * Remove empty lines. |
|
387 | + */ |
|
388 | + protected function removeEmptyLines(string &$html): void |
|
389 | + { |
|
390 | + $temp = explode($this->newline, $html); |
|
391 | + $result = []; |
|
392 | + for ($i = 0; $i < \count($temp); ++$i) { |
|
393 | + if ('' == trim($temp[$i])) { |
|
394 | + continue; |
|
395 | + } |
|
396 | + $result[] = $temp[$i]; |
|
397 | + } |
|
398 | + $html = implode($this->newline, $result); |
|
399 | + } |
|
400 | + |
|
401 | + /** |
|
402 | + * Include configured header comment in HTML content block. |
|
403 | + */ |
|
404 | + public function includeHeaderComment(string &$html): void |
|
405 | + { |
|
406 | + $html = preg_replace('/^(-->)$/m', "\n\t".$this->headerComment."\n$1", $html); |
|
407 | + } |
|
408 | 408 | } |
@@ -13,197 +13,197 @@ |
||
13 | 13 | */ |
14 | 14 | class SvgStoreService implements \TYPO3\CMS\Core\SingletonInterface |
15 | 15 | { |
16 | - /** |
|
17 | - * SVG-Sprite storage directory. |
|
18 | - * |
|
19 | - * @var string |
|
20 | - */ |
|
21 | - protected $outputDir = '/typo3temp/assets/svg/'; |
|
22 | - |
|
23 | - public function __construct() |
|
24 | - { |
|
25 | - // $this->styl = []; # https://stackoverflow.com/questions/39583880/external-svg-fails-to-apply-internal-css |
|
26 | - // $this->defs = []; # https://bugs.chromium.org/p/chromium/issues/detail?id=751733#c14 |
|
27 | - $this->svgs = []; |
|
28 | - |
|
29 | - $this->sitePath = \TYPO3\CMS\Core\Core\Environment::getPublicPath(); // [^/]$ |
|
30 | - $this->svgCache = GeneralUtility::makeInstance(\TYPO3\CMS\Core\Cache\CacheManager::class)->getCache('svgstore'); |
|
31 | - } |
|
32 | - |
|
33 | - public function process(string $html): string |
|
34 | - { |
|
35 | - $this->spritePath = $this->svgCache->get('spritePath') ?: ''; |
|
36 | - $this->svgFileArr = $this->svgCache->get('svgFileArr') ?: []; |
|
37 | - |
|
38 | - if (empty($this->spritePath) && !$this->populateCache()) { |
|
39 | - throw new \Exception('could not write file: '.$this->sitePath.$this->spritePath); |
|
40 | - } |
|
41 | - |
|
42 | - if (!file_exists($this->sitePath.$this->spritePath)) { |
|
43 | - throw new \Exception('file does not exists: '.$this->sitePath.$this->spritePath); |
|
44 | - } |
|
45 | - |
|
46 | - if ($GLOBALS['TSFE']->config['config']['disableAllHeaderCode'] ?? false) { |
|
47 | - $dom = ['head' => '', 'body' => $html]; |
|
48 | - } elseif (!preg_match('/(?<head>.+?<\/head>)(?<body>.+)/s', $html, $dom) && 5 == \count($dom)) { |
|
49 | - return $html; |
|
50 | - } |
|
51 | - |
|
52 | - // https://developer.mozilla.org/en-US/docs/Web/HTML/Element/img#attributes |
|
53 | - $dom['body'] = preg_replace_callback('/<img(?<pre>[^>]*)src="(?:https?:)?(?:\/\/[^\/]+?)?(?<src>\/[^"]+\.svg)"(?<post>[^>]*?)[\s\/]*>(?!\s*<\/picture>)/s', function (array $match): string { // ^[/] |
|
54 | - if (!isset($this->svgFileArr[$match['src']])) { // check usage |
|
55 | - return $match[0]; |
|
56 | - } |
|
57 | - $attr = preg_replace('/\s(?:alt|ismap|loading|title|sizes|srcset|usemap|crossorigin|decoding|referrerpolicy)="[^"]*"/', '', $match['pre'].$match['post']); // cleanup |
|
58 | - |
|
59 | - return sprintf('<svg %s %s><use href="%s#%s"/></svg>', $this->svgFileArr[$match['src']]['attr'], trim($attr), $this->spritePath, $this->convertFilePath($match['src'])); |
|
60 | - }, $dom['body']); |
|
61 | - |
|
62 | - // https://developer.mozilla.org/en-US/docs/Web/HTML/Element/object#attributes |
|
63 | - $dom['body'] = preg_replace_callback('/<object(?<pre>[^>]*)data="(?<data>\/[^"]+\.svg)"(?<post>[^>]*?)[\s\/]*>(?:<\/object>)/s', function (array $match): string { // ^[/] |
|
64 | - if (!isset($this->svgFileArr[$match['data']])) { // check usage |
|
65 | - return $match[0]; |
|
66 | - } |
|
67 | - $attr = preg_replace('/\s(?:form|name|type|usemap)="[^"]*"/', '', $match['pre'].$match['post']); // cleanup |
|
68 | - |
|
69 | - return sprintf('<svg %s %s><use href="%s#%s"/></svg>', $this->svgFileArr[$match['data']]['attr'], trim($attr), $this->spritePath, $this->convertFilePath($match['data'])); |
|
70 | - }, $dom['body']); |
|
71 | - |
|
72 | - return $dom['head'].$dom['body']; |
|
73 | - } |
|
74 | - |
|
75 | - private function convertFilePath(string $path): string |
|
76 | - { |
|
77 | - return preg_replace('/.svg$|[^\w\-]/', '', str_replace('/', '-', ltrim($path, '/'))); // ^[^/] |
|
78 | - } |
|
79 | - |
|
80 | - private function addFileToSpriteArr(string $hash, string $path): ?array |
|
81 | - { |
|
82 | - if (!file_exists($this->sitePath.$path)) { |
|
83 | - return null; |
|
84 | - } |
|
85 | - |
|
86 | - if (preg_match('/(?:;base64|i:a?i?pgf)/', $svg = file_get_contents($this->sitePath.$path))) { // noop! |
|
87 | - return null; |
|
88 | - } |
|
89 | - |
|
90 | - if (preg_match('/<(?:style|defs)|url\(/', $svg)) { |
|
91 | - return null; // check links @ __construct |
|
92 | - } |
|
93 | - |
|
94 | - // https://developer.mozilla.org/en-US/docs/Web/SVG/Attribute/xlink:href |
|
95 | - $svg = preg_replace('/^.*?<svg|\s*(<\/svg>)(?!.*\1).*$|xlink:|\s(?:(?:version|xmlns)|(?:[a-z\-]+\:[a-z\-]+))="[^"]*"/s', '', $svg); // cleanup |
|
96 | - |
|
97 | - // $svg = preg_replace('/(?<=(?:id|class)=")/', $hash.'__', $svg); // extend IDs |
|
98 | - // $svg = preg_replace('/(?<=href="|url\()#/', $hash.'__', $svg); // recover IDs |
|
99 | - |
|
100 | - // $svg = preg_replace_callback('/<style[^>]*>(?<styl>.+?)<\/style>|<defs[^>]*>(?<defs>.+?)<\/defs>/s', function(array $match) use($hash): string { |
|
101 | - // |
|
102 | - // if(isset($match['styl'])) |
|
103 | - // { |
|
104 | - // $this->styl[] = preg_replace('/\s*(\.|#){1}(.+?)\s*\{/', '$1'.$hash.'__$2{', $match['styl']); // patch CSS # https://mathiasbynens.be/notes/css-escapes |
|
105 | - // } |
|
106 | - // if(isset($match['defs'])) |
|
107 | - // { |
|
108 | - // $this->defs[] = trim($match['defs']); |
|
109 | - // } |
|
110 | - // return ''; |
|
111 | - // }, $svg); |
|
112 | - |
|
113 | - // https://developer.mozilla.org/en-US/docs/Web/SVG/Element/svg#attributes |
|
114 | - $svg = preg_replace_callback('/([^>]*)\s*(?=>)/s', function (array $match) use (&$attr): string { |
|
115 | - if (false === preg_match_all('/(?!\s)(?<attr>[\w\-]+)="\s*(?<value>[^"]+)\s*"/', $match[1], $matches)) { |
|
116 | - return $match[0]; |
|
117 | - } |
|
118 | - foreach ($matches['attr'] as $index => $attribute) { |
|
119 | - switch ($attribute) { |
|
120 | - case 'id': |
|
121 | - case 'width': |
|
122 | - case 'height': |
|
123 | - unset($matches[0][$index]); |
|
124 | - break; |
|
125 | - |
|
126 | - case 'viewBox': |
|
127 | - if (false !== preg_match('/\S+\s\S+\s\+?(?<width>[\d\.]+)\s\+?(?<height>[\d\.]+)/', $matches['value'][$index], $match)) { |
|
128 | - $attr[] = sprintf('%s="0 0 %s %s"', $attribute, $match['width'], $match['height']); // save! |
|
129 | - } |
|
130 | - } |
|
131 | - } |
|
132 | - |
|
133 | - return implode(' ', $matches[0]); |
|
134 | - }, $svg, 1); |
|
135 | - |
|
136 | - if ($attr) { // TODO; beautify |
|
137 | - $this->svgs[] = sprintf('id="%s" %s', $this->convertFilePath($path), $svg); // prepend ID |
|
138 | - |
|
139 | - return ['attr' => implode(' ', $attr), 'hash' => $hash]; |
|
140 | - } |
|
141 | - |
|
142 | - return null; |
|
143 | - } |
|
144 | - |
|
145 | - private function populateCache(): bool |
|
146 | - { |
|
147 | - $storageArr = GeneralUtility::makeInstance(\TYPO3\CMS\Core\Resource\StorageRepository::class)->findAll(); |
|
148 | - foreach ($storageArr as $storage) { |
|
149 | - if ('relative' == $storage->getConfiguration()['pathType']) { |
|
150 | - $storageArr[$storage->getUid()] = rtrim($storage->getConfiguration()['basePath'], '/'); // [^/]$ |
|
151 | - } |
|
152 | - } |
|
153 | - unset($storageArr[0]); // keep! |
|
154 | - |
|
155 | - $fileArr = GeneralUtility::makeInstance(\HTML\Sourceopt\Resource\SvgFileRepository::class)->findAllByStorageUids(array_keys($storageArr)); |
|
156 | - foreach ($fileArr as $file) { |
|
157 | - $file['path'] = '/'.$storageArr[$file['storage']].$file['identifier']; // ^[/] |
|
158 | - $file['defs'] = $this->addFileToSpriteArr($file['sha1'], $file['path']); |
|
159 | - |
|
160 | - if (null !== $file['defs']) { |
|
161 | - $this->svgFileArr[$file['path']] = $file['defs']; |
|
162 | - } |
|
163 | - } |
|
164 | - unset($storageArr, $storage, $fileArr, $file); // save MEM |
|
165 | - |
|
166 | - $svg = preg_replace_callback( |
|
167 | - '/<use(?<pre>.*?)(?:xlink:)?href="(?<href>\/.+?\.svg)#[^"]+"(?<post>.*?)[\s\/]*>(?:<\/use>)?/s', |
|
168 | - function (array $match): string { |
|
169 | - if (!isset($this->svgFileArr[$match['href']])) { // check usage |
|
170 | - return $match[0]; |
|
171 | - } |
|
172 | - |
|
173 | - return sprintf('<use%s href="#%s"/>', $match['pre'].$match['post'], $this->convertFilePath($match['href'])); |
|
174 | - }, |
|
175 | - '<svg xmlns="http://www.w3.org/2000/svg">' |
|
176 | - // ."\n<style>\n".implode("\n", $this->styl)."\n</style>" |
|
177 | - // ."\n<defs>\n".implode("\n", $this->defs)."\n</defs>" |
|
178 | - ."\n<symbol ".implode("</symbol>\n<symbol ", $this->svgs)."</symbol>\n" |
|
179 | - .'</svg>' |
|
180 | - ); |
|
181 | - |
|
182 | - // unset($this->styl); // save MEM |
|
183 | - // unset($this->defs); // save MEM |
|
184 | - unset($this->svgs); // save MEM |
|
185 | - |
|
186 | - if ($GLOBALS['TSFE']->config['config']['sourceopt.']['formatHtml'] ?? false) { |
|
187 | - $svg = preg_replace('/(?<=>)\s+(?=<)/', '', $svg); // remove emptiness |
|
188 | - $svg = preg_replace('/[\t\v]/', ' ', $svg); // prepare shrinkage |
|
189 | - $svg = preg_replace('/\s{2,}/', ' ', $svg); // shrink whitespace |
|
190 | - } |
|
191 | - |
|
192 | - $svg = preg_replace('/<([a-z]+)\s*(\/|>\s*<\/\1)>\s*|\s+(?=\/>)/i', '', $svg); // remove emtpy TAGs & shorten endings |
|
193 | - $svg = preg_replace('/<((circle|ellipse|line|path|polygon|polyline|rect|stop|use)\s[^>]+?)\s*>\s*<\/\2>/', '<$1/>', $svg); // shorten/minify TAG syntax |
|
194 | - |
|
195 | - if (!is_dir($this->sitePath.$this->outputDir)) { |
|
196 | - GeneralUtility::mkdir_deep($this->sitePath.$this->outputDir); |
|
197 | - } |
|
198 | - |
|
199 | - $this->spritePath = $this->outputDir.hash('sha1', serialize($this->svgFileArr)).'.svg'; |
|
200 | - if (false === file_put_contents($this->sitePath.$this->spritePath, $svg)) { |
|
201 | - return false; |
|
202 | - } |
|
203 | - |
|
204 | - $this->svgCache->set('spritePath', $this->spritePath); |
|
205 | - $this->svgCache->set('svgFileArr', $this->svgFileArr); |
|
206 | - |
|
207 | - return true; |
|
208 | - } |
|
16 | + /** |
|
17 | + * SVG-Sprite storage directory. |
|
18 | + * |
|
19 | + * @var string |
|
20 | + */ |
|
21 | + protected $outputDir = '/typo3temp/assets/svg/'; |
|
22 | + |
|
23 | + public function __construct() |
|
24 | + { |
|
25 | + // $this->styl = []; # https://stackoverflow.com/questions/39583880/external-svg-fails-to-apply-internal-css |
|
26 | + // $this->defs = []; # https://bugs.chromium.org/p/chromium/issues/detail?id=751733#c14 |
|
27 | + $this->svgs = []; |
|
28 | + |
|
29 | + $this->sitePath = \TYPO3\CMS\Core\Core\Environment::getPublicPath(); // [^/]$ |
|
30 | + $this->svgCache = GeneralUtility::makeInstance(\TYPO3\CMS\Core\Cache\CacheManager::class)->getCache('svgstore'); |
|
31 | + } |
|
32 | + |
|
33 | + public function process(string $html): string |
|
34 | + { |
|
35 | + $this->spritePath = $this->svgCache->get('spritePath') ?: ''; |
|
36 | + $this->svgFileArr = $this->svgCache->get('svgFileArr') ?: []; |
|
37 | + |
|
38 | + if (empty($this->spritePath) && !$this->populateCache()) { |
|
39 | + throw new \Exception('could not write file: '.$this->sitePath.$this->spritePath); |
|
40 | + } |
|
41 | + |
|
42 | + if (!file_exists($this->sitePath.$this->spritePath)) { |
|
43 | + throw new \Exception('file does not exists: '.$this->sitePath.$this->spritePath); |
|
44 | + } |
|
45 | + |
|
46 | + if ($GLOBALS['TSFE']->config['config']['disableAllHeaderCode'] ?? false) { |
|
47 | + $dom = ['head' => '', 'body' => $html]; |
|
48 | + } elseif (!preg_match('/(?<head>.+?<\/head>)(?<body>.+)/s', $html, $dom) && 5 == \count($dom)) { |
|
49 | + return $html; |
|
50 | + } |
|
51 | + |
|
52 | + // https://developer.mozilla.org/en-US/docs/Web/HTML/Element/img#attributes |
|
53 | + $dom['body'] = preg_replace_callback('/<img(?<pre>[^>]*)src="(?:https?:)?(?:\/\/[^\/]+?)?(?<src>\/[^"]+\.svg)"(?<post>[^>]*?)[\s\/]*>(?!\s*<\/picture>)/s', function (array $match): string { // ^[/] |
|
54 | + if (!isset($this->svgFileArr[$match['src']])) { // check usage |
|
55 | + return $match[0]; |
|
56 | + } |
|
57 | + $attr = preg_replace('/\s(?:alt|ismap|loading|title|sizes|srcset|usemap|crossorigin|decoding|referrerpolicy)="[^"]*"/', '', $match['pre'].$match['post']); // cleanup |
|
58 | + |
|
59 | + return sprintf('<svg %s %s><use href="%s#%s"/></svg>', $this->svgFileArr[$match['src']]['attr'], trim($attr), $this->spritePath, $this->convertFilePath($match['src'])); |
|
60 | + }, $dom['body']); |
|
61 | + |
|
62 | + // https://developer.mozilla.org/en-US/docs/Web/HTML/Element/object#attributes |
|
63 | + $dom['body'] = preg_replace_callback('/<object(?<pre>[^>]*)data="(?<data>\/[^"]+\.svg)"(?<post>[^>]*?)[\s\/]*>(?:<\/object>)/s', function (array $match): string { // ^[/] |
|
64 | + if (!isset($this->svgFileArr[$match['data']])) { // check usage |
|
65 | + return $match[0]; |
|
66 | + } |
|
67 | + $attr = preg_replace('/\s(?:form|name|type|usemap)="[^"]*"/', '', $match['pre'].$match['post']); // cleanup |
|
68 | + |
|
69 | + return sprintf('<svg %s %s><use href="%s#%s"/></svg>', $this->svgFileArr[$match['data']]['attr'], trim($attr), $this->spritePath, $this->convertFilePath($match['data'])); |
|
70 | + }, $dom['body']); |
|
71 | + |
|
72 | + return $dom['head'].$dom['body']; |
|
73 | + } |
|
74 | + |
|
75 | + private function convertFilePath(string $path): string |
|
76 | + { |
|
77 | + return preg_replace('/.svg$|[^\w\-]/', '', str_replace('/', '-', ltrim($path, '/'))); // ^[^/] |
|
78 | + } |
|
79 | + |
|
80 | + private function addFileToSpriteArr(string $hash, string $path): ?array |
|
81 | + { |
|
82 | + if (!file_exists($this->sitePath.$path)) { |
|
83 | + return null; |
|
84 | + } |
|
85 | + |
|
86 | + if (preg_match('/(?:;base64|i:a?i?pgf)/', $svg = file_get_contents($this->sitePath.$path))) { // noop! |
|
87 | + return null; |
|
88 | + } |
|
89 | + |
|
90 | + if (preg_match('/<(?:style|defs)|url\(/', $svg)) { |
|
91 | + return null; // check links @ __construct |
|
92 | + } |
|
93 | + |
|
94 | + // https://developer.mozilla.org/en-US/docs/Web/SVG/Attribute/xlink:href |
|
95 | + $svg = preg_replace('/^.*?<svg|\s*(<\/svg>)(?!.*\1).*$|xlink:|\s(?:(?:version|xmlns)|(?:[a-z\-]+\:[a-z\-]+))="[^"]*"/s', '', $svg); // cleanup |
|
96 | + |
|
97 | + // $svg = preg_replace('/(?<=(?:id|class)=")/', $hash.'__', $svg); // extend IDs |
|
98 | + // $svg = preg_replace('/(?<=href="|url\()#/', $hash.'__', $svg); // recover IDs |
|
99 | + |
|
100 | + // $svg = preg_replace_callback('/<style[^>]*>(?<styl>.+?)<\/style>|<defs[^>]*>(?<defs>.+?)<\/defs>/s', function(array $match) use($hash): string { |
|
101 | + // |
|
102 | + // if(isset($match['styl'])) |
|
103 | + // { |
|
104 | + // $this->styl[] = preg_replace('/\s*(\.|#){1}(.+?)\s*\{/', '$1'.$hash.'__$2{', $match['styl']); // patch CSS # https://mathiasbynens.be/notes/css-escapes |
|
105 | + // } |
|
106 | + // if(isset($match['defs'])) |
|
107 | + // { |
|
108 | + // $this->defs[] = trim($match['defs']); |
|
109 | + // } |
|
110 | + // return ''; |
|
111 | + // }, $svg); |
|
112 | + |
|
113 | + // https://developer.mozilla.org/en-US/docs/Web/SVG/Element/svg#attributes |
|
114 | + $svg = preg_replace_callback('/([^>]*)\s*(?=>)/s', function (array $match) use (&$attr): string { |
|
115 | + if (false === preg_match_all('/(?!\s)(?<attr>[\w\-]+)="\s*(?<value>[^"]+)\s*"/', $match[1], $matches)) { |
|
116 | + return $match[0]; |
|
117 | + } |
|
118 | + foreach ($matches['attr'] as $index => $attribute) { |
|
119 | + switch ($attribute) { |
|
120 | + case 'id': |
|
121 | + case 'width': |
|
122 | + case 'height': |
|
123 | + unset($matches[0][$index]); |
|
124 | + break; |
|
125 | + |
|
126 | + case 'viewBox': |
|
127 | + if (false !== preg_match('/\S+\s\S+\s\+?(?<width>[\d\.]+)\s\+?(?<height>[\d\.]+)/', $matches['value'][$index], $match)) { |
|
128 | + $attr[] = sprintf('%s="0 0 %s %s"', $attribute, $match['width'], $match['height']); // save! |
|
129 | + } |
|
130 | + } |
|
131 | + } |
|
132 | + |
|
133 | + return implode(' ', $matches[0]); |
|
134 | + }, $svg, 1); |
|
135 | + |
|
136 | + if ($attr) { // TODO; beautify |
|
137 | + $this->svgs[] = sprintf('id="%s" %s', $this->convertFilePath($path), $svg); // prepend ID |
|
138 | + |
|
139 | + return ['attr' => implode(' ', $attr), 'hash' => $hash]; |
|
140 | + } |
|
141 | + |
|
142 | + return null; |
|
143 | + } |
|
144 | + |
|
145 | + private function populateCache(): bool |
|
146 | + { |
|
147 | + $storageArr = GeneralUtility::makeInstance(\TYPO3\CMS\Core\Resource\StorageRepository::class)->findAll(); |
|
148 | + foreach ($storageArr as $storage) { |
|
149 | + if ('relative' == $storage->getConfiguration()['pathType']) { |
|
150 | + $storageArr[$storage->getUid()] = rtrim($storage->getConfiguration()['basePath'], '/'); // [^/]$ |
|
151 | + } |
|
152 | + } |
|
153 | + unset($storageArr[0]); // keep! |
|
154 | + |
|
155 | + $fileArr = GeneralUtility::makeInstance(\HTML\Sourceopt\Resource\SvgFileRepository::class)->findAllByStorageUids(array_keys($storageArr)); |
|
156 | + foreach ($fileArr as $file) { |
|
157 | + $file['path'] = '/'.$storageArr[$file['storage']].$file['identifier']; // ^[/] |
|
158 | + $file['defs'] = $this->addFileToSpriteArr($file['sha1'], $file['path']); |
|
159 | + |
|
160 | + if (null !== $file['defs']) { |
|
161 | + $this->svgFileArr[$file['path']] = $file['defs']; |
|
162 | + } |
|
163 | + } |
|
164 | + unset($storageArr, $storage, $fileArr, $file); // save MEM |
|
165 | + |
|
166 | + $svg = preg_replace_callback( |
|
167 | + '/<use(?<pre>.*?)(?:xlink:)?href="(?<href>\/.+?\.svg)#[^"]+"(?<post>.*?)[\s\/]*>(?:<\/use>)?/s', |
|
168 | + function (array $match): string { |
|
169 | + if (!isset($this->svgFileArr[$match['href']])) { // check usage |
|
170 | + return $match[0]; |
|
171 | + } |
|
172 | + |
|
173 | + return sprintf('<use%s href="#%s"/>', $match['pre'].$match['post'], $this->convertFilePath($match['href'])); |
|
174 | + }, |
|
175 | + '<svg xmlns="http://www.w3.org/2000/svg">' |
|
176 | + // ."\n<style>\n".implode("\n", $this->styl)."\n</style>" |
|
177 | + // ."\n<defs>\n".implode("\n", $this->defs)."\n</defs>" |
|
178 | + ."\n<symbol ".implode("</symbol>\n<symbol ", $this->svgs)."</symbol>\n" |
|
179 | + .'</svg>' |
|
180 | + ); |
|
181 | + |
|
182 | + // unset($this->styl); // save MEM |
|
183 | + // unset($this->defs); // save MEM |
|
184 | + unset($this->svgs); // save MEM |
|
185 | + |
|
186 | + if ($GLOBALS['TSFE']->config['config']['sourceopt.']['formatHtml'] ?? false) { |
|
187 | + $svg = preg_replace('/(?<=>)\s+(?=<)/', '', $svg); // remove emptiness |
|
188 | + $svg = preg_replace('/[\t\v]/', ' ', $svg); // prepare shrinkage |
|
189 | + $svg = preg_replace('/\s{2,}/', ' ', $svg); // shrink whitespace |
|
190 | + } |
|
191 | + |
|
192 | + $svg = preg_replace('/<([a-z]+)\s*(\/|>\s*<\/\1)>\s*|\s+(?=\/>)/i', '', $svg); // remove emtpy TAGs & shorten endings |
|
193 | + $svg = preg_replace('/<((circle|ellipse|line|path|polygon|polyline|rect|stop|use)\s[^>]+?)\s*>\s*<\/\2>/', '<$1/>', $svg); // shorten/minify TAG syntax |
|
194 | + |
|
195 | + if (!is_dir($this->sitePath.$this->outputDir)) { |
|
196 | + GeneralUtility::mkdir_deep($this->sitePath.$this->outputDir); |
|
197 | + } |
|
198 | + |
|
199 | + $this->spritePath = $this->outputDir.hash('sha1', serialize($this->svgFileArr)).'.svg'; |
|
200 | + if (false === file_put_contents($this->sitePath.$this->spritePath, $svg)) { |
|
201 | + return false; |
|
202 | + } |
|
203 | + |
|
204 | + $this->svgCache->set('spritePath', $this->spritePath); |
|
205 | + $this->svgCache->set('svgFileArr', $this->svgFileArr); |
|
206 | + |
|
207 | + return true; |
|
208 | + } |
|
209 | 209 | } |