@@ -205,6 +205,7 @@ |
||
205 | 205 | /** |
206 | 206 | * Adds a module to the current doctype by first registering it, |
207 | 207 | * and then tacking it on to the active doctype |
208 | + * @param HTMLPurifier_HTMLModule $module |
|
208 | 209 | */ |
209 | 210 | public function addModule($module) |
210 | 211 | { |
@@ -174,7 +174,7 @@ discard block |
||
174 | 174 | $original_module = $module; |
175 | 175 | $ok = false; |
176 | 176 | foreach ($this->prefixes as $prefix) { |
177 | - $module = $prefix . $original_module; |
|
177 | + $module = $prefix.$original_module; |
|
178 | 178 | if (class_exists($module)) { |
179 | 179 | $ok = true; |
180 | 180 | break; |
@@ -184,7 +184,7 @@ discard block |
||
184 | 184 | $module = $original_module; |
185 | 185 | if (!class_exists($module)) { |
186 | 186 | trigger_error( |
187 | - $original_module . ' module does not exist', |
|
187 | + $original_module.' module does not exist', |
|
188 | 188 | E_USER_ERROR |
189 | 189 | ); |
190 | 190 | return; |
@@ -193,11 +193,11 @@ discard block |
||
193 | 193 | $module = new $module(); |
194 | 194 | } |
195 | 195 | if (empty($module->name)) { |
196 | - trigger_error('Module instance of ' . get_class($module) . ' must have name'); |
|
196 | + trigger_error('Module instance of '.get_class($module).' must have name'); |
|
197 | 197 | return; |
198 | 198 | } |
199 | 199 | if (!$overload && isset($this->registeredModules[$module->name])) { |
200 | - trigger_error('Overloading ' . $module->name . ' without explicit overload parameter', E_USER_WARNING); |
|
200 | + trigger_error('Overloading '.$module->name.' without explicit overload parameter', E_USER_WARNING); |
|
201 | 201 | } |
202 | 202 | $this->registeredModules[$module->name] = $module; |
203 | 203 | } |
@@ -65,7 +65,7 @@ |
||
65 | 65 | * deleted a node, and now need to see if this change affected any |
66 | 66 | * earlier nodes. Rewinding does not affect other injectors, and can |
67 | 67 | * result in infinite loops if not used carefully. |
68 | - * @param bool|int $offset |
|
68 | + * @param integer $offset |
|
69 | 69 | * @warning HTML Purifier will prevent you from fast-forwarding with this |
70 | 70 | * function. |
71 | 71 | */ |
@@ -104,9 +104,9 @@ |
||
104 | 104 | if ($result !== false) { |
105 | 105 | return $result; |
106 | 106 | } |
107 | - $this->currentNesting =& $context->get('CurrentNesting'); |
|
108 | - $this->currentToken =& $context->get('CurrentToken'); |
|
109 | - $this->inputZipper =& $context->get('InputZipper'); |
|
107 | + $this->currentNesting = & $context->get('CurrentNesting'); |
|
108 | + $this->currentToken = & $context->get('CurrentToken'); |
|
109 | + $this->inputZipper = & $context->get('InputZipper'); |
|
110 | 110 | return false; |
111 | 111 | } |
112 | 112 |
@@ -328,7 +328,7 @@ |
||
328 | 328 | * Determines if a particular token requires an earlier inline token |
329 | 329 | * to get a paragraph. This should be used with _forwardUntilEndToken |
330 | 330 | * @param HTMLPurifier_Token $current |
331 | - * @return bool |
|
331 | + * @return boolean|null |
|
332 | 332 | */ |
333 | 333 | private function _checkNeedsP($current) |
334 | 334 | { |
@@ -341,6 +341,7 @@ |
||
341 | 341 | /** |
342 | 342 | * Takes a string of HTML (fragment or document) and returns the content |
343 | 343 | * @todo Consider making protected |
344 | + * @param string $html |
|
344 | 345 | */ |
345 | 346 | public function extractBody($html) |
346 | 347 | { |
@@ -124,7 +124,7 @@ discard block |
||
124 | 124 | break; |
125 | 125 | default: |
126 | 126 | throw new HTMLPurifier_Exception( |
127 | - "Cannot instantiate unrecognized Lexer type " . |
|
127 | + "Cannot instantiate unrecognized Lexer type ". |
|
128 | 128 | htmlspecialchars($lexer) |
129 | 129 | ); |
130 | 130 | } |
@@ -138,7 +138,7 @@ discard block |
||
138 | 138 | // hack out something using XSLT, remove this stipulation |
139 | 139 | if ($needs_tracking && !$inst->tracksLineNumbers) { |
140 | 140 | throw new HTMLPurifier_Exception( |
141 | - 'Cannot use lexer that does not support line numbers with ' . |
|
141 | + 'Cannot use lexer that does not support line numbers with '. |
|
142 | 142 | 'Core.MaintainLineNumbers or Core.CollectErrors (use DirectLex instead)' |
143 | 143 | ); |
144 | 144 | } |
@@ -313,7 +313,7 @@ discard block |
||
313 | 313 | if ($config->get('Core.ConvertDocumentToFragment')) { |
314 | 314 | $e = false; |
315 | 315 | if ($config->get('Core.CollectErrors')) { |
316 | - $e =& $context->get('ErrorCollector'); |
|
316 | + $e = & $context->get('ErrorCollector'); |
|
317 | 317 | } |
318 | 318 | $new_html = $this->extractBody($html); |
319 | 319 | if ($e && $new_html != $html) { |
@@ -458,6 +458,9 @@ discard block |
||
458 | 458 | const CHARACTR = 4; |
459 | 459 | const EOF = 5; |
460 | 460 | |
461 | + /** |
|
462 | + * @param string $data |
|
463 | + */ |
|
461 | 464 | public function __construct($data) |
462 | 465 | { |
463 | 466 | $this->data = $data; |
@@ -478,6 +481,9 @@ discard block |
||
478 | 481 | return $this->tree->save(); |
479 | 482 | } |
480 | 483 | |
484 | + /** |
|
485 | + * @return string |
|
486 | + */ |
|
481 | 487 | private function char() |
482 | 488 | { |
483 | 489 | return ($this->char < $this->EOF) |
@@ -485,6 +491,11 @@ discard block |
||
485 | 491 | : false; |
486 | 492 | } |
487 | 493 | |
494 | + /** |
|
495 | + * @param integer $s |
|
496 | + * |
|
497 | + * @return string |
|
498 | + */ |
|
488 | 499 | private function character($s, $l = 0) |
489 | 500 | { |
490 | 501 | if ($s + $l < $this->EOF) { |
@@ -496,6 +507,10 @@ discard block |
||
496 | 507 | } |
497 | 508 | } |
498 | 509 | |
510 | + /** |
|
511 | + * @param string $char_class |
|
512 | + * @param integer $start |
|
513 | + */ |
|
499 | 514 | private function characters($char_class, $start) |
500 | 515 | { |
501 | 516 | return preg_replace('#^([' . $char_class . ']+).*#s', '\\1', substr($this->data, $start)); |
@@ -4645,6 +4660,9 @@ discard block |
||
4645 | 4660 | } |
4646 | 4661 | } |
4647 | 4662 | |
4663 | + /** |
|
4664 | + * @param string[] $elements |
|
4665 | + */ |
|
4648 | 4666 | private function clearStackToTableContext($elements) |
4649 | 4667 | { |
4650 | 4668 | /* When the steps above require the UA to clear the stack back to a |
@@ -469,7 +469,7 @@ discard block |
||
469 | 469 | $this->state = 'data'; |
470 | 470 | |
471 | 471 | while ($this->state !== null) { |
472 | - $this->{$this->state . 'State'}(); |
|
472 | + $this->{$this->state.'State'}(); |
|
473 | 473 | } |
474 | 474 | } |
475 | 475 | |
@@ -498,7 +498,7 @@ discard block |
||
498 | 498 | |
499 | 499 | private function characters($char_class, $start) |
500 | 500 | { |
501 | - return preg_replace('#^([' . $char_class . ']+).*#s', '\\1', substr($this->data, $start)); |
|
501 | + return preg_replace('#^(['.$char_class.']+).*#s', '\\1', substr($this->data, $start)); |
|
502 | 502 | } |
503 | 503 | |
504 | 504 | private function dataState() |
@@ -1289,7 +1289,7 @@ discard block |
||
1289 | 1289 | } else { |
1290 | 1290 | /* Append a U+002D HYPHEN-MINUS (-) character and the input |
1291 | 1291 | character to the comment token's data. Switch to the comment state. */ |
1292 | - $this->token['data'] .= '-' . $char; |
|
1292 | + $this->token['data'] .= '-'.$char; |
|
1293 | 1293 | $this->state = 'comment'; |
1294 | 1294 | } |
1295 | 1295 | } |
@@ -1313,7 +1313,7 @@ discard block |
||
1313 | 1313 | $this->state = 'data'; |
1314 | 1314 | |
1315 | 1315 | } else { |
1316 | - $this->token['data'] .= '--' . $char; |
|
1316 | + $this->token['data'] .= '--'.$char; |
|
1317 | 1317 | $this->state = 'comment'; |
1318 | 1318 | } |
1319 | 1319 | } |
@@ -1547,7 +1547,7 @@ discard block |
||
1547 | 1547 | |
1548 | 1548 | // Return a character token for the character corresponding to the |
1549 | 1549 | // entity name (as given by the second column of the entities table). |
1550 | - return html_entity_decode('&' . $entity . ';', ENT_QUOTES, 'UTF-8'); |
|
1550 | + return html_entity_decode('&'.$entity.';', ENT_QUOTES, 'UTF-8'); |
|
1551 | 1551 | } |
1552 | 1552 | |
1553 | 1553 | private function emitToken($token) |
@@ -2656,7 +2656,7 @@ discard block |
||
2656 | 2656 | |
2657 | 2657 | /* Act as if a stream of character tokens had been seen. */ |
2658 | 2658 | $this->insertText( |
2659 | - 'This is a searchable index. ' . |
|
2659 | + 'This is a searchable index. '. |
|
2660 | 2660 | 'Insert your search keywords here: ' |
2661 | 2661 | ); |
2662 | 2662 | |
@@ -2678,7 +2678,7 @@ discard block |
||
2678 | 2678 | /* Act as if a stream of character tokens had been seen |
2679 | 2679 | (see below for what they should say). */ |
2680 | 2680 | $this->insertText( |
2681 | - 'This is a searchable index. ' . |
|
2681 | + 'This is a searchable index. '. |
|
2682 | 2682 | 'Insert your search keywords here: ' |
2683 | 2683 | ); |
2684 | 2684 |
@@ -108,7 +108,7 @@ |
||
108 | 108 | /** |
109 | 109 | * Prints a simple key/value row in a table. |
110 | 110 | * @param string $name Key |
111 | - * @param mixed $value Value |
|
111 | + * @param string $value Value |
|
112 | 112 | * @return string |
113 | 113 | */ |
114 | 114 | protected function row($name, $value) |
@@ -77,8 +77,8 @@ discard block |
||
77 | 77 | */ |
78 | 78 | protected function element($tag, $contents, $attr = array(), $escape = true) |
79 | 79 | { |
80 | - return $this->start($tag, $attr) . |
|
81 | - ($escape ? $this->escape($contents) : $contents) . |
|
80 | + return $this->start($tag, $attr). |
|
81 | + ($escape ? $this->escape($contents) : $contents). |
|
82 | 82 | $this->end($tag); |
83 | 83 | } |
84 | 84 | |
@@ -117,9 +117,9 @@ discard block |
||
117 | 117 | $value = $value ? 'On' : 'Off'; |
118 | 118 | } |
119 | 119 | return |
120 | - $this->start('tr') . "\n" . |
|
121 | - $this->element('th', $name) . "\n" . |
|
122 | - $this->element('td', $value) . "\n" . |
|
120 | + $this->start('tr')."\n". |
|
121 | + $this->element('th', $name)."\n". |
|
122 | + $this->element('td', $value)."\n". |
|
123 | 123 | $this->end('tr'); |
124 | 124 | } |
125 | 125 | |
@@ -173,7 +173,7 @@ discard block |
||
173 | 173 | if ($five === null) { |
174 | 174 | $five = version_compare(PHP_VERSION, '5', '>='); |
175 | 175 | } |
176 | - $prefix = 'HTMLPurifier_' . $sec_prefix; |
|
176 | + $prefix = 'HTMLPurifier_'.$sec_prefix; |
|
177 | 177 | if (!$five) { |
178 | 178 | $prefix = strtolower($prefix); |
179 | 179 | } |
@@ -196,11 +196,11 @@ discard block |
||
196 | 196 | $class .= implode(', ', $values); |
197 | 197 | break; |
198 | 198 | case 'css_multiple': |
199 | - $class .= $this->getClass($obj->single, $sec_prefix) . ', '; |
|
199 | + $class .= $this->getClass($obj->single, $sec_prefix).', '; |
|
200 | 200 | $class .= $obj->max; |
201 | 201 | break; |
202 | 202 | case 'css_denyelementdecorator': |
203 | - $class .= $this->getClass($obj->def, $sec_prefix) . ', '; |
|
203 | + $class .= $this->getClass($obj->def, $sec_prefix).', '; |
|
204 | 204 | $class .= $obj->element; |
205 | 205 | break; |
206 | 206 | case 'css_importantdecorator': |
@@ -53,8 +53,8 @@ discard block |
||
53 | 53 | |
54 | 54 | /** |
55 | 55 | * Sets default column and row size for textareas in sub-printers |
56 | - * @param $cols Integer columns of textarea, null to use default |
|
57 | - * @param $rows Integer rows of textarea, null to use default |
|
56 | + * @param integer $cols Integer columns of textarea, null to use default |
|
57 | + * @param integer $rows Integer rows of textarea, null to use default |
|
58 | 58 | */ |
59 | 59 | public function setTextareaDimensions($cols = null, $rows = null) |
60 | 60 | { |
@@ -84,7 +84,7 @@ discard block |
||
84 | 84 | |
85 | 85 | /** |
86 | 86 | * Returns HTML output for a configuration form |
87 | - * @param HTMLPurifier_Config|array $config Configuration object of current form state, or an array |
|
87 | + * @param HTMLPurifier_Config $config Configuration object of current form state, or an array |
|
88 | 88 | * where [0] has an HTML namespace and [1] is being rendered. |
89 | 89 | * @param array|bool $allowed Optional namespace(s) and directives to restrict form to. |
90 | 90 | * @param bool $render_controls |
@@ -71,7 +71,7 @@ discard block |
||
71 | 71 | */ |
72 | 72 | public static function getCSS() |
73 | 73 | { |
74 | - return file_get_contents(HTMLPURIFIER_PREFIX . '/HTMLPurifier/Printer/ConfigForm.css'); |
|
74 | + return file_get_contents(HTMLPURIFIER_PREFIX.'/HTMLPurifier/Printer/ConfigForm.css'); |
|
75 | 75 | } |
76 | 76 | |
77 | 77 | /** |
@@ -79,7 +79,7 @@ discard block |
||
79 | 79 | */ |
80 | 80 | public static function getJavaScript() |
81 | 81 | { |
82 | - return file_get_contents(HTMLPURIFIER_PREFIX . '/HTMLPurifier/Printer/ConfigForm.js'); |
|
82 | + return file_get_contents(HTMLPURIFIER_PREFIX.'/HTMLPurifier/Printer/ConfigForm.js'); |
|
83 | 83 | } |
84 | 84 | |
85 | 85 | /** |
@@ -107,7 +107,7 @@ discard block |
||
107 | 107 | $all = array(); |
108 | 108 | foreach ($allowed as $key) { |
109 | 109 | list($ns, $directive) = $key; |
110 | - $all[$ns][$directive] = $config->get($ns . '.' . $directive); |
|
110 | + $all[$ns][$directive] = $config->get($ns.'.'.$directive); |
|
111 | 111 | } |
112 | 112 | |
113 | 113 | $ret = ''; |
@@ -163,7 +163,7 @@ discard block |
||
163 | 163 | if (!$this->compress || (strlen($directive) < $this->compress)) { |
164 | 164 | $directive_disp = $directive; |
165 | 165 | } else { |
166 | - $directive_disp = substr($directive, 0, $this->compress - 2) . '...'; |
|
166 | + $directive_disp = substr($directive, 0, $this->compress - 2).'...'; |
|
167 | 167 | $attr['title'] = $directive; |
168 | 168 | } |
169 | 169 | |
@@ -251,14 +251,14 @@ discard block |
||
251 | 251 | 'type' => 'checkbox', |
252 | 252 | 'value' => '1', |
253 | 253 | 'class' => 'null-toggle', |
254 | - 'name' => "$name" . "[Null_$ns.$directive]", |
|
254 | + 'name' => "$name"."[Null_$ns.$directive]", |
|
255 | 255 | 'id' => "$name:Null_$ns.$directive", |
256 | 256 | 'onclick' => "toggleWriteability('$name:$ns.$directive',checked)" // INLINE JAVASCRIPT!!!! |
257 | 257 | ); |
258 | 258 | if ($this->obj instanceof HTMLPurifier_Printer_ConfigForm_bool) { |
259 | 259 | // modify inline javascript slightly |
260 | 260 | $attr['onclick'] = |
261 | - "toggleWriteability('$name:Yes_$ns.$directive',checked);" . |
|
261 | + "toggleWriteability('$name:Yes_$ns.$directive',checked);". |
|
262 | 262 | "toggleWriteability('$name:No_$ns.$directive',checked)"; |
263 | 263 | } |
264 | 264 | if ($value === null) { |
@@ -327,7 +327,7 @@ discard block |
||
327 | 327 | case HTMLPurifier_VarParser::HASH: |
328 | 328 | $nvalue = ''; |
329 | 329 | foreach ($value as $i => $v) { |
330 | - $nvalue .= "$i:$v" . PHP_EOL; |
|
330 | + $nvalue .= "$i:$v".PHP_EOL; |
|
331 | 331 | } |
332 | 332 | $value = $nvalue; |
333 | 333 | break; |
@@ -340,7 +340,7 @@ discard block |
||
340 | 340 | $value = serialize($value); |
341 | 341 | } |
342 | 342 | $attr = array( |
343 | - 'name' => "$name" . "[$ns.$directive]", |
|
343 | + 'name' => "$name"."[$ns.$directive]", |
|
344 | 344 | 'id' => "$name:$ns.$directive" |
345 | 345 | ); |
346 | 346 | if ($value === null) { |
@@ -407,7 +407,7 @@ discard block |
||
407 | 407 | |
408 | 408 | $attr = array( |
409 | 409 | 'type' => 'radio', |
410 | - 'name' => "$name" . "[$ns.$directive]", |
|
410 | + 'name' => "$name"."[$ns.$directive]", |
|
411 | 411 | 'id' => "$name:Yes_$ns.$directive", |
412 | 412 | 'value' => '1' |
413 | 413 | ); |
@@ -426,7 +426,7 @@ discard block |
||
426 | 426 | |
427 | 427 | $attr = array( |
428 | 428 | 'type' => 'radio', |
429 | - 'name' => "$name" . "[$ns.$directive]", |
|
429 | + 'name' => "$name"."[$ns.$directive]", |
|
430 | 430 | 'id' => "$name:No_$ns.$directive", |
431 | 431 | 'value' => '0' |
432 | 432 | ); |
@@ -528,9 +528,10 @@ discard block |
||
528 | 528 | * being the current one) will be deleted. |
529 | 529 | * |
530 | 530 | * @param HTMLPurifier_Token|array|int|bool $token Token substitution value |
531 | - * @param HTMLPurifier_Injector|int $injector Injector that performed the substitution; default is if |
|
531 | + * @param integer $injector Injector that performed the substitution; default is if |
|
532 | 532 | * this is not an injector related operation. |
533 | 533 | * @throws HTMLPurifier_Exception |
534 | + * @return HTMLPurifier_Token |
|
534 | 535 | */ |
535 | 536 | protected function processToken($token, $injector = -1) |
536 | 537 | { |
@@ -577,6 +578,7 @@ discard block |
||
577 | 578 | * Inserts a token before the current token. Cursor now points to |
578 | 579 | * this token. You must reprocess after this. |
579 | 580 | * @param HTMLPurifier_Token $token |
581 | + * @return HTMLPurifier_Token |
|
580 | 582 | */ |
581 | 583 | private function insertBefore($token) |
582 | 584 | { |
@@ -151,8 +151,8 @@ |
||
151 | 151 | |
152 | 152 | // isset is in loop because $tokens size changes during loop exec |
153 | 153 | for (;; |
154 | - // only increment if we don't need to reprocess |
|
155 | - $reprocess ? $reprocess = false : $token = $zipper->next($token)) { |
|
154 | + // only increment if we don't need to reprocess |
|
155 | + $reprocess ? $reprocess = false : $token = $zipper->next($token)) { |
|
156 | 156 | |
157 | 157 | // check for a rewind |
158 | 158 | if (is_int($i)) { |
@@ -82,10 +82,10 @@ |
||
82 | 82 | $stack = array(); |
83 | 83 | |
84 | 84 | // member variables |
85 | - $this->stack =& $stack; |
|
86 | - $this->tokens =& $tokens; |
|
87 | - $this->token =& $token; |
|
88 | - $this->zipper =& $zipper; |
|
85 | + $this->stack = & $stack; |
|
86 | + $this->tokens = & $tokens; |
|
87 | + $this->token = & $token; |
|
88 | + $this->zipper = & $zipper; |
|
89 | 89 | $this->config = $config; |
90 | 90 | $this->context = $context; |
91 | 91 |
@@ -162,7 +162,9 @@ |
||
162 | 162 | $rewind_offset = $this->injectors[$i]->getRewindOffset(); |
163 | 163 | if (is_int($rewind_offset)) { |
164 | 164 | for ($j = 0; $j < $rewind_offset; $j++) { |
165 | - if (empty($zipper->front)) break; |
|
165 | + if (empty($zipper->front)) { |
|
166 | + break; |
|
167 | + } |
|
166 | 168 | $token = $zipper->prev($token); |
167 | 169 | // indicate that other injectors should not process this token, |
168 | 170 | // but we need to reprocess it |
@@ -25,6 +25,9 @@ discard block |
||
25 | 25 | |
26 | 26 | ### Simple Function Interface ### |
27 | 27 | |
28 | + /** |
|
29 | + * @param string $text |
|
30 | + */ |
|
28 | 31 | public static function defaultTransform($text) { |
29 | 32 | # |
30 | 33 | # Initialize the parser and return the result of its transform method. |
@@ -931,6 +934,10 @@ discard block |
||
931 | 934 | |
932 | 935 | protected $list_level = 0; |
933 | 936 | |
937 | + /** |
|
938 | + * @param string $list_str |
|
939 | + * @param string $marker_any_re |
|
940 | + */ |
|
934 | 941 | protected function processListItems($list_str, $marker_any_re) { |
935 | 942 | # |
936 | 943 | # Process the contents of a single ordered or unordered list, splitting it |
@@ -1034,6 +1041,9 @@ discard block |
||
1034 | 1041 | } |
1035 | 1042 | |
1036 | 1043 | |
1044 | + /** |
|
1045 | + * @param string $code |
|
1046 | + */ |
|
1037 | 1047 | protected function makeCodeSpan($code) { |
1038 | 1048 | # |
1039 | 1049 | # Create a code span markup for $code. Called from handleSpanToken. |
@@ -1311,6 +1321,9 @@ discard block |
||
1311 | 1321 | } |
1312 | 1322 | |
1313 | 1323 | |
1324 | + /** |
|
1325 | + * @return string |
|
1326 | + */ |
|
1314 | 1327 | protected function encodeAttribute($text) { |
1315 | 1328 | # |
1316 | 1329 | # Encode text for a double-quoted HTML attribute. This function |
@@ -1551,6 +1564,9 @@ discard block |
||
1551 | 1564 | # hanlde UTF-8 if the default function does not exist. |
1552 | 1565 | protected $utf8_strlen = 'mb_strlen'; |
1553 | 1566 | |
1567 | + /** |
|
1568 | + * @param string $text |
|
1569 | + */ |
|
1554 | 1570 | protected function detab($text) { |
1555 | 1571 | # |
1556 | 1572 | # Replace tabs with the appropriate amount of space. |
@@ -19,193 +19,193 @@ discard block |
||
19 | 19 | |
20 | 20 | class Markdown implements MarkdownInterface { |
21 | 21 | |
22 | - ### Version ### |
|
22 | + ### Version ### |
|
23 | 23 | |
24 | - const MARKDOWNLIB_VERSION = "1.5.0"; |
|
24 | + const MARKDOWNLIB_VERSION = "1.5.0"; |
|
25 | 25 | |
26 | - ### Simple Function Interface ### |
|
26 | + ### Simple Function Interface ### |
|
27 | 27 | |
28 | - public static function defaultTransform($text) { |
|
29 | - # |
|
30 | - # Initialize the parser and return the result of its transform method. |
|
31 | - # This will work fine for derived classes too. |
|
32 | - # |
|
33 | - # Take parser class on which this function was called. |
|
34 | - $parser_class = \get_called_class(); |
|
28 | + public static function defaultTransform($text) { |
|
29 | + # |
|
30 | + # Initialize the parser and return the result of its transform method. |
|
31 | + # This will work fine for derived classes too. |
|
32 | + # |
|
33 | + # Take parser class on which this function was called. |
|
34 | + $parser_class = \get_called_class(); |
|
35 | 35 | |
36 | - # try to take parser from the static parser list |
|
37 | - static $parser_list; |
|
38 | - $parser =& $parser_list[$parser_class]; |
|
36 | + # try to take parser from the static parser list |
|
37 | + static $parser_list; |
|
38 | + $parser =& $parser_list[$parser_class]; |
|
39 | 39 | |
40 | - # create the parser it not already set |
|
41 | - if (!$parser) |
|
42 | - $parser = new $parser_class; |
|
40 | + # create the parser it not already set |
|
41 | + if (!$parser) |
|
42 | + $parser = new $parser_class; |
|
43 | 43 | |
44 | - # Transform text using parser. |
|
45 | - return $parser->transform($text); |
|
46 | - } |
|
44 | + # Transform text using parser. |
|
45 | + return $parser->transform($text); |
|
46 | + } |
|
47 | 47 | |
48 | - ### Configuration Variables ### |
|
48 | + ### Configuration Variables ### |
|
49 | 49 | |
50 | - # Change to ">" for HTML output. |
|
51 | - public $empty_element_suffix = " />"; |
|
52 | - public $tab_width = 4; |
|
50 | + # Change to ">" for HTML output. |
|
51 | + public $empty_element_suffix = " />"; |
|
52 | + public $tab_width = 4; |
|
53 | 53 | |
54 | - # Change to `true` to disallow markup or entities. |
|
55 | - public $no_markup = false; |
|
56 | - public $no_entities = false; |
|
54 | + # Change to `true` to disallow markup or entities. |
|
55 | + public $no_markup = false; |
|
56 | + public $no_entities = false; |
|
57 | 57 | |
58 | - # Predefined urls and titles for reference links and images. |
|
59 | - public $predef_urls = array(); |
|
60 | - public $predef_titles = array(); |
|
61 | - |
|
62 | - # Optional filter function for URLs |
|
63 | - public $url_filter_func = null; |
|
64 | - |
|
65 | - # Optional header id="" generation callback function. |
|
66 | - public $header_id_func = null; |
|
67 | - |
|
68 | - # Class attribute to toggle "enhanced ordered list" behaviour |
|
69 | - # setting this to true will allow ordered lists to start from the index |
|
70 | - # number that is defined first. For example: |
|
71 | - # 2. List item two |
|
72 | - # 3. List item three |
|
73 | - # |
|
74 | - # becomes |
|
75 | - # <ol start="2"> |
|
76 | - # <li>List item two</li> |
|
77 | - # <li>List item three</li> |
|
78 | - # </ol> |
|
79 | - public $enhanced_ordered_list = false; |
|
80 | - |
|
81 | - ### Parser Implementation ### |
|
82 | - |
|
83 | - # Regex to match balanced [brackets]. |
|
84 | - # Needed to insert a maximum bracked depth while converting to PHP. |
|
85 | - protected $nested_brackets_depth = 6; |
|
86 | - protected $nested_brackets_re; |
|
58 | + # Predefined urls and titles for reference links and images. |
|
59 | + public $predef_urls = array(); |
|
60 | + public $predef_titles = array(); |
|
61 | + |
|
62 | + # Optional filter function for URLs |
|
63 | + public $url_filter_func = null; |
|
64 | + |
|
65 | + # Optional header id="" generation callback function. |
|
66 | + public $header_id_func = null; |
|
67 | + |
|
68 | + # Class attribute to toggle "enhanced ordered list" behaviour |
|
69 | + # setting this to true will allow ordered lists to start from the index |
|
70 | + # number that is defined first. For example: |
|
71 | + # 2. List item two |
|
72 | + # 3. List item three |
|
73 | + # |
|
74 | + # becomes |
|
75 | + # <ol start="2"> |
|
76 | + # <li>List item two</li> |
|
77 | + # <li>List item three</li> |
|
78 | + # </ol> |
|
79 | + public $enhanced_ordered_list = false; |
|
80 | + |
|
81 | + ### Parser Implementation ### |
|
82 | + |
|
83 | + # Regex to match balanced [brackets]. |
|
84 | + # Needed to insert a maximum bracked depth while converting to PHP. |
|
85 | + protected $nested_brackets_depth = 6; |
|
86 | + protected $nested_brackets_re; |
|
87 | 87 | |
88 | - protected $nested_url_parenthesis_depth = 4; |
|
89 | - protected $nested_url_parenthesis_re; |
|
88 | + protected $nested_url_parenthesis_depth = 4; |
|
89 | + protected $nested_url_parenthesis_re; |
|
90 | 90 | |
91 | - # Table of hash values for escaped characters: |
|
92 | - protected $escape_chars = '\`*_{}[]()>#+-.!'; |
|
93 | - protected $escape_chars_re; |
|
91 | + # Table of hash values for escaped characters: |
|
92 | + protected $escape_chars = '\`*_{}[]()>#+-.!'; |
|
93 | + protected $escape_chars_re; |
|
94 | 94 | |
95 | 95 | |
96 | - public function __construct() { |
|
97 | - # |
|
98 | - # Constructor function. Initialize appropriate member variables. |
|
99 | - # |
|
100 | - $this->_initDetab(); |
|
101 | - $this->prepareItalicsAndBold(); |
|
96 | + public function __construct() { |
|
97 | + # |
|
98 | + # Constructor function. Initialize appropriate member variables. |
|
99 | + # |
|
100 | + $this->_initDetab(); |
|
101 | + $this->prepareItalicsAndBold(); |
|
102 | 102 | |
103 | - $this->nested_brackets_re = |
|
104 | - str_repeat('(?>[^\[\]]+|\[', $this->nested_brackets_depth). |
|
105 | - str_repeat('\])*', $this->nested_brackets_depth); |
|
103 | + $this->nested_brackets_re = |
|
104 | + str_repeat('(?>[^\[\]]+|\[', $this->nested_brackets_depth). |
|
105 | + str_repeat('\])*', $this->nested_brackets_depth); |
|
106 | 106 | |
107 | - $this->nested_url_parenthesis_re = |
|
108 | - str_repeat('(?>[^()\s]+|\(', $this->nested_url_parenthesis_depth). |
|
109 | - str_repeat('(?>\)))*', $this->nested_url_parenthesis_depth); |
|
107 | + $this->nested_url_parenthesis_re = |
|
108 | + str_repeat('(?>[^()\s]+|\(', $this->nested_url_parenthesis_depth). |
|
109 | + str_repeat('(?>\)))*', $this->nested_url_parenthesis_depth); |
|
110 | 110 | |
111 | - $this->escape_chars_re = '['.preg_quote($this->escape_chars).']'; |
|
111 | + $this->escape_chars_re = '['.preg_quote($this->escape_chars).']'; |
|
112 | 112 | |
113 | - # Sort document, block, and span gamut in ascendent priority order. |
|
114 | - asort($this->document_gamut); |
|
115 | - asort($this->block_gamut); |
|
116 | - asort($this->span_gamut); |
|
117 | - } |
|
113 | + # Sort document, block, and span gamut in ascendent priority order. |
|
114 | + asort($this->document_gamut); |
|
115 | + asort($this->block_gamut); |
|
116 | + asort($this->span_gamut); |
|
117 | + } |
|
118 | 118 | |
119 | 119 | |
120 | - # Internal hashes used during transformation. |
|
121 | - protected $urls = array(); |
|
122 | - protected $titles = array(); |
|
123 | - protected $html_hashes = array(); |
|
120 | + # Internal hashes used during transformation. |
|
121 | + protected $urls = array(); |
|
122 | + protected $titles = array(); |
|
123 | + protected $html_hashes = array(); |
|
124 | 124 | |
125 | - # Status flag to avoid invalid nesting. |
|
126 | - protected $in_anchor = false; |
|
125 | + # Status flag to avoid invalid nesting. |
|
126 | + protected $in_anchor = false; |
|
127 | 127 | |
128 | 128 | |
129 | - protected function setup() { |
|
130 | - # |
|
131 | - # Called before the transformation process starts to setup parser |
|
132 | - # states. |
|
133 | - # |
|
134 | - # Clear global hashes. |
|
135 | - $this->urls = $this->predef_urls; |
|
136 | - $this->titles = $this->predef_titles; |
|
137 | - $this->html_hashes = array(); |
|
129 | + protected function setup() { |
|
130 | + # |
|
131 | + # Called before the transformation process starts to setup parser |
|
132 | + # states. |
|
133 | + # |
|
134 | + # Clear global hashes. |
|
135 | + $this->urls = $this->predef_urls; |
|
136 | + $this->titles = $this->predef_titles; |
|
137 | + $this->html_hashes = array(); |
|
138 | 138 | |
139 | - $this->in_anchor = false; |
|
140 | - } |
|
139 | + $this->in_anchor = false; |
|
140 | + } |
|
141 | 141 | |
142 | - protected function teardown() { |
|
143 | - # |
|
144 | - # Called after the transformation process to clear any variable |
|
145 | - # which may be taking up memory unnecessarly. |
|
146 | - # |
|
147 | - $this->urls = array(); |
|
148 | - $this->titles = array(); |
|
149 | - $this->html_hashes = array(); |
|
150 | - } |
|
151 | - |
|
152 | - |
|
153 | - public function transform($text) { |
|
154 | - # |
|
155 | - # Main function. Performs some preprocessing on the input text |
|
156 | - # and pass it through the document gamut. |
|
157 | - # |
|
158 | - $this->setup(); |
|
142 | + protected function teardown() { |
|
143 | + # |
|
144 | + # Called after the transformation process to clear any variable |
|
145 | + # which may be taking up memory unnecessarly. |
|
146 | + # |
|
147 | + $this->urls = array(); |
|
148 | + $this->titles = array(); |
|
149 | + $this->html_hashes = array(); |
|
150 | + } |
|
151 | + |
|
152 | + |
|
153 | + public function transform($text) { |
|
154 | + # |
|
155 | + # Main function. Performs some preprocessing on the input text |
|
156 | + # and pass it through the document gamut. |
|
157 | + # |
|
158 | + $this->setup(); |
|
159 | 159 | |
160 | - # Remove UTF-8 BOM and marker character in input, if present. |
|
161 | - $text = preg_replace('{^\xEF\xBB\xBF|\x1A}', '', $text); |
|
160 | + # Remove UTF-8 BOM and marker character in input, if present. |
|
161 | + $text = preg_replace('{^\xEF\xBB\xBF|\x1A}', '', $text); |
|
162 | 162 | |
163 | - # Standardize line endings: |
|
164 | - # DOS to Unix and Mac to Unix |
|
165 | - $text = preg_replace('{\r\n?}', "\n", $text); |
|
163 | + # Standardize line endings: |
|
164 | + # DOS to Unix and Mac to Unix |
|
165 | + $text = preg_replace('{\r\n?}', "\n", $text); |
|
166 | 166 | |
167 | - # Make sure $text ends with a couple of newlines: |
|
168 | - $text .= "\n\n"; |
|
167 | + # Make sure $text ends with a couple of newlines: |
|
168 | + $text .= "\n\n"; |
|
169 | 169 | |
170 | - # Convert all tabs to spaces. |
|
171 | - $text = $this->detab($text); |
|
170 | + # Convert all tabs to spaces. |
|
171 | + $text = $this->detab($text); |
|
172 | 172 | |
173 | - # Turn block-level HTML blocks into hash entries |
|
174 | - $text = $this->hashHTMLBlocks($text); |
|
173 | + # Turn block-level HTML blocks into hash entries |
|
174 | + $text = $this->hashHTMLBlocks($text); |
|
175 | 175 | |
176 | - # Strip any lines consisting only of spaces and tabs. |
|
177 | - # This makes subsequent regexen easier to write, because we can |
|
178 | - # match consecutive blank lines with /\n+/ instead of something |
|
179 | - # contorted like /[ ]*\n+/ . |
|
180 | - $text = preg_replace('/^[ ]+$/m', '', $text); |
|
176 | + # Strip any lines consisting only of spaces and tabs. |
|
177 | + # This makes subsequent regexen easier to write, because we can |
|
178 | + # match consecutive blank lines with /\n+/ instead of something |
|
179 | + # contorted like /[ ]*\n+/ . |
|
180 | + $text = preg_replace('/^[ ]+$/m', '', $text); |
|
181 | 181 | |
182 | - # Run document gamut methods. |
|
183 | - foreach ($this->document_gamut as $method => $priority) { |
|
184 | - $text = $this->$method($text); |
|
185 | - } |
|
182 | + # Run document gamut methods. |
|
183 | + foreach ($this->document_gamut as $method => $priority) { |
|
184 | + $text = $this->$method($text); |
|
185 | + } |
|
186 | 186 | |
187 | - $this->teardown(); |
|
187 | + $this->teardown(); |
|
188 | 188 | |
189 | - return $text . "\n"; |
|
190 | - } |
|
189 | + return $text . "\n"; |
|
190 | + } |
|
191 | 191 | |
192 | - protected $document_gamut = array( |
|
193 | - # Strip link definitions, store in hashes. |
|
194 | - "stripLinkDefinitions" => 20, |
|
192 | + protected $document_gamut = array( |
|
193 | + # Strip link definitions, store in hashes. |
|
194 | + "stripLinkDefinitions" => 20, |
|
195 | 195 | |
196 | - "runBasicBlockGamut" => 30, |
|
197 | - ); |
|
196 | + "runBasicBlockGamut" => 30, |
|
197 | + ); |
|
198 | 198 | |
199 | 199 | |
200 | - protected function stripLinkDefinitions($text) { |
|
201 | - # |
|
202 | - # Strips link definitions from text, stores the URLs and titles in |
|
203 | - # hash references. |
|
204 | - # |
|
205 | - $less_than_tab = $this->tab_width - 1; |
|
200 | + protected function stripLinkDefinitions($text) { |
|
201 | + # |
|
202 | + # Strips link definitions from text, stores the URLs and titles in |
|
203 | + # hash references. |
|
204 | + # |
|
205 | + $less_than_tab = $this->tab_width - 1; |
|
206 | 206 | |
207 | - # Link defs are in the form: ^[id]: url "optional title" |
|
208 | - $text = preg_replace_callback('{ |
|
207 | + # Link defs are in the form: ^[id]: url "optional title" |
|
208 | + $text = preg_replace_callback('{ |
|
209 | 209 | ^[ ]{0,'.$less_than_tab.'}\[(.+)\][ ]?: # id = $1 |
210 | 210 | [ ]* |
211 | 211 | \n? # maybe *one* newline |
@@ -227,46 +227,46 @@ discard block |
||
227 | 227 | )? # title is optional |
228 | 228 | (?:\n+|\Z) |
229 | 229 | }xm', |
230 | - array($this, '_stripLinkDefinitions_callback'), |
|
231 | - $text); |
|
232 | - return $text; |
|
233 | - } |
|
234 | - protected function _stripLinkDefinitions_callback($matches) { |
|
235 | - $link_id = strtolower($matches[1]); |
|
236 | - $url = $matches[2] == '' ? $matches[3] : $matches[2]; |
|
237 | - $this->urls[$link_id] = $url; |
|
238 | - $this->titles[$link_id] =& $matches[4]; |
|
239 | - return ''; # String that will replace the block |
|
240 | - } |
|
241 | - |
|
242 | - |
|
243 | - protected function hashHTMLBlocks($text) { |
|
244 | - if ($this->no_markup) return $text; |
|
245 | - |
|
246 | - $less_than_tab = $this->tab_width - 1; |
|
247 | - |
|
248 | - # Hashify HTML blocks: |
|
249 | - # We only want to do this for block-level HTML tags, such as headers, |
|
250 | - # lists, and tables. That's because we still want to wrap <p>s around |
|
251 | - # "paragraphs" that are wrapped in non-block-level tags, such as anchors, |
|
252 | - # phrase emphasis, and spans. The list of tags we're looking for is |
|
253 | - # hard-coded: |
|
254 | - # |
|
255 | - # * List "a" is made of tags which can be both inline or block-level. |
|
256 | - # These will be treated block-level when the start tag is alone on |
|
257 | - # its line, otherwise they're not matched here and will be taken as |
|
258 | - # inline later. |
|
259 | - # * List "b" is made of tags which are always block-level; |
|
260 | - # |
|
261 | - $block_tags_a_re = 'ins|del'; |
|
262 | - $block_tags_b_re = 'p|div|h[1-6]|blockquote|pre|table|dl|ol|ul|address|'. |
|
263 | - 'script|noscript|style|form|fieldset|iframe|math|svg|'. |
|
264 | - 'article|section|nav|aside|hgroup|header|footer|'. |
|
265 | - 'figure'; |
|
266 | - |
|
267 | - # Regular expression for the content of a block tag. |
|
268 | - $nested_tags_level = 4; |
|
269 | - $attr = ' |
|
230 | + array($this, '_stripLinkDefinitions_callback'), |
|
231 | + $text); |
|
232 | + return $text; |
|
233 | + } |
|
234 | + protected function _stripLinkDefinitions_callback($matches) { |
|
235 | + $link_id = strtolower($matches[1]); |
|
236 | + $url = $matches[2] == '' ? $matches[3] : $matches[2]; |
|
237 | + $this->urls[$link_id] = $url; |
|
238 | + $this->titles[$link_id] =& $matches[4]; |
|
239 | + return ''; # String that will replace the block |
|
240 | + } |
|
241 | + |
|
242 | + |
|
243 | + protected function hashHTMLBlocks($text) { |
|
244 | + if ($this->no_markup) return $text; |
|
245 | + |
|
246 | + $less_than_tab = $this->tab_width - 1; |
|
247 | + |
|
248 | + # Hashify HTML blocks: |
|
249 | + # We only want to do this for block-level HTML tags, such as headers, |
|
250 | + # lists, and tables. That's because we still want to wrap <p>s around |
|
251 | + # "paragraphs" that are wrapped in non-block-level tags, such as anchors, |
|
252 | + # phrase emphasis, and spans. The list of tags we're looking for is |
|
253 | + # hard-coded: |
|
254 | + # |
|
255 | + # * List "a" is made of tags which can be both inline or block-level. |
|
256 | + # These will be treated block-level when the start tag is alone on |
|
257 | + # its line, otherwise they're not matched here and will be taken as |
|
258 | + # inline later. |
|
259 | + # * List "b" is made of tags which are always block-level; |
|
260 | + # |
|
261 | + $block_tags_a_re = 'ins|del'; |
|
262 | + $block_tags_b_re = 'p|div|h[1-6]|blockquote|pre|table|dl|ol|ul|address|'. |
|
263 | + 'script|noscript|style|form|fieldset|iframe|math|svg|'. |
|
264 | + 'article|section|nav|aside|hgroup|header|footer|'. |
|
265 | + 'figure'; |
|
266 | + |
|
267 | + # Regular expression for the content of a block tag. |
|
268 | + $nested_tags_level = 4; |
|
269 | + $attr = ' |
|
270 | 270 | (?> # optional tag attributes |
271 | 271 | \s # starts with whitespace |
272 | 272 | (?> |
@@ -280,8 +280,8 @@ discard block |
||
280 | 280 | )* |
281 | 281 | )? |
282 | 282 | '; |
283 | - $content = |
|
284 | - str_repeat(' |
|
283 | + $content = |
|
284 | + str_repeat(' |
|
285 | 285 | (?> |
286 | 286 | [^<]+ # content without tag |
287 | 287 | | |
@@ -291,29 +291,29 @@ discard block |
||
291 | 291 | /> |
292 | 292 | | |
293 | 293 | >', $nested_tags_level). # end of opening tag |
294 | - '.*?'. # last level nested tag content |
|
295 | - str_repeat(' |
|
294 | + '.*?'. # last level nested tag content |
|
295 | + str_repeat(' |
|
296 | 296 | </\2\s*> # closing nested tag |
297 | 297 | ) |
298 | 298 | | |
299 | 299 | <(?!/\2\s*> # other tags with a different name |
300 | 300 | ) |
301 | 301 | )*', |
302 | - $nested_tags_level); |
|
303 | - $content2 = str_replace('\2', '\3', $content); |
|
304 | - |
|
305 | - # First, look for nested blocks, e.g.: |
|
306 | - # <div> |
|
307 | - # <div> |
|
308 | - # tags for inner block must be indented. |
|
309 | - # </div> |
|
310 | - # </div> |
|
311 | - # |
|
312 | - # The outermost tags must start at the left margin for this to match, and |
|
313 | - # the inner nested divs must be indented. |
|
314 | - # We need to do this before the next, more liberal match, because the next |
|
315 | - # match will start at the first `<div>` and stop at the first `</div>`. |
|
316 | - $text = preg_replace_callback('{(?> |
|
302 | + $nested_tags_level); |
|
303 | + $content2 = str_replace('\2', '\3', $content); |
|
304 | + |
|
305 | + # First, look for nested blocks, e.g.: |
|
306 | + # <div> |
|
307 | + # <div> |
|
308 | + # tags for inner block must be indented. |
|
309 | + # </div> |
|
310 | + # </div> |
|
311 | + # |
|
312 | + # The outermost tags must start at the left margin for this to match, and |
|
313 | + # the inner nested divs must be indented. |
|
314 | + # We need to do this before the next, more liberal match, because the next |
|
315 | + # match will start at the first `<div>` and stop at the first `</div>`. |
|
316 | + $text = preg_replace_callback('{(?> |
|
317 | 317 | (?> |
318 | 318 | (?<=\n) # Starting on its own line |
319 | 319 | | # or |
@@ -374,97 +374,97 @@ discard block |
||
374 | 374 | |
375 | 375 | ) |
376 | 376 | )}Sxmi', |
377 | - array($this, '_hashHTMLBlocks_callback'), |
|
378 | - $text); |
|
379 | - |
|
380 | - return $text; |
|
381 | - } |
|
382 | - protected function _hashHTMLBlocks_callback($matches) { |
|
383 | - $text = $matches[1]; |
|
384 | - $key = $this->hashBlock($text); |
|
385 | - return "\n\n$key\n\n"; |
|
386 | - } |
|
377 | + array($this, '_hashHTMLBlocks_callback'), |
|
378 | + $text); |
|
379 | + |
|
380 | + return $text; |
|
381 | + } |
|
382 | + protected function _hashHTMLBlocks_callback($matches) { |
|
383 | + $text = $matches[1]; |
|
384 | + $key = $this->hashBlock($text); |
|
385 | + return "\n\n$key\n\n"; |
|
386 | + } |
|
387 | 387 | |
388 | 388 | |
389 | - protected function hashPart($text, $boundary = 'X') { |
|
390 | - # |
|
391 | - # Called whenever a tag must be hashed when a function insert an atomic |
|
392 | - # element in the text stream. Passing $text to through this function gives |
|
393 | - # a unique text-token which will be reverted back when calling unhash. |
|
394 | - # |
|
395 | - # The $boundary argument specify what character should be used to surround |
|
396 | - # the token. By convension, "B" is used for block elements that needs not |
|
397 | - # to be wrapped into paragraph tags at the end, ":" is used for elements |
|
398 | - # that are word separators and "X" is used in the general case. |
|
399 | - # |
|
400 | - # Swap back any tag hash found in $text so we do not have to `unhash` |
|
401 | - # multiple times at the end. |
|
402 | - $text = $this->unhash($text); |
|
389 | + protected function hashPart($text, $boundary = 'X') { |
|
390 | + # |
|
391 | + # Called whenever a tag must be hashed when a function insert an atomic |
|
392 | + # element in the text stream. Passing $text to through this function gives |
|
393 | + # a unique text-token which will be reverted back when calling unhash. |
|
394 | + # |
|
395 | + # The $boundary argument specify what character should be used to surround |
|
396 | + # the token. By convension, "B" is used for block elements that needs not |
|
397 | + # to be wrapped into paragraph tags at the end, ":" is used for elements |
|
398 | + # that are word separators and "X" is used in the general case. |
|
399 | + # |
|
400 | + # Swap back any tag hash found in $text so we do not have to `unhash` |
|
401 | + # multiple times at the end. |
|
402 | + $text = $this->unhash($text); |
|
403 | 403 | |
404 | - # Then hash the block. |
|
405 | - static $i = 0; |
|
406 | - $key = "$boundary\x1A" . ++$i . $boundary; |
|
407 | - $this->html_hashes[$key] = $text; |
|
408 | - return $key; # String that will replace the tag. |
|
409 | - } |
|
410 | - |
|
411 | - |
|
412 | - protected function hashBlock($text) { |
|
413 | - # |
|
414 | - # Shortcut function for hashPart with block-level boundaries. |
|
415 | - # |
|
416 | - return $this->hashPart($text, 'B'); |
|
417 | - } |
|
418 | - |
|
419 | - |
|
420 | - protected $block_gamut = array( |
|
421 | - # |
|
422 | - # These are all the transformations that form block-level |
|
423 | - # tags like paragraphs, headers, and list items. |
|
424 | - # |
|
425 | - "doHeaders" => 10, |
|
426 | - "doHorizontalRules" => 20, |
|
404 | + # Then hash the block. |
|
405 | + static $i = 0; |
|
406 | + $key = "$boundary\x1A" . ++$i . $boundary; |
|
407 | + $this->html_hashes[$key] = $text; |
|
408 | + return $key; # String that will replace the tag. |
|
409 | + } |
|
410 | + |
|
411 | + |
|
412 | + protected function hashBlock($text) { |
|
413 | + # |
|
414 | + # Shortcut function for hashPart with block-level boundaries. |
|
415 | + # |
|
416 | + return $this->hashPart($text, 'B'); |
|
417 | + } |
|
418 | + |
|
419 | + |
|
420 | + protected $block_gamut = array( |
|
421 | + # |
|
422 | + # These are all the transformations that form block-level |
|
423 | + # tags like paragraphs, headers, and list items. |
|
424 | + # |
|
425 | + "doHeaders" => 10, |
|
426 | + "doHorizontalRules" => 20, |
|
427 | 427 | |
428 | - "doLists" => 40, |
|
429 | - "doCodeBlocks" => 50, |
|
430 | - "doBlockQuotes" => 60, |
|
431 | - ); |
|
432 | - |
|
433 | - protected function runBlockGamut($text) { |
|
434 | - # |
|
435 | - # Run block gamut tranformations. |
|
436 | - # |
|
437 | - # We need to escape raw HTML in Markdown source before doing anything |
|
438 | - # else. This need to be done for each block, and not only at the |
|
439 | - # begining in the Markdown function since hashed blocks can be part of |
|
440 | - # list items and could have been indented. Indented blocks would have |
|
441 | - # been seen as a code block in a previous pass of hashHTMLBlocks. |
|
442 | - $text = $this->hashHTMLBlocks($text); |
|
428 | + "doLists" => 40, |
|
429 | + "doCodeBlocks" => 50, |
|
430 | + "doBlockQuotes" => 60, |
|
431 | + ); |
|
432 | + |
|
433 | + protected function runBlockGamut($text) { |
|
434 | + # |
|
435 | + # Run block gamut tranformations. |
|
436 | + # |
|
437 | + # We need to escape raw HTML in Markdown source before doing anything |
|
438 | + # else. This need to be done for each block, and not only at the |
|
439 | + # begining in the Markdown function since hashed blocks can be part of |
|
440 | + # list items and could have been indented. Indented blocks would have |
|
441 | + # been seen as a code block in a previous pass of hashHTMLBlocks. |
|
442 | + $text = $this->hashHTMLBlocks($text); |
|
443 | 443 | |
444 | - return $this->runBasicBlockGamut($text); |
|
445 | - } |
|
444 | + return $this->runBasicBlockGamut($text); |
|
445 | + } |
|
446 | 446 | |
447 | - protected function runBasicBlockGamut($text) { |
|
448 | - # |
|
449 | - # Run block gamut tranformations, without hashing HTML blocks. This is |
|
450 | - # useful when HTML blocks are known to be already hashed, like in the first |
|
451 | - # whole-document pass. |
|
452 | - # |
|
453 | - foreach ($this->block_gamut as $method => $priority) { |
|
454 | - $text = $this->$method($text); |
|
455 | - } |
|
447 | + protected function runBasicBlockGamut($text) { |
|
448 | + # |
|
449 | + # Run block gamut tranformations, without hashing HTML blocks. This is |
|
450 | + # useful when HTML blocks are known to be already hashed, like in the first |
|
451 | + # whole-document pass. |
|
452 | + # |
|
453 | + foreach ($this->block_gamut as $method => $priority) { |
|
454 | + $text = $this->$method($text); |
|
455 | + } |
|
456 | 456 | |
457 | - # Finally form paragraph and restore hashed blocks. |
|
458 | - $text = $this->formParagraphs($text); |
|
457 | + # Finally form paragraph and restore hashed blocks. |
|
458 | + $text = $this->formParagraphs($text); |
|
459 | 459 | |
460 | - return $text; |
|
461 | - } |
|
460 | + return $text; |
|
461 | + } |
|
462 | 462 | |
463 | 463 | |
464 | - protected function doHorizontalRules($text) { |
|
465 | - # Do Horizontal Rules: |
|
466 | - return preg_replace( |
|
467 | - '{ |
|
464 | + protected function doHorizontalRules($text) { |
|
465 | + # Do Horizontal Rules: |
|
466 | + return preg_replace( |
|
467 | + '{ |
|
468 | 468 | ^[ ]{0,3} # Leading space |
469 | 469 | ([-*_]) # $1: First marker |
470 | 470 | (?> # Repeated marker group |
@@ -474,68 +474,68 @@ discard block |
||
474 | 474 | [ ]* # Tailing spaces |
475 | 475 | $ # End of line. |
476 | 476 | }mx', |
477 | - "\n".$this->hashBlock("<hr$this->empty_element_suffix")."\n", |
|
478 | - $text); |
|
479 | - } |
|
480 | - |
|
481 | - |
|
482 | - protected $span_gamut = array( |
|
483 | - # |
|
484 | - # These are all the transformations that occur *within* block-level |
|
485 | - # tags like paragraphs, headers, and list items. |
|
486 | - # |
|
487 | - # Process character escapes, code spans, and inline HTML |
|
488 | - # in one shot. |
|
489 | - "parseSpan" => -30, |
|
490 | - |
|
491 | - # Process anchor and image tags. Images must come first, |
|
492 | - # because ![foo][f] looks like an anchor. |
|
493 | - "doImages" => 10, |
|
494 | - "doAnchors" => 20, |
|
477 | + "\n".$this->hashBlock("<hr$this->empty_element_suffix")."\n", |
|
478 | + $text); |
|
479 | + } |
|
480 | + |
|
481 | + |
|
482 | + protected $span_gamut = array( |
|
483 | + # |
|
484 | + # These are all the transformations that occur *within* block-level |
|
485 | + # tags like paragraphs, headers, and list items. |
|
486 | + # |
|
487 | + # Process character escapes, code spans, and inline HTML |
|
488 | + # in one shot. |
|
489 | + "parseSpan" => -30, |
|
490 | + |
|
491 | + # Process anchor and image tags. Images must come first, |
|
492 | + # because ![foo][f] looks like an anchor. |
|
493 | + "doImages" => 10, |
|
494 | + "doAnchors" => 20, |
|
495 | 495 | |
496 | - # Make links out of things like `<http://example.com/>` |
|
497 | - # Must come after doAnchors, because you can use < and > |
|
498 | - # delimiters in inline links like [this](<url>). |
|
499 | - "doAutoLinks" => 30, |
|
500 | - "encodeAmpsAndAngles" => 40, |
|
501 | - |
|
502 | - "doItalicsAndBold" => 50, |
|
503 | - "doHardBreaks" => 60, |
|
504 | - ); |
|
505 | - |
|
506 | - protected function runSpanGamut($text) { |
|
507 | - # |
|
508 | - # Run span gamut tranformations. |
|
509 | - # |
|
510 | - foreach ($this->span_gamut as $method => $priority) { |
|
511 | - $text = $this->$method($text); |
|
512 | - } |
|
513 | - |
|
514 | - return $text; |
|
515 | - } |
|
496 | + # Make links out of things like `<http://example.com/>` |
|
497 | + # Must come after doAnchors, because you can use < and > |
|
498 | + # delimiters in inline links like [this](<url>). |
|
499 | + "doAutoLinks" => 30, |
|
500 | + "encodeAmpsAndAngles" => 40, |
|
501 | + |
|
502 | + "doItalicsAndBold" => 50, |
|
503 | + "doHardBreaks" => 60, |
|
504 | + ); |
|
505 | + |
|
506 | + protected function runSpanGamut($text) { |
|
507 | + # |
|
508 | + # Run span gamut tranformations. |
|
509 | + # |
|
510 | + foreach ($this->span_gamut as $method => $priority) { |
|
511 | + $text = $this->$method($text); |
|
512 | + } |
|
513 | + |
|
514 | + return $text; |
|
515 | + } |
|
516 | 516 | |
517 | 517 | |
518 | - protected function doHardBreaks($text) { |
|
519 | - # Do hard breaks: |
|
520 | - return preg_replace_callback('/ {2,}\n/', |
|
521 | - array($this, '_doHardBreaks_callback'), $text); |
|
522 | - } |
|
523 | - protected function _doHardBreaks_callback($matches) { |
|
524 | - return $this->hashPart("<br$this->empty_element_suffix\n"); |
|
525 | - } |
|
526 | - |
|
527 | - |
|
528 | - protected function doAnchors($text) { |
|
529 | - # |
|
530 | - # Turn Markdown link shortcuts into XHTML <a> tags. |
|
531 | - # |
|
532 | - if ($this->in_anchor) return $text; |
|
533 | - $this->in_anchor = true; |
|
518 | + protected function doHardBreaks($text) { |
|
519 | + # Do hard breaks: |
|
520 | + return preg_replace_callback('/ {2,}\n/', |
|
521 | + array($this, '_doHardBreaks_callback'), $text); |
|
522 | + } |
|
523 | + protected function _doHardBreaks_callback($matches) { |
|
524 | + return $this->hashPart("<br$this->empty_element_suffix\n"); |
|
525 | + } |
|
526 | + |
|
527 | + |
|
528 | + protected function doAnchors($text) { |
|
529 | + # |
|
530 | + # Turn Markdown link shortcuts into XHTML <a> tags. |
|
531 | + # |
|
532 | + if ($this->in_anchor) return $text; |
|
533 | + $this->in_anchor = true; |
|
534 | 534 | |
535 | - # |
|
536 | - # First, handle reference-style links: [link text] [id] |
|
537 | - # |
|
538 | - $text = preg_replace_callback('{ |
|
535 | + # |
|
536 | + # First, handle reference-style links: [link text] [id] |
|
537 | + # |
|
538 | + $text = preg_replace_callback('{ |
|
539 | 539 | ( # wrap whole match in $1 |
540 | 540 | \[ |
541 | 541 | ('.$this->nested_brackets_re.') # link text = $2 |
@@ -549,12 +549,12 @@ discard block |
||
549 | 549 | \] |
550 | 550 | ) |
551 | 551 | }xs', |
552 | - array($this, '_doAnchors_reference_callback'), $text); |
|
552 | + array($this, '_doAnchors_reference_callback'), $text); |
|
553 | 553 | |
554 | - # |
|
555 | - # Next, inline-style links: [link text](url "optional title") |
|
556 | - # |
|
557 | - $text = preg_replace_callback('{ |
|
554 | + # |
|
555 | + # Next, inline-style links: [link text](url "optional title") |
|
556 | + # |
|
557 | + $text = preg_replace_callback('{ |
|
558 | 558 | ( # wrap whole match in $1 |
559 | 559 | \[ |
560 | 560 | ('.$this->nested_brackets_re.') # link text = $2 |
@@ -576,94 +576,94 @@ discard block |
||
576 | 576 | \) |
577 | 577 | ) |
578 | 578 | }xs', |
579 | - array($this, '_doAnchors_inline_callback'), $text); |
|
580 | - |
|
581 | - # |
|
582 | - # Last, handle reference-style shortcuts: [link text] |
|
583 | - # These must come last in case you've also got [link text][1] |
|
584 | - # or [link text](/foo) |
|
585 | - # |
|
586 | - $text = preg_replace_callback('{ |
|
579 | + array($this, '_doAnchors_inline_callback'), $text); |
|
580 | + |
|
581 | + # |
|
582 | + # Last, handle reference-style shortcuts: [link text] |
|
583 | + # These must come last in case you've also got [link text][1] |
|
584 | + # or [link text](/foo) |
|
585 | + # |
|
586 | + $text = preg_replace_callback('{ |
|
587 | 587 | ( # wrap whole match in $1 |
588 | 588 | \[ |
589 | 589 | ([^\[\]]+) # link text = $2; can\'t contain [ or ] |
590 | 590 | \] |
591 | 591 | ) |
592 | 592 | }xs', |
593 | - array($this, '_doAnchors_reference_callback'), $text); |
|
594 | - |
|
595 | - $this->in_anchor = false; |
|
596 | - return $text; |
|
597 | - } |
|
598 | - protected function _doAnchors_reference_callback($matches) { |
|
599 | - $whole_match = $matches[1]; |
|
600 | - $link_text = $matches[2]; |
|
601 | - $link_id =& $matches[3]; |
|
602 | - |
|
603 | - if ($link_id == "") { |
|
604 | - # for shortcut links like [this][] or [this]. |
|
605 | - $link_id = $link_text; |
|
606 | - } |
|
593 | + array($this, '_doAnchors_reference_callback'), $text); |
|
594 | + |
|
595 | + $this->in_anchor = false; |
|
596 | + return $text; |
|
597 | + } |
|
598 | + protected function _doAnchors_reference_callback($matches) { |
|
599 | + $whole_match = $matches[1]; |
|
600 | + $link_text = $matches[2]; |
|
601 | + $link_id =& $matches[3]; |
|
602 | + |
|
603 | + if ($link_id == "") { |
|
604 | + # for shortcut links like [this][] or [this]. |
|
605 | + $link_id = $link_text; |
|
606 | + } |
|
607 | 607 | |
608 | - # lower-case and turn embedded newlines into spaces |
|
609 | - $link_id = strtolower($link_id); |
|
610 | - $link_id = preg_replace('{[ ]?\n}', ' ', $link_id); |
|
608 | + # lower-case and turn embedded newlines into spaces |
|
609 | + $link_id = strtolower($link_id); |
|
610 | + $link_id = preg_replace('{[ ]?\n}', ' ', $link_id); |
|
611 | 611 | |
612 | - if (isset($this->urls[$link_id])) { |
|
613 | - $url = $this->urls[$link_id]; |
|
614 | - $url = $this->encodeURLAttribute($url); |
|
612 | + if (isset($this->urls[$link_id])) { |
|
613 | + $url = $this->urls[$link_id]; |
|
614 | + $url = $this->encodeURLAttribute($url); |
|
615 | 615 | |
616 | - $result = "<a href=\"$url\""; |
|
617 | - if ( isset( $this->titles[$link_id] ) ) { |
|
618 | - $title = $this->titles[$link_id]; |
|
619 | - $title = $this->encodeAttribute($title); |
|
620 | - $result .= " title=\"$title\""; |
|
621 | - } |
|
616 | + $result = "<a href=\"$url\""; |
|
617 | + if ( isset( $this->titles[$link_id] ) ) { |
|
618 | + $title = $this->titles[$link_id]; |
|
619 | + $title = $this->encodeAttribute($title); |
|
620 | + $result .= " title=\"$title\""; |
|
621 | + } |
|
622 | 622 | |
623 | - $link_text = $this->runSpanGamut($link_text); |
|
624 | - $result .= ">$link_text</a>"; |
|
625 | - $result = $this->hashPart($result); |
|
626 | - } |
|
627 | - else { |
|
628 | - $result = $whole_match; |
|
629 | - } |
|
630 | - return $result; |
|
631 | - } |
|
632 | - protected function _doAnchors_inline_callback($matches) { |
|
633 | - $whole_match = $matches[1]; |
|
634 | - $link_text = $this->runSpanGamut($matches[2]); |
|
635 | - $url = $matches[3] == '' ? $matches[4] : $matches[3]; |
|
636 | - $title =& $matches[7]; |
|
637 | - |
|
638 | - // if the URL was of the form <s p a c e s> it got caught by the HTML |
|
639 | - // tag parser and hashed. Need to reverse the process before using the URL. |
|
640 | - $unhashed = $this->unhash($url); |
|
641 | - if ($unhashed != $url) |
|
642 | - $url = preg_replace('/^<(.*)>$/', '\1', $unhashed); |
|
643 | - |
|
644 | - $url = $this->encodeURLAttribute($url); |
|
645 | - |
|
646 | - $result = "<a href=\"$url\""; |
|
647 | - if (isset($title)) { |
|
648 | - $title = $this->encodeAttribute($title); |
|
649 | - $result .= " title=\"$title\""; |
|
650 | - } |
|
623 | + $link_text = $this->runSpanGamut($link_text); |
|
624 | + $result .= ">$link_text</a>"; |
|
625 | + $result = $this->hashPart($result); |
|
626 | + } |
|
627 | + else { |
|
628 | + $result = $whole_match; |
|
629 | + } |
|
630 | + return $result; |
|
631 | + } |
|
632 | + protected function _doAnchors_inline_callback($matches) { |
|
633 | + $whole_match = $matches[1]; |
|
634 | + $link_text = $this->runSpanGamut($matches[2]); |
|
635 | + $url = $matches[3] == '' ? $matches[4] : $matches[3]; |
|
636 | + $title =& $matches[7]; |
|
637 | + |
|
638 | + // if the URL was of the form <s p a c e s> it got caught by the HTML |
|
639 | + // tag parser and hashed. Need to reverse the process before using the URL. |
|
640 | + $unhashed = $this->unhash($url); |
|
641 | + if ($unhashed != $url) |
|
642 | + $url = preg_replace('/^<(.*)>$/', '\1', $unhashed); |
|
643 | + |
|
644 | + $url = $this->encodeURLAttribute($url); |
|
645 | + |
|
646 | + $result = "<a href=\"$url\""; |
|
647 | + if (isset($title)) { |
|
648 | + $title = $this->encodeAttribute($title); |
|
649 | + $result .= " title=\"$title\""; |
|
650 | + } |
|
651 | 651 | |
652 | - $link_text = $this->runSpanGamut($link_text); |
|
653 | - $result .= ">$link_text</a>"; |
|
652 | + $link_text = $this->runSpanGamut($link_text); |
|
653 | + $result .= ">$link_text</a>"; |
|
654 | 654 | |
655 | - return $this->hashPart($result); |
|
656 | - } |
|
655 | + return $this->hashPart($result); |
|
656 | + } |
|
657 | 657 | |
658 | 658 | |
659 | - protected function doImages($text) { |
|
660 | - # |
|
661 | - # Turn Markdown image shortcuts into <img> tags. |
|
662 | - # |
|
663 | - # |
|
664 | - # First, handle reference-style labeled images: ![alt text][id] |
|
665 | - # |
|
666 | - $text = preg_replace_callback('{ |
|
659 | + protected function doImages($text) { |
|
660 | + # |
|
661 | + # Turn Markdown image shortcuts into <img> tags. |
|
662 | + # |
|
663 | + # |
|
664 | + # First, handle reference-style labeled images: ![alt text][id] |
|
665 | + # |
|
666 | + $text = preg_replace_callback('{ |
|
667 | 667 | ( # wrap whole match in $1 |
668 | 668 | !\[ |
669 | 669 | ('.$this->nested_brackets_re.') # alt text = $2 |
@@ -678,13 +678,13 @@ discard block |
||
678 | 678 | |
679 | 679 | ) |
680 | 680 | }xs', |
681 | - array($this, '_doImages_reference_callback'), $text); |
|
681 | + array($this, '_doImages_reference_callback'), $text); |
|
682 | 682 | |
683 | - # |
|
684 | - # Next, handle inline images:  |
|
685 | - # Don't forget: encode * and _ |
|
686 | - # |
|
687 | - $text = preg_replace_callback('{ |
|
683 | + # |
|
684 | + # Next, handle inline images:  |
|
685 | + # Don't forget: encode * and _ |
|
686 | + # |
|
687 | + $text = preg_replace_callback('{ |
|
688 | 688 | ( # wrap whole match in $1 |
689 | 689 | !\[ |
690 | 690 | ('.$this->nested_brackets_re.') # alt text = $2 |
@@ -707,76 +707,76 @@ discard block |
||
707 | 707 | \) |
708 | 708 | ) |
709 | 709 | }xs', |
710 | - array($this, '_doImages_inline_callback'), $text); |
|
711 | - |
|
712 | - return $text; |
|
713 | - } |
|
714 | - protected function _doImages_reference_callback($matches) { |
|
715 | - $whole_match = $matches[1]; |
|
716 | - $alt_text = $matches[2]; |
|
717 | - $link_id = strtolower($matches[3]); |
|
718 | - |
|
719 | - if ($link_id == "") { |
|
720 | - $link_id = strtolower($alt_text); # for shortcut links like ![this][]. |
|
721 | - } |
|
722 | - |
|
723 | - $alt_text = $this->encodeAttribute($alt_text); |
|
724 | - if (isset($this->urls[$link_id])) { |
|
725 | - $url = $this->encodeURLAttribute($this->urls[$link_id]); |
|
726 | - $result = "<img src=\"$url\" alt=\"$alt_text\""; |
|
727 | - if (isset($this->titles[$link_id])) { |
|
728 | - $title = $this->titles[$link_id]; |
|
729 | - $title = $this->encodeAttribute($title); |
|
730 | - $result .= " title=\"$title\""; |
|
731 | - } |
|
732 | - $result .= $this->empty_element_suffix; |
|
733 | - $result = $this->hashPart($result); |
|
734 | - } |
|
735 | - else { |
|
736 | - # If there's no such link ID, leave intact: |
|
737 | - $result = $whole_match; |
|
738 | - } |
|
739 | - |
|
740 | - return $result; |
|
741 | - } |
|
742 | - protected function _doImages_inline_callback($matches) { |
|
743 | - $whole_match = $matches[1]; |
|
744 | - $alt_text = $matches[2]; |
|
745 | - $url = $matches[3] == '' ? $matches[4] : $matches[3]; |
|
746 | - $title =& $matches[7]; |
|
747 | - |
|
748 | - $alt_text = $this->encodeAttribute($alt_text); |
|
749 | - $url = $this->encodeURLAttribute($url); |
|
750 | - $result = "<img src=\"$url\" alt=\"$alt_text\""; |
|
751 | - if (isset($title)) { |
|
752 | - $title = $this->encodeAttribute($title); |
|
753 | - $result .= " title=\"$title\""; # $title already quoted |
|
754 | - } |
|
755 | - $result .= $this->empty_element_suffix; |
|
756 | - |
|
757 | - return $this->hashPart($result); |
|
758 | - } |
|
759 | - |
|
760 | - |
|
761 | - protected function doHeaders($text) { |
|
762 | - # Setext-style headers: |
|
763 | - # Header 1 |
|
764 | - # ======== |
|
765 | - # |
|
766 | - # Header 2 |
|
767 | - # -------- |
|
768 | - # |
|
769 | - $text = preg_replace_callback('{ ^(.+?)[ ]*\n(=+|-+)[ ]*\n+ }mx', |
|
770 | - array($this, '_doHeaders_callback_setext'), $text); |
|
771 | - |
|
772 | - # atx-style headers: |
|
773 | - # # Header 1 |
|
774 | - # ## Header 2 |
|
775 | - # ## Header 2 with closing hashes ## |
|
776 | - # ... |
|
777 | - # ###### Header 6 |
|
778 | - # |
|
779 | - $text = preg_replace_callback('{ |
|
710 | + array($this, '_doImages_inline_callback'), $text); |
|
711 | + |
|
712 | + return $text; |
|
713 | + } |
|
714 | + protected function _doImages_reference_callback($matches) { |
|
715 | + $whole_match = $matches[1]; |
|
716 | + $alt_text = $matches[2]; |
|
717 | + $link_id = strtolower($matches[3]); |
|
718 | + |
|
719 | + if ($link_id == "") { |
|
720 | + $link_id = strtolower($alt_text); # for shortcut links like ![this][]. |
|
721 | + } |
|
722 | + |
|
723 | + $alt_text = $this->encodeAttribute($alt_text); |
|
724 | + if (isset($this->urls[$link_id])) { |
|
725 | + $url = $this->encodeURLAttribute($this->urls[$link_id]); |
|
726 | + $result = "<img src=\"$url\" alt=\"$alt_text\""; |
|
727 | + if (isset($this->titles[$link_id])) { |
|
728 | + $title = $this->titles[$link_id]; |
|
729 | + $title = $this->encodeAttribute($title); |
|
730 | + $result .= " title=\"$title\""; |
|
731 | + } |
|
732 | + $result .= $this->empty_element_suffix; |
|
733 | + $result = $this->hashPart($result); |
|
734 | + } |
|
735 | + else { |
|
736 | + # If there's no such link ID, leave intact: |
|
737 | + $result = $whole_match; |
|
738 | + } |
|
739 | + |
|
740 | + return $result; |
|
741 | + } |
|
742 | + protected function _doImages_inline_callback($matches) { |
|
743 | + $whole_match = $matches[1]; |
|
744 | + $alt_text = $matches[2]; |
|
745 | + $url = $matches[3] == '' ? $matches[4] : $matches[3]; |
|
746 | + $title =& $matches[7]; |
|
747 | + |
|
748 | + $alt_text = $this->encodeAttribute($alt_text); |
|
749 | + $url = $this->encodeURLAttribute($url); |
|
750 | + $result = "<img src=\"$url\" alt=\"$alt_text\""; |
|
751 | + if (isset($title)) { |
|
752 | + $title = $this->encodeAttribute($title); |
|
753 | + $result .= " title=\"$title\""; # $title already quoted |
|
754 | + } |
|
755 | + $result .= $this->empty_element_suffix; |
|
756 | + |
|
757 | + return $this->hashPart($result); |
|
758 | + } |
|
759 | + |
|
760 | + |
|
761 | + protected function doHeaders($text) { |
|
762 | + # Setext-style headers: |
|
763 | + # Header 1 |
|
764 | + # ======== |
|
765 | + # |
|
766 | + # Header 2 |
|
767 | + # -------- |
|
768 | + # |
|
769 | + $text = preg_replace_callback('{ ^(.+?)[ ]*\n(=+|-+)[ ]*\n+ }mx', |
|
770 | + array($this, '_doHeaders_callback_setext'), $text); |
|
771 | + |
|
772 | + # atx-style headers: |
|
773 | + # # Header 1 |
|
774 | + # ## Header 2 |
|
775 | + # ## Header 2 with closing hashes ## |
|
776 | + # ... |
|
777 | + # ###### Header 6 |
|
778 | + # |
|
779 | + $text = preg_replace_callback('{ |
|
780 | 780 | ^(\#{1,6}) # $1 = string of #\'s |
781 | 781 | [ ]* |
782 | 782 | (.+?) # $2 = Header text |
@@ -784,69 +784,69 @@ discard block |
||
784 | 784 | \#* # optional closing #\'s (not counted) |
785 | 785 | \n+ |
786 | 786 | }xm', |
787 | - array($this, '_doHeaders_callback_atx'), $text); |
|
787 | + array($this, '_doHeaders_callback_atx'), $text); |
|
788 | 788 | |
789 | - return $text; |
|
790 | - } |
|
789 | + return $text; |
|
790 | + } |
|
791 | 791 | |
792 | - protected function _doHeaders_callback_setext($matches) { |
|
793 | - # Terrible hack to check we haven't found an empty list item. |
|
794 | - if ($matches[2] == '-' && preg_match('{^-(?: |$)}', $matches[1])) |
|
795 | - return $matches[0]; |
|
792 | + protected function _doHeaders_callback_setext($matches) { |
|
793 | + # Terrible hack to check we haven't found an empty list item. |
|
794 | + if ($matches[2] == '-' && preg_match('{^-(?: |$)}', $matches[1])) |
|
795 | + return $matches[0]; |
|
796 | 796 | |
797 | - $level = $matches[2]{0} == '=' ? 1 : 2; |
|
798 | - |
|
799 | - # id attribute generation |
|
800 | - $idAtt = $this->_generateIdFromHeaderValue($matches[1]); |
|
801 | - |
|
802 | - $block = "<h$level$idAtt>".$this->runSpanGamut($matches[1])."</h$level>"; |
|
803 | - return "\n" . $this->hashBlock($block) . "\n\n"; |
|
804 | - } |
|
805 | - protected function _doHeaders_callback_atx($matches) { |
|
806 | - |
|
807 | - # id attribute generation |
|
808 | - $idAtt = $this->_generateIdFromHeaderValue($matches[2]); |
|
809 | - |
|
810 | - $level = strlen($matches[1]); |
|
811 | - $block = "<h$level$idAtt>".$this->runSpanGamut($matches[2])."</h$level>"; |
|
812 | - return "\n" . $this->hashBlock($block) . "\n\n"; |
|
813 | - } |
|
814 | - |
|
815 | - protected function _generateIdFromHeaderValue($headerValue) { |
|
816 | - |
|
817 | - # if a header_id_func property is set, we can use it to automatically |
|
818 | - # generate an id attribute. |
|
819 | - # |
|
820 | - # This method returns a string in the form id="foo", or an empty string |
|
821 | - # otherwise. |
|
822 | - if (!is_callable($this->header_id_func)) { |
|
823 | - return ""; |
|
824 | - } |
|
825 | - $idValue = call_user_func($this->header_id_func, $headerValue); |
|
826 | - if (!$idValue) return ""; |
|
827 | - |
|
828 | - return ' id="' . $this->encodeAttribute($idValue) . '"'; |
|
829 | - |
|
830 | - } |
|
831 | - |
|
832 | - protected function doLists($text) { |
|
833 | - # |
|
834 | - # Form HTML ordered (numbered) and unordered (bulleted) lists. |
|
835 | - # |
|
836 | - $less_than_tab = $this->tab_width - 1; |
|
837 | - |
|
838 | - # Re-usable patterns to match list item bullets and number markers: |
|
839 | - $marker_ul_re = '[*+-]'; |
|
840 | - $marker_ol_re = '\d+[\.]'; |
|
841 | - |
|
842 | - $markers_relist = array( |
|
843 | - $marker_ul_re => $marker_ol_re, |
|
844 | - $marker_ol_re => $marker_ul_re, |
|
845 | - ); |
|
846 | - |
|
847 | - foreach ($markers_relist as $marker_re => $other_marker_re) { |
|
848 | - # Re-usable pattern to match any entirel ul or ol list: |
|
849 | - $whole_list_re = ' |
|
797 | + $level = $matches[2]{0} == '=' ? 1 : 2; |
|
798 | + |
|
799 | + # id attribute generation |
|
800 | + $idAtt = $this->_generateIdFromHeaderValue($matches[1]); |
|
801 | + |
|
802 | + $block = "<h$level$idAtt>".$this->runSpanGamut($matches[1])."</h$level>"; |
|
803 | + return "\n" . $this->hashBlock($block) . "\n\n"; |
|
804 | + } |
|
805 | + protected function _doHeaders_callback_atx($matches) { |
|
806 | + |
|
807 | + # id attribute generation |
|
808 | + $idAtt = $this->_generateIdFromHeaderValue($matches[2]); |
|
809 | + |
|
810 | + $level = strlen($matches[1]); |
|
811 | + $block = "<h$level$idAtt>".$this->runSpanGamut($matches[2])."</h$level>"; |
|
812 | + return "\n" . $this->hashBlock($block) . "\n\n"; |
|
813 | + } |
|
814 | + |
|
815 | + protected function _generateIdFromHeaderValue($headerValue) { |
|
816 | + |
|
817 | + # if a header_id_func property is set, we can use it to automatically |
|
818 | + # generate an id attribute. |
|
819 | + # |
|
820 | + # This method returns a string in the form id="foo", or an empty string |
|
821 | + # otherwise. |
|
822 | + if (!is_callable($this->header_id_func)) { |
|
823 | + return ""; |
|
824 | + } |
|
825 | + $idValue = call_user_func($this->header_id_func, $headerValue); |
|
826 | + if (!$idValue) return ""; |
|
827 | + |
|
828 | + return ' id="' . $this->encodeAttribute($idValue) . '"'; |
|
829 | + |
|
830 | + } |
|
831 | + |
|
832 | + protected function doLists($text) { |
|
833 | + # |
|
834 | + # Form HTML ordered (numbered) and unordered (bulleted) lists. |
|
835 | + # |
|
836 | + $less_than_tab = $this->tab_width - 1; |
|
837 | + |
|
838 | + # Re-usable patterns to match list item bullets and number markers: |
|
839 | + $marker_ul_re = '[*+-]'; |
|
840 | + $marker_ol_re = '\d+[\.]'; |
|
841 | + |
|
842 | + $markers_relist = array( |
|
843 | + $marker_ul_re => $marker_ol_re, |
|
844 | + $marker_ol_re => $marker_ul_re, |
|
845 | + ); |
|
846 | + |
|
847 | + foreach ($markers_relist as $marker_re => $other_marker_re) { |
|
848 | + # Re-usable pattern to match any entirel ul or ol list: |
|
849 | + $whole_list_re = ' |
|
850 | 850 | ( # $1 = whole list |
851 | 851 | ( # $2 |
852 | 852 | ([ ]{0,'.$less_than_tab.'}) # $3 = number of spaces |
@@ -873,96 +873,96 @@ discard block |
||
873 | 873 | ) |
874 | 874 | '; // mx |
875 | 875 | |
876 | - # We use a different prefix before nested lists than top-level lists. |
|
877 | - # See extended comment in _ProcessListItems(). |
|
876 | + # We use a different prefix before nested lists than top-level lists. |
|
877 | + # See extended comment in _ProcessListItems(). |
|
878 | 878 | |
879 | - if ($this->list_level) { |
|
880 | - $text = preg_replace_callback('{ |
|
879 | + if ($this->list_level) { |
|
880 | + $text = preg_replace_callback('{ |
|
881 | 881 | ^ |
882 | 882 | '.$whole_list_re.' |
883 | 883 | }mx', |
884 | - array($this, '_doLists_callback'), $text); |
|
885 | - } |
|
886 | - else { |
|
887 | - $text = preg_replace_callback('{ |
|
884 | + array($this, '_doLists_callback'), $text); |
|
885 | + } |
|
886 | + else { |
|
887 | + $text = preg_replace_callback('{ |
|
888 | 888 | (?:(?<=\n)\n|\A\n?) # Must eat the newline |
889 | 889 | '.$whole_list_re.' |
890 | 890 | }mx', |
891 | - array($this, '_doLists_callback'), $text); |
|
892 | - } |
|
893 | - } |
|
894 | - |
|
895 | - return $text; |
|
896 | - } |
|
897 | - protected function _doLists_callback($matches) { |
|
898 | - # Re-usable patterns to match list item bullets and number markers: |
|
899 | - $marker_ul_re = '[*+-]'; |
|
900 | - $marker_ol_re = '\d+[\.]'; |
|
901 | - $marker_any_re = "(?:$marker_ul_re|$marker_ol_re)"; |
|
902 | - $marker_ol_start_re = '[0-9]+'; |
|
903 | - |
|
904 | - $list = $matches[1]; |
|
905 | - $list_type = preg_match("/$marker_ul_re/", $matches[4]) ? "ul" : "ol"; |
|
906 | - |
|
907 | - $marker_any_re = ( $list_type == "ul" ? $marker_ul_re : $marker_ol_re ); |
|
908 | - |
|
909 | - $list .= "\n"; |
|
910 | - $result = $this->processListItems($list, $marker_any_re); |
|
911 | - |
|
912 | - $ol_start = 1; |
|
913 | - if ($this->enhanced_ordered_list) { |
|
914 | - # Get the start number for ordered list. |
|
915 | - if ($list_type == 'ol') { |
|
916 | - $ol_start_array = array(); |
|
917 | - $ol_start_check = preg_match("/$marker_ol_start_re/", $matches[4], $ol_start_array); |
|
918 | - if ($ol_start_check){ |
|
919 | - $ol_start = $ol_start_array[0]; |
|
920 | - } |
|
921 | - } |
|
922 | - } |
|
923 | - |
|
924 | - if ($ol_start > 1 && $list_type == 'ol'){ |
|
925 | - $result = $this->hashBlock("<$list_type start=\"$ol_start\">\n" . $result . "</$list_type>"); |
|
926 | - } else { |
|
927 | - $result = $this->hashBlock("<$list_type>\n" . $result . "</$list_type>"); |
|
928 | - } |
|
929 | - return "\n". $result ."\n\n"; |
|
930 | - } |
|
931 | - |
|
932 | - protected $list_level = 0; |
|
933 | - |
|
934 | - protected function processListItems($list_str, $marker_any_re) { |
|
935 | - # |
|
936 | - # Process the contents of a single ordered or unordered list, splitting it |
|
937 | - # into individual list items. |
|
938 | - # |
|
939 | - # The $this->list_level global keeps track of when we're inside a list. |
|
940 | - # Each time we enter a list, we increment it; when we leave a list, |
|
941 | - # we decrement. If it's zero, we're not in a list anymore. |
|
942 | - # |
|
943 | - # We do this because when we're not inside a list, we want to treat |
|
944 | - # something like this: |
|
945 | - # |
|
946 | - # I recommend upgrading to version |
|
947 | - # 8. Oops, now this line is treated |
|
948 | - # as a sub-list. |
|
949 | - # |
|
950 | - # As a single paragraph, despite the fact that the second line starts |
|
951 | - # with a digit-period-space sequence. |
|
952 | - # |
|
953 | - # Whereas when we're inside a list (or sub-list), that line will be |
|
954 | - # treated as the start of a sub-list. What a kludge, huh? This is |
|
955 | - # an aspect of Markdown's syntax that's hard to parse perfectly |
|
956 | - # without resorting to mind-reading. Perhaps the solution is to |
|
957 | - # change the syntax rules such that sub-lists must start with a |
|
958 | - # starting cardinal number; e.g. "1." or "a.". |
|
891 | + array($this, '_doLists_callback'), $text); |
|
892 | + } |
|
893 | + } |
|
894 | + |
|
895 | + return $text; |
|
896 | + } |
|
897 | + protected function _doLists_callback($matches) { |
|
898 | + # Re-usable patterns to match list item bullets and number markers: |
|
899 | + $marker_ul_re = '[*+-]'; |
|
900 | + $marker_ol_re = '\d+[\.]'; |
|
901 | + $marker_any_re = "(?:$marker_ul_re|$marker_ol_re)"; |
|
902 | + $marker_ol_start_re = '[0-9]+'; |
|
903 | + |
|
904 | + $list = $matches[1]; |
|
905 | + $list_type = preg_match("/$marker_ul_re/", $matches[4]) ? "ul" : "ol"; |
|
906 | + |
|
907 | + $marker_any_re = ( $list_type == "ul" ? $marker_ul_re : $marker_ol_re ); |
|
908 | + |
|
909 | + $list .= "\n"; |
|
910 | + $result = $this->processListItems($list, $marker_any_re); |
|
911 | + |
|
912 | + $ol_start = 1; |
|
913 | + if ($this->enhanced_ordered_list) { |
|
914 | + # Get the start number for ordered list. |
|
915 | + if ($list_type == 'ol') { |
|
916 | + $ol_start_array = array(); |
|
917 | + $ol_start_check = preg_match("/$marker_ol_start_re/", $matches[4], $ol_start_array); |
|
918 | + if ($ol_start_check){ |
|
919 | + $ol_start = $ol_start_array[0]; |
|
920 | + } |
|
921 | + } |
|
922 | + } |
|
923 | + |
|
924 | + if ($ol_start > 1 && $list_type == 'ol'){ |
|
925 | + $result = $this->hashBlock("<$list_type start=\"$ol_start\">\n" . $result . "</$list_type>"); |
|
926 | + } else { |
|
927 | + $result = $this->hashBlock("<$list_type>\n" . $result . "</$list_type>"); |
|
928 | + } |
|
929 | + return "\n". $result ."\n\n"; |
|
930 | + } |
|
931 | + |
|
932 | + protected $list_level = 0; |
|
933 | + |
|
934 | + protected function processListItems($list_str, $marker_any_re) { |
|
935 | + # |
|
936 | + # Process the contents of a single ordered or unordered list, splitting it |
|
937 | + # into individual list items. |
|
938 | + # |
|
939 | + # The $this->list_level global keeps track of when we're inside a list. |
|
940 | + # Each time we enter a list, we increment it; when we leave a list, |
|
941 | + # we decrement. If it's zero, we're not in a list anymore. |
|
942 | + # |
|
943 | + # We do this because when we're not inside a list, we want to treat |
|
944 | + # something like this: |
|
945 | + # |
|
946 | + # I recommend upgrading to version |
|
947 | + # 8. Oops, now this line is treated |
|
948 | + # as a sub-list. |
|
949 | + # |
|
950 | + # As a single paragraph, despite the fact that the second line starts |
|
951 | + # with a digit-period-space sequence. |
|
952 | + # |
|
953 | + # Whereas when we're inside a list (or sub-list), that line will be |
|
954 | + # treated as the start of a sub-list. What a kludge, huh? This is |
|
955 | + # an aspect of Markdown's syntax that's hard to parse perfectly |
|
956 | + # without resorting to mind-reading. Perhaps the solution is to |
|
957 | + # change the syntax rules such that sub-lists must start with a |
|
958 | + # starting cardinal number; e.g. "1." or "a.". |
|
959 | 959 | |
960 | - $this->list_level++; |
|
960 | + $this->list_level++; |
|
961 | 961 | |
962 | - # trim trailing blank lines: |
|
963 | - $list_str = preg_replace("/\n{2,}\\z/", "\n", $list_str); |
|
962 | + # trim trailing blank lines: |
|
963 | + $list_str = preg_replace("/\n{2,}\\z/", "\n", $list_str); |
|
964 | 964 | |
965 | - $list_str = preg_replace_callback('{ |
|
965 | + $list_str = preg_replace_callback('{ |
|
966 | 966 | (\n)? # leading line = $1 |
967 | 967 | (^[ ]*) # leading whitespace = $2 |
968 | 968 | ('.$marker_any_re.' # list marker and space = $3 |
@@ -972,41 +972,41 @@ discard block |
||
972 | 972 | (?:(\n+(?=\n))|\n) # tailing blank line = $5 |
973 | 973 | (?= \n* (\z | \2 ('.$marker_any_re.') (?:[ ]+|(?=\n)))) |
974 | 974 | }xm', |
975 | - array($this, '_processListItems_callback'), $list_str); |
|
976 | - |
|
977 | - $this->list_level--; |
|
978 | - return $list_str; |
|
979 | - } |
|
980 | - protected function _processListItems_callback($matches) { |
|
981 | - $item = $matches[4]; |
|
982 | - $leading_line =& $matches[1]; |
|
983 | - $leading_space =& $matches[2]; |
|
984 | - $marker_space = $matches[3]; |
|
985 | - $tailing_blank_line =& $matches[5]; |
|
986 | - |
|
987 | - if ($leading_line || $tailing_blank_line || |
|
988 | - preg_match('/\n{2,}/', $item)) |
|
989 | - { |
|
990 | - # Replace marker with the appropriate whitespace indentation |
|
991 | - $item = $leading_space . str_repeat(' ', strlen($marker_space)) . $item; |
|
992 | - $item = $this->runBlockGamut($this->outdent($item)."\n"); |
|
993 | - } |
|
994 | - else { |
|
995 | - # Recursion for sub-lists: |
|
996 | - $item = $this->doLists($this->outdent($item)); |
|
997 | - $item = preg_replace('/\n+$/', '', $item); |
|
998 | - $item = $this->runSpanGamut($item); |
|
999 | - } |
|
1000 | - |
|
1001 | - return "<li>" . $item . "</li>\n"; |
|
1002 | - } |
|
1003 | - |
|
1004 | - |
|
1005 | - protected function doCodeBlocks($text) { |
|
1006 | - # |
|
1007 | - # Process Markdown `<pre><code>` blocks. |
|
1008 | - # |
|
1009 | - $text = preg_replace_callback('{ |
|
975 | + array($this, '_processListItems_callback'), $list_str); |
|
976 | + |
|
977 | + $this->list_level--; |
|
978 | + return $list_str; |
|
979 | + } |
|
980 | + protected function _processListItems_callback($matches) { |
|
981 | + $item = $matches[4]; |
|
982 | + $leading_line =& $matches[1]; |
|
983 | + $leading_space =& $matches[2]; |
|
984 | + $marker_space = $matches[3]; |
|
985 | + $tailing_blank_line =& $matches[5]; |
|
986 | + |
|
987 | + if ($leading_line || $tailing_blank_line || |
|
988 | + preg_match('/\n{2,}/', $item)) |
|
989 | + { |
|
990 | + # Replace marker with the appropriate whitespace indentation |
|
991 | + $item = $leading_space . str_repeat(' ', strlen($marker_space)) . $item; |
|
992 | + $item = $this->runBlockGamut($this->outdent($item)."\n"); |
|
993 | + } |
|
994 | + else { |
|
995 | + # Recursion for sub-lists: |
|
996 | + $item = $this->doLists($this->outdent($item)); |
|
997 | + $item = preg_replace('/\n+$/', '', $item); |
|
998 | + $item = $this->runSpanGamut($item); |
|
999 | + } |
|
1000 | + |
|
1001 | + return "<li>" . $item . "</li>\n"; |
|
1002 | + } |
|
1003 | + |
|
1004 | + |
|
1005 | + protected function doCodeBlocks($text) { |
|
1006 | + # |
|
1007 | + # Process Markdown `<pre><code>` blocks. |
|
1008 | + # |
|
1009 | + $text = preg_replace_callback('{ |
|
1010 | 1010 | (?:\n\n|\A\n?) |
1011 | 1011 | ( # $1 = the code block -- one or more lines, starting with a space/tab |
1012 | 1012 | (?> |
@@ -1016,197 +1016,197 @@ discard block |
||
1016 | 1016 | ) |
1017 | 1017 | ((?=^[ ]{0,'.$this->tab_width.'}\S)|\Z) # Lookahead for non-space at line-start, or end of doc |
1018 | 1018 | }xm', |
1019 | - array($this, '_doCodeBlocks_callback'), $text); |
|
1020 | - |
|
1021 | - return $text; |
|
1022 | - } |
|
1023 | - protected function _doCodeBlocks_callback($matches) { |
|
1024 | - $codeblock = $matches[1]; |
|
1025 | - |
|
1026 | - $codeblock = $this->outdent($codeblock); |
|
1027 | - $codeblock = htmlspecialchars($codeblock, ENT_NOQUOTES); |
|
1028 | - |
|
1029 | - # trim leading newlines and trailing newlines |
|
1030 | - $codeblock = preg_replace('/\A\n+|\n+\z/', '', $codeblock); |
|
1031 | - |
|
1032 | - $codeblock = "<pre><code>$codeblock\n</code></pre>"; |
|
1033 | - return "\n\n".$this->hashBlock($codeblock)."\n\n"; |
|
1034 | - } |
|
1035 | - |
|
1036 | - |
|
1037 | - protected function makeCodeSpan($code) { |
|
1038 | - # |
|
1039 | - # Create a code span markup for $code. Called from handleSpanToken. |
|
1040 | - # |
|
1041 | - $code = htmlspecialchars(trim($code), ENT_NOQUOTES); |
|
1042 | - return $this->hashPart("<code>$code</code>"); |
|
1043 | - } |
|
1044 | - |
|
1045 | - |
|
1046 | - protected $em_relist = array( |
|
1047 | - '' => '(?:(?<!\*)\*(?!\*)|(?<!_)_(?!_))(?![\.,:;]?\s)', |
|
1048 | - '*' => '(?<![\s*])\*(?!\*)', |
|
1049 | - '_' => '(?<![\s_])_(?!_)', |
|
1050 | - ); |
|
1051 | - protected $strong_relist = array( |
|
1052 | - '' => '(?:(?<!\*)\*\*(?!\*)|(?<!_)__(?!_))(?![\.,:;]?\s)', |
|
1053 | - '**' => '(?<![\s*])\*\*(?!\*)', |
|
1054 | - '__' => '(?<![\s_])__(?!_)', |
|
1055 | - ); |
|
1056 | - protected $em_strong_relist = array( |
|
1057 | - '' => '(?:(?<!\*)\*\*\*(?!\*)|(?<!_)___(?!_))(?![\.,:;]?\s)', |
|
1058 | - '***' => '(?<![\s*])\*\*\*(?!\*)', |
|
1059 | - '___' => '(?<![\s_])___(?!_)', |
|
1060 | - ); |
|
1061 | - protected $em_strong_prepared_relist; |
|
1019 | + array($this, '_doCodeBlocks_callback'), $text); |
|
1020 | + |
|
1021 | + return $text; |
|
1022 | + } |
|
1023 | + protected function _doCodeBlocks_callback($matches) { |
|
1024 | + $codeblock = $matches[1]; |
|
1025 | + |
|
1026 | + $codeblock = $this->outdent($codeblock); |
|
1027 | + $codeblock = htmlspecialchars($codeblock, ENT_NOQUOTES); |
|
1028 | + |
|
1029 | + # trim leading newlines and trailing newlines |
|
1030 | + $codeblock = preg_replace('/\A\n+|\n+\z/', '', $codeblock); |
|
1031 | + |
|
1032 | + $codeblock = "<pre><code>$codeblock\n</code></pre>"; |
|
1033 | + return "\n\n".$this->hashBlock($codeblock)."\n\n"; |
|
1034 | + } |
|
1035 | + |
|
1036 | + |
|
1037 | + protected function makeCodeSpan($code) { |
|
1038 | + # |
|
1039 | + # Create a code span markup for $code. Called from handleSpanToken. |
|
1040 | + # |
|
1041 | + $code = htmlspecialchars(trim($code), ENT_NOQUOTES); |
|
1042 | + return $this->hashPart("<code>$code</code>"); |
|
1043 | + } |
|
1044 | + |
|
1045 | + |
|
1046 | + protected $em_relist = array( |
|
1047 | + '' => '(?:(?<!\*)\*(?!\*)|(?<!_)_(?!_))(?![\.,:;]?\s)', |
|
1048 | + '*' => '(?<![\s*])\*(?!\*)', |
|
1049 | + '_' => '(?<![\s_])_(?!_)', |
|
1050 | + ); |
|
1051 | + protected $strong_relist = array( |
|
1052 | + '' => '(?:(?<!\*)\*\*(?!\*)|(?<!_)__(?!_))(?![\.,:;]?\s)', |
|
1053 | + '**' => '(?<![\s*])\*\*(?!\*)', |
|
1054 | + '__' => '(?<![\s_])__(?!_)', |
|
1055 | + ); |
|
1056 | + protected $em_strong_relist = array( |
|
1057 | + '' => '(?:(?<!\*)\*\*\*(?!\*)|(?<!_)___(?!_))(?![\.,:;]?\s)', |
|
1058 | + '***' => '(?<![\s*])\*\*\*(?!\*)', |
|
1059 | + '___' => '(?<![\s_])___(?!_)', |
|
1060 | + ); |
|
1061 | + protected $em_strong_prepared_relist; |
|
1062 | 1062 | |
1063 | - protected function prepareItalicsAndBold() { |
|
1064 | - # |
|
1065 | - # Prepare regular expressions for searching emphasis tokens in any |
|
1066 | - # context. |
|
1067 | - # |
|
1068 | - foreach ($this->em_relist as $em => $em_re) { |
|
1069 | - foreach ($this->strong_relist as $strong => $strong_re) { |
|
1070 | - # Construct list of allowed token expressions. |
|
1071 | - $token_relist = array(); |
|
1072 | - if (isset($this->em_strong_relist["$em$strong"])) { |
|
1073 | - $token_relist[] = $this->em_strong_relist["$em$strong"]; |
|
1074 | - } |
|
1075 | - $token_relist[] = $em_re; |
|
1076 | - $token_relist[] = $strong_re; |
|
1063 | + protected function prepareItalicsAndBold() { |
|
1064 | + # |
|
1065 | + # Prepare regular expressions for searching emphasis tokens in any |
|
1066 | + # context. |
|
1067 | + # |
|
1068 | + foreach ($this->em_relist as $em => $em_re) { |
|
1069 | + foreach ($this->strong_relist as $strong => $strong_re) { |
|
1070 | + # Construct list of allowed token expressions. |
|
1071 | + $token_relist = array(); |
|
1072 | + if (isset($this->em_strong_relist["$em$strong"])) { |
|
1073 | + $token_relist[] = $this->em_strong_relist["$em$strong"]; |
|
1074 | + } |
|
1075 | + $token_relist[] = $em_re; |
|
1076 | + $token_relist[] = $strong_re; |
|
1077 | 1077 | |
1078 | - # Construct master expression from list. |
|
1079 | - $token_re = '{('. implode('|', $token_relist) .')}'; |
|
1080 | - $this->em_strong_prepared_relist["$em$strong"] = $token_re; |
|
1081 | - } |
|
1082 | - } |
|
1083 | - } |
|
1078 | + # Construct master expression from list. |
|
1079 | + $token_re = '{('. implode('|', $token_relist) .')}'; |
|
1080 | + $this->em_strong_prepared_relist["$em$strong"] = $token_re; |
|
1081 | + } |
|
1082 | + } |
|
1083 | + } |
|
1084 | 1084 | |
1085 | - protected function doItalicsAndBold($text) { |
|
1086 | - $token_stack = array(''); |
|
1087 | - $text_stack = array(''); |
|
1088 | - $em = ''; |
|
1089 | - $strong = ''; |
|
1090 | - $tree_char_em = false; |
|
1085 | + protected function doItalicsAndBold($text) { |
|
1086 | + $token_stack = array(''); |
|
1087 | + $text_stack = array(''); |
|
1088 | + $em = ''; |
|
1089 | + $strong = ''; |
|
1090 | + $tree_char_em = false; |
|
1091 | 1091 | |
1092 | - while (1) { |
|
1093 | - # |
|
1094 | - # Get prepared regular expression for seraching emphasis tokens |
|
1095 | - # in current context. |
|
1096 | - # |
|
1097 | - $token_re = $this->em_strong_prepared_relist["$em$strong"]; |
|
1092 | + while (1) { |
|
1093 | + # |
|
1094 | + # Get prepared regular expression for seraching emphasis tokens |
|
1095 | + # in current context. |
|
1096 | + # |
|
1097 | + $token_re = $this->em_strong_prepared_relist["$em$strong"]; |
|
1098 | 1098 | |
1099 | - # |
|
1100 | - # Each loop iteration search for the next emphasis token. |
|
1101 | - # Each token is then passed to handleSpanToken. |
|
1102 | - # |
|
1103 | - $parts = preg_split($token_re, $text, 2, PREG_SPLIT_DELIM_CAPTURE); |
|
1104 | - $text_stack[0] .= $parts[0]; |
|
1105 | - $token =& $parts[1]; |
|
1106 | - $text =& $parts[2]; |
|
1099 | + # |
|
1100 | + # Each loop iteration search for the next emphasis token. |
|
1101 | + # Each token is then passed to handleSpanToken. |
|
1102 | + # |
|
1103 | + $parts = preg_split($token_re, $text, 2, PREG_SPLIT_DELIM_CAPTURE); |
|
1104 | + $text_stack[0] .= $parts[0]; |
|
1105 | + $token =& $parts[1]; |
|
1106 | + $text =& $parts[2]; |
|
1107 | 1107 | |
1108 | - if (empty($token)) { |
|
1109 | - # Reached end of text span: empty stack without emitting. |
|
1110 | - # any more emphasis. |
|
1111 | - while ($token_stack[0]) { |
|
1112 | - $text_stack[1] .= array_shift($token_stack); |
|
1113 | - $text_stack[0] .= array_shift($text_stack); |
|
1114 | - } |
|
1115 | - break; |
|
1116 | - } |
|
1108 | + if (empty($token)) { |
|
1109 | + # Reached end of text span: empty stack without emitting. |
|
1110 | + # any more emphasis. |
|
1111 | + while ($token_stack[0]) { |
|
1112 | + $text_stack[1] .= array_shift($token_stack); |
|
1113 | + $text_stack[0] .= array_shift($text_stack); |
|
1114 | + } |
|
1115 | + break; |
|
1116 | + } |
|
1117 | 1117 | |
1118 | - $token_len = strlen($token); |
|
1119 | - if ($tree_char_em) { |
|
1120 | - # Reached closing marker while inside a three-char emphasis. |
|
1121 | - if ($token_len == 3) { |
|
1122 | - # Three-char closing marker, close em and strong. |
|
1123 | - array_shift($token_stack); |
|
1124 | - $span = array_shift($text_stack); |
|
1125 | - $span = $this->runSpanGamut($span); |
|
1126 | - $span = "<strong><em>$span</em></strong>"; |
|
1127 | - $text_stack[0] .= $this->hashPart($span); |
|
1128 | - $em = ''; |
|
1129 | - $strong = ''; |
|
1130 | - } else { |
|
1131 | - # Other closing marker: close one em or strong and |
|
1132 | - # change current token state to match the other |
|
1133 | - $token_stack[0] = str_repeat($token{0}, 3-$token_len); |
|
1134 | - $tag = $token_len == 2 ? "strong" : "em"; |
|
1135 | - $span = $text_stack[0]; |
|
1136 | - $span = $this->runSpanGamut($span); |
|
1137 | - $span = "<$tag>$span</$tag>"; |
|
1138 | - $text_stack[0] = $this->hashPart($span); |
|
1139 | - $$tag = ''; # $$tag stands for $em or $strong |
|
1140 | - } |
|
1141 | - $tree_char_em = false; |
|
1142 | - } else if ($token_len == 3) { |
|
1143 | - if ($em) { |
|
1144 | - # Reached closing marker for both em and strong. |
|
1145 | - # Closing strong marker: |
|
1146 | - for ($i = 0; $i < 2; ++$i) { |
|
1147 | - $shifted_token = array_shift($token_stack); |
|
1148 | - $tag = strlen($shifted_token) == 2 ? "strong" : "em"; |
|
1149 | - $span = array_shift($text_stack); |
|
1150 | - $span = $this->runSpanGamut($span); |
|
1151 | - $span = "<$tag>$span</$tag>"; |
|
1152 | - $text_stack[0] .= $this->hashPart($span); |
|
1153 | - $$tag = ''; # $$tag stands for $em or $strong |
|
1154 | - } |
|
1155 | - } else { |
|
1156 | - # Reached opening three-char emphasis marker. Push on token |
|
1157 | - # stack; will be handled by the special condition above. |
|
1158 | - $em = $token{0}; |
|
1159 | - $strong = "$em$em"; |
|
1160 | - array_unshift($token_stack, $token); |
|
1161 | - array_unshift($text_stack, ''); |
|
1162 | - $tree_char_em = true; |
|
1163 | - } |
|
1164 | - } else if ($token_len == 2) { |
|
1165 | - if ($strong) { |
|
1166 | - # Unwind any dangling emphasis marker: |
|
1167 | - if (strlen($token_stack[0]) == 1) { |
|
1168 | - $text_stack[1] .= array_shift($token_stack); |
|
1169 | - $text_stack[0] .= array_shift($text_stack); |
|
1170 | - } |
|
1171 | - # Closing strong marker: |
|
1172 | - array_shift($token_stack); |
|
1173 | - $span = array_shift($text_stack); |
|
1174 | - $span = $this->runSpanGamut($span); |
|
1175 | - $span = "<strong>$span</strong>"; |
|
1176 | - $text_stack[0] .= $this->hashPart($span); |
|
1177 | - $strong = ''; |
|
1178 | - } else { |
|
1179 | - array_unshift($token_stack, $token); |
|
1180 | - array_unshift($text_stack, ''); |
|
1181 | - $strong = $token; |
|
1182 | - } |
|
1183 | - } else { |
|
1184 | - # Here $token_len == 1 |
|
1185 | - if ($em) { |
|
1186 | - if (strlen($token_stack[0]) == 1) { |
|
1187 | - # Closing emphasis marker: |
|
1188 | - array_shift($token_stack); |
|
1189 | - $span = array_shift($text_stack); |
|
1190 | - $span = $this->runSpanGamut($span); |
|
1191 | - $span = "<em>$span</em>"; |
|
1192 | - $text_stack[0] .= $this->hashPart($span); |
|
1193 | - $em = ''; |
|
1194 | - } else { |
|
1195 | - $text_stack[0] .= $token; |
|
1196 | - } |
|
1197 | - } else { |
|
1198 | - array_unshift($token_stack, $token); |
|
1199 | - array_unshift($text_stack, ''); |
|
1200 | - $em = $token; |
|
1201 | - } |
|
1202 | - } |
|
1203 | - } |
|
1204 | - return $text_stack[0]; |
|
1205 | - } |
|
1206 | - |
|
1207 | - |
|
1208 | - protected function doBlockQuotes($text) { |
|
1209 | - $text = preg_replace_callback('/ |
|
1118 | + $token_len = strlen($token); |
|
1119 | + if ($tree_char_em) { |
|
1120 | + # Reached closing marker while inside a three-char emphasis. |
|
1121 | + if ($token_len == 3) { |
|
1122 | + # Three-char closing marker, close em and strong. |
|
1123 | + array_shift($token_stack); |
|
1124 | + $span = array_shift($text_stack); |
|
1125 | + $span = $this->runSpanGamut($span); |
|
1126 | + $span = "<strong><em>$span</em></strong>"; |
|
1127 | + $text_stack[0] .= $this->hashPart($span); |
|
1128 | + $em = ''; |
|
1129 | + $strong = ''; |
|
1130 | + } else { |
|
1131 | + # Other closing marker: close one em or strong and |
|
1132 | + # change current token state to match the other |
|
1133 | + $token_stack[0] = str_repeat($token{0}, 3-$token_len); |
|
1134 | + $tag = $token_len == 2 ? "strong" : "em"; |
|
1135 | + $span = $text_stack[0]; |
|
1136 | + $span = $this->runSpanGamut($span); |
|
1137 | + $span = "<$tag>$span</$tag>"; |
|
1138 | + $text_stack[0] = $this->hashPart($span); |
|
1139 | + $$tag = ''; # $$tag stands for $em or $strong |
|
1140 | + } |
|
1141 | + $tree_char_em = false; |
|
1142 | + } else if ($token_len == 3) { |
|
1143 | + if ($em) { |
|
1144 | + # Reached closing marker for both em and strong. |
|
1145 | + # Closing strong marker: |
|
1146 | + for ($i = 0; $i < 2; ++$i) { |
|
1147 | + $shifted_token = array_shift($token_stack); |
|
1148 | + $tag = strlen($shifted_token) == 2 ? "strong" : "em"; |
|
1149 | + $span = array_shift($text_stack); |
|
1150 | + $span = $this->runSpanGamut($span); |
|
1151 | + $span = "<$tag>$span</$tag>"; |
|
1152 | + $text_stack[0] .= $this->hashPart($span); |
|
1153 | + $$tag = ''; # $$tag stands for $em or $strong |
|
1154 | + } |
|
1155 | + } else { |
|
1156 | + # Reached opening three-char emphasis marker. Push on token |
|
1157 | + # stack; will be handled by the special condition above. |
|
1158 | + $em = $token{0}; |
|
1159 | + $strong = "$em$em"; |
|
1160 | + array_unshift($token_stack, $token); |
|
1161 | + array_unshift($text_stack, ''); |
|
1162 | + $tree_char_em = true; |
|
1163 | + } |
|
1164 | + } else if ($token_len == 2) { |
|
1165 | + if ($strong) { |
|
1166 | + # Unwind any dangling emphasis marker: |
|
1167 | + if (strlen($token_stack[0]) == 1) { |
|
1168 | + $text_stack[1] .= array_shift($token_stack); |
|
1169 | + $text_stack[0] .= array_shift($text_stack); |
|
1170 | + } |
|
1171 | + # Closing strong marker: |
|
1172 | + array_shift($token_stack); |
|
1173 | + $span = array_shift($text_stack); |
|
1174 | + $span = $this->runSpanGamut($span); |
|
1175 | + $span = "<strong>$span</strong>"; |
|
1176 | + $text_stack[0] .= $this->hashPart($span); |
|
1177 | + $strong = ''; |
|
1178 | + } else { |
|
1179 | + array_unshift($token_stack, $token); |
|
1180 | + array_unshift($text_stack, ''); |
|
1181 | + $strong = $token; |
|
1182 | + } |
|
1183 | + } else { |
|
1184 | + # Here $token_len == 1 |
|
1185 | + if ($em) { |
|
1186 | + if (strlen($token_stack[0]) == 1) { |
|
1187 | + # Closing emphasis marker: |
|
1188 | + array_shift($token_stack); |
|
1189 | + $span = array_shift($text_stack); |
|
1190 | + $span = $this->runSpanGamut($span); |
|
1191 | + $span = "<em>$span</em>"; |
|
1192 | + $text_stack[0] .= $this->hashPart($span); |
|
1193 | + $em = ''; |
|
1194 | + } else { |
|
1195 | + $text_stack[0] .= $token; |
|
1196 | + } |
|
1197 | + } else { |
|
1198 | + array_unshift($token_stack, $token); |
|
1199 | + array_unshift($text_stack, ''); |
|
1200 | + $em = $token; |
|
1201 | + } |
|
1202 | + } |
|
1203 | + } |
|
1204 | + return $text_stack[0]; |
|
1205 | + } |
|
1206 | + |
|
1207 | + |
|
1208 | + protected function doBlockQuotes($text) { |
|
1209 | + $text = preg_replace_callback('/ |
|
1210 | 1210 | ( # Wrap whole match in $1 |
1211 | 1211 | (?> |
1212 | 1212 | ^[ ]*>[ ]? # ">" at the start of a line |
@@ -1216,58 +1216,58 @@ discard block |
||
1216 | 1216 | )+ |
1217 | 1217 | ) |
1218 | 1218 | /xm', |
1219 | - array($this, '_doBlockQuotes_callback'), $text); |
|
1220 | - |
|
1221 | - return $text; |
|
1222 | - } |
|
1223 | - protected function _doBlockQuotes_callback($matches) { |
|
1224 | - $bq = $matches[1]; |
|
1225 | - # trim one level of quoting - trim whitespace-only lines |
|
1226 | - $bq = preg_replace('/^[ ]*>[ ]?|^[ ]+$/m', '', $bq); |
|
1227 | - $bq = $this->runBlockGamut($bq); # recurse |
|
1228 | - |
|
1229 | - $bq = preg_replace('/^/m', " ", $bq); |
|
1230 | - # These leading spaces cause problem with <pre> content, |
|
1231 | - # so we need to fix that: |
|
1232 | - $bq = preg_replace_callback('{(\s*<pre>.+?</pre>)}sx', |
|
1233 | - array($this, '_doBlockQuotes_callback2'), $bq); |
|
1234 | - |
|
1235 | - return "\n". $this->hashBlock("<blockquote>\n$bq\n</blockquote>")."\n\n"; |
|
1236 | - } |
|
1237 | - protected function _doBlockQuotes_callback2($matches) { |
|
1238 | - $pre = $matches[1]; |
|
1239 | - $pre = preg_replace('/^ /m', '', $pre); |
|
1240 | - return $pre; |
|
1241 | - } |
|
1242 | - |
|
1243 | - |
|
1244 | - protected function formParagraphs($text) { |
|
1245 | - # |
|
1246 | - # Params: |
|
1247 | - # $text - string to process with html <p> tags |
|
1248 | - # |
|
1249 | - # Strip leading and trailing lines: |
|
1250 | - $text = preg_replace('/\A\n+|\n+\z/', '', $text); |
|
1251 | - |
|
1252 | - $grafs = preg_split('/\n{2,}/', $text, -1, PREG_SPLIT_NO_EMPTY); |
|
1253 | - |
|
1254 | - # |
|
1255 | - # Wrap <p> tags and unhashify HTML blocks |
|
1256 | - # |
|
1257 | - foreach ($grafs as $key => $value) { |
|
1258 | - if (!preg_match('/^B\x1A[0-9]+B$/', $value)) { |
|
1259 | - # Is a paragraph. |
|
1260 | - $value = $this->runSpanGamut($value); |
|
1261 | - $value = preg_replace('/^([ ]*)/', "<p>", $value); |
|
1262 | - $value .= "</p>"; |
|
1263 | - $grafs[$key] = $this->unhash($value); |
|
1264 | - } |
|
1265 | - else { |
|
1266 | - # Is a block. |
|
1267 | - # Modify elements of @grafs in-place... |
|
1268 | - $graf = $value; |
|
1269 | - $block = $this->html_hashes[$graf]; |
|
1270 | - $graf = $block; |
|
1219 | + array($this, '_doBlockQuotes_callback'), $text); |
|
1220 | + |
|
1221 | + return $text; |
|
1222 | + } |
|
1223 | + protected function _doBlockQuotes_callback($matches) { |
|
1224 | + $bq = $matches[1]; |
|
1225 | + # trim one level of quoting - trim whitespace-only lines |
|
1226 | + $bq = preg_replace('/^[ ]*>[ ]?|^[ ]+$/m', '', $bq); |
|
1227 | + $bq = $this->runBlockGamut($bq); # recurse |
|
1228 | + |
|
1229 | + $bq = preg_replace('/^/m', " ", $bq); |
|
1230 | + # These leading spaces cause problem with <pre> content, |
|
1231 | + # so we need to fix that: |
|
1232 | + $bq = preg_replace_callback('{(\s*<pre>.+?</pre>)}sx', |
|
1233 | + array($this, '_doBlockQuotes_callback2'), $bq); |
|
1234 | + |
|
1235 | + return "\n". $this->hashBlock("<blockquote>\n$bq\n</blockquote>")."\n\n"; |
|
1236 | + } |
|
1237 | + protected function _doBlockQuotes_callback2($matches) { |
|
1238 | + $pre = $matches[1]; |
|
1239 | + $pre = preg_replace('/^ /m', '', $pre); |
|
1240 | + return $pre; |
|
1241 | + } |
|
1242 | + |
|
1243 | + |
|
1244 | + protected function formParagraphs($text) { |
|
1245 | + # |
|
1246 | + # Params: |
|
1247 | + # $text - string to process with html <p> tags |
|
1248 | + # |
|
1249 | + # Strip leading and trailing lines: |
|
1250 | + $text = preg_replace('/\A\n+|\n+\z/', '', $text); |
|
1251 | + |
|
1252 | + $grafs = preg_split('/\n{2,}/', $text, -1, PREG_SPLIT_NO_EMPTY); |
|
1253 | + |
|
1254 | + # |
|
1255 | + # Wrap <p> tags and unhashify HTML blocks |
|
1256 | + # |
|
1257 | + foreach ($grafs as $key => $value) { |
|
1258 | + if (!preg_match('/^B\x1A[0-9]+B$/', $value)) { |
|
1259 | + # Is a paragraph. |
|
1260 | + $value = $this->runSpanGamut($value); |
|
1261 | + $value = preg_replace('/^([ ]*)/', "<p>", $value); |
|
1262 | + $value .= "</p>"; |
|
1263 | + $grafs[$key] = $this->unhash($value); |
|
1264 | + } |
|
1265 | + else { |
|
1266 | + # Is a block. |
|
1267 | + # Modify elements of @grafs in-place... |
|
1268 | + $graf = $value; |
|
1269 | + $block = $this->html_hashes[$graf]; |
|
1270 | + $graf = $block; |
|
1271 | 1271 | // if (preg_match('{ |
1272 | 1272 | // \A |
1273 | 1273 | // ( # $1 = <div> tag |
@@ -1303,79 +1303,79 @@ discard block |
||
1303 | 1303 | // |
1304 | 1304 | // $graf = $div_open . "\n" . $div_content . "\n" . $div_close; |
1305 | 1305 | // } |
1306 | - $grafs[$key] = $graf; |
|
1307 | - } |
|
1308 | - } |
|
1309 | - |
|
1310 | - return implode("\n\n", $grafs); |
|
1311 | - } |
|
1312 | - |
|
1313 | - |
|
1314 | - protected function encodeAttribute($text) { |
|
1315 | - # |
|
1316 | - # Encode text for a double-quoted HTML attribute. This function |
|
1317 | - # is *not* suitable for attributes enclosed in single quotes. |
|
1318 | - # |
|
1319 | - $text = $this->encodeAmpsAndAngles($text); |
|
1320 | - $text = str_replace('"', '"', $text); |
|
1321 | - return $text; |
|
1322 | - } |
|
1323 | - |
|
1324 | - |
|
1325 | - protected function encodeURLAttribute($url, &$text = null) { |
|
1326 | - # |
|
1327 | - # Encode text for a double-quoted HTML attribute containing a URL, |
|
1328 | - # applying the URL filter if set. Also generates the textual |
|
1329 | - # representation for the URL (removing mailto: or tel:) storing it in $text. |
|
1330 | - # This function is *not* suitable for attributes enclosed in single quotes. |
|
1331 | - # |
|
1332 | - if ($this->url_filter_func) |
|
1333 | - $url = call_user_func($this->url_filter_func, $url); |
|
1334 | - |
|
1335 | - if (preg_match('{^mailto:}i', $url)) |
|
1336 | - $url = $this->encodeEntityObfuscatedAttribute($url, $text, 7); |
|
1337 | - else if (preg_match('{^tel:}i', $url)) |
|
1338 | - { |
|
1339 | - $url = $this->encodeAttribute($url); |
|
1340 | - $text = substr($url, 4); |
|
1341 | - } |
|
1342 | - else |
|
1343 | - { |
|
1344 | - $url = $this->encodeAttribute($url); |
|
1345 | - $text = $url; |
|
1346 | - } |
|
1347 | - |
|
1348 | - return $url; |
|
1349 | - } |
|
1306 | + $grafs[$key] = $graf; |
|
1307 | + } |
|
1308 | + } |
|
1309 | + |
|
1310 | + return implode("\n\n", $grafs); |
|
1311 | + } |
|
1312 | + |
|
1313 | + |
|
1314 | + protected function encodeAttribute($text) { |
|
1315 | + # |
|
1316 | + # Encode text for a double-quoted HTML attribute. This function |
|
1317 | + # is *not* suitable for attributes enclosed in single quotes. |
|
1318 | + # |
|
1319 | + $text = $this->encodeAmpsAndAngles($text); |
|
1320 | + $text = str_replace('"', '"', $text); |
|
1321 | + return $text; |
|
1322 | + } |
|
1323 | + |
|
1324 | + |
|
1325 | + protected function encodeURLAttribute($url, &$text = null) { |
|
1326 | + # |
|
1327 | + # Encode text for a double-quoted HTML attribute containing a URL, |
|
1328 | + # applying the URL filter if set. Also generates the textual |
|
1329 | + # representation for the URL (removing mailto: or tel:) storing it in $text. |
|
1330 | + # This function is *not* suitable for attributes enclosed in single quotes. |
|
1331 | + # |
|
1332 | + if ($this->url_filter_func) |
|
1333 | + $url = call_user_func($this->url_filter_func, $url); |
|
1334 | + |
|
1335 | + if (preg_match('{^mailto:}i', $url)) |
|
1336 | + $url = $this->encodeEntityObfuscatedAttribute($url, $text, 7); |
|
1337 | + else if (preg_match('{^tel:}i', $url)) |
|
1338 | + { |
|
1339 | + $url = $this->encodeAttribute($url); |
|
1340 | + $text = substr($url, 4); |
|
1341 | + } |
|
1342 | + else |
|
1343 | + { |
|
1344 | + $url = $this->encodeAttribute($url); |
|
1345 | + $text = $url; |
|
1346 | + } |
|
1347 | + |
|
1348 | + return $url; |
|
1349 | + } |
|
1350 | 1350 | |
1351 | 1351 | |
1352 | - protected function encodeAmpsAndAngles($text) { |
|
1353 | - # |
|
1354 | - # Smart processing for ampersands and angle brackets that need to |
|
1355 | - # be encoded. Valid character entities are left alone unless the |
|
1356 | - # no-entities mode is set. |
|
1357 | - # |
|
1358 | - if ($this->no_entities) { |
|
1359 | - $text = str_replace('&', '&', $text); |
|
1360 | - } else { |
|
1361 | - # Ampersand-encoding based entirely on Nat Irons's Amputator |
|
1362 | - # MT plugin: <http://bumppo.net/projects/amputator/> |
|
1363 | - $text = preg_replace('/&(?!#?[xX]?(?:[0-9a-fA-F]+|\w+);)/', |
|
1364 | - '&', $text); |
|
1365 | - } |
|
1366 | - # Encode remaining <'s |
|
1367 | - $text = str_replace('<', '<', $text); |
|
1368 | - |
|
1369 | - return $text; |
|
1370 | - } |
|
1371 | - |
|
1372 | - |
|
1373 | - protected function doAutoLinks($text) { |
|
1374 | - $text = preg_replace_callback('{<((https?|ftp|dict|tel):[^\'">\s]+)>}i', |
|
1375 | - array($this, '_doAutoLinks_url_callback'), $text); |
|
1376 | - |
|
1377 | - # Email addresses: <[email protected]> |
|
1378 | - $text = preg_replace_callback('{ |
|
1352 | + protected function encodeAmpsAndAngles($text) { |
|
1353 | + # |
|
1354 | + # Smart processing for ampersands and angle brackets that need to |
|
1355 | + # be encoded. Valid character entities are left alone unless the |
|
1356 | + # no-entities mode is set. |
|
1357 | + # |
|
1358 | + if ($this->no_entities) { |
|
1359 | + $text = str_replace('&', '&', $text); |
|
1360 | + } else { |
|
1361 | + # Ampersand-encoding based entirely on Nat Irons's Amputator |
|
1362 | + # MT plugin: <http://bumppo.net/projects/amputator/> |
|
1363 | + $text = preg_replace('/&(?!#?[xX]?(?:[0-9a-fA-F]+|\w+);)/', |
|
1364 | + '&', $text); |
|
1365 | + } |
|
1366 | + # Encode remaining <'s |
|
1367 | + $text = str_replace('<', '<', $text); |
|
1368 | + |
|
1369 | + return $text; |
|
1370 | + } |
|
1371 | + |
|
1372 | + |
|
1373 | + protected function doAutoLinks($text) { |
|
1374 | + $text = preg_replace_callback('{<((https?|ftp|dict|tel):[^\'">\s]+)>}i', |
|
1375 | + array($this, '_doAutoLinks_url_callback'), $text); |
|
1376 | + |
|
1377 | + # Email addresses: <[email protected]> |
|
1378 | + $text = preg_replace_callback('{ |
|
1379 | 1379 | < |
1380 | 1380 | (?:mailto:)? |
1381 | 1381 | ( |
@@ -1393,76 +1393,76 @@ discard block |
||
1393 | 1393 | ) |
1394 | 1394 | > |
1395 | 1395 | }xi', |
1396 | - array($this, '_doAutoLinks_email_callback'), $text); |
|
1397 | - |
|
1398 | - return $text; |
|
1399 | - } |
|
1400 | - protected function _doAutoLinks_url_callback($matches) { |
|
1401 | - $url = $this->encodeURLAttribute($matches[1], $text); |
|
1402 | - $link = "<a href=\"$url\">$text</a>"; |
|
1403 | - return $this->hashPart($link); |
|
1404 | - } |
|
1405 | - protected function _doAutoLinks_email_callback($matches) { |
|
1406 | - $addr = $matches[1]; |
|
1407 | - $url = $this->encodeURLAttribute("mailto:$addr", $text); |
|
1408 | - $link = "<a href=\"$url\">$text</a>"; |
|
1409 | - return $this->hashPart($link); |
|
1410 | - } |
|
1411 | - |
|
1412 | - |
|
1413 | - protected function encodeEntityObfuscatedAttribute($text, &$tail = null, $head_length = 0) { |
|
1414 | - # |
|
1415 | - # Input: some text to obfuscate, e.g. "mailto:[email protected]" |
|
1416 | - # |
|
1417 | - # Output: the same text but with most characters encoded as either a |
|
1418 | - # decimal or hex entity, in the hopes of foiling most address |
|
1419 | - # harvesting spam bots. E.g.: |
|
1420 | - # |
|
1421 | - # mailto:foo |
|
1422 | - # @example.co |
|
1423 | - # m |
|
1424 | - # |
|
1425 | - # Note: the additional output $tail is assigned the same value as the |
|
1426 | - # ouput, minus the number of characters specified by $head_length. |
|
1427 | - # |
|
1428 | - # Based by a filter by Matthew Wickline, posted to BBEdit-Talk. |
|
1429 | - # With some optimizations by Milian Wolff. Forced encoding of HTML |
|
1430 | - # attribute special characters by Allan Odgaard. |
|
1431 | - # |
|
1432 | - if ($text == "") return $tail = ""; |
|
1433 | - |
|
1434 | - $chars = preg_split('/(?<!^)(?!$)/', $text); |
|
1435 | - $seed = (int)abs(crc32($text) / strlen($text)); # Deterministic seed. |
|
1436 | - |
|
1437 | - foreach ($chars as $key => $char) { |
|
1438 | - $ord = ord($char); |
|
1439 | - # Ignore non-ascii chars. |
|
1440 | - if ($ord < 128) { |
|
1441 | - $r = ($seed * (1 + $key)) % 100; # Pseudo-random function. |
|
1442 | - # roughly 10% raw, 45% hex, 45% dec |
|
1443 | - # '@' *must* be encoded. I insist. |
|
1444 | - # '"' and '>' have to be encoded inside the attribute |
|
1445 | - if ($r > 90 && strpos('@"&>', $char) === false) /* do nothing */; |
|
1446 | - else if ($r < 45) $chars[$key] = '&#x'.dechex($ord).';'; |
|
1447 | - else $chars[$key] = '&#'.$ord.';'; |
|
1448 | - } |
|
1449 | - } |
|
1450 | - |
|
1451 | - $text = implode('', $chars); |
|
1452 | - $tail = $head_length ? implode('', array_slice($chars, $head_length)) : $text; |
|
1453 | - |
|
1454 | - return $text; |
|
1455 | - } |
|
1456 | - |
|
1457 | - |
|
1458 | - protected function parseSpan($str) { |
|
1459 | - # |
|
1460 | - # Take the string $str and parse it into tokens, hashing embeded HTML, |
|
1461 | - # escaped characters and handling code spans. |
|
1462 | - # |
|
1463 | - $output = ''; |
|
1396 | + array($this, '_doAutoLinks_email_callback'), $text); |
|
1397 | + |
|
1398 | + return $text; |
|
1399 | + } |
|
1400 | + protected function _doAutoLinks_url_callback($matches) { |
|
1401 | + $url = $this->encodeURLAttribute($matches[1], $text); |
|
1402 | + $link = "<a href=\"$url\">$text</a>"; |
|
1403 | + return $this->hashPart($link); |
|
1404 | + } |
|
1405 | + protected function _doAutoLinks_email_callback($matches) { |
|
1406 | + $addr = $matches[1]; |
|
1407 | + $url = $this->encodeURLAttribute("mailto:$addr", $text); |
|
1408 | + $link = "<a href=\"$url\">$text</a>"; |
|
1409 | + return $this->hashPart($link); |
|
1410 | + } |
|
1411 | + |
|
1412 | + |
|
1413 | + protected function encodeEntityObfuscatedAttribute($text, &$tail = null, $head_length = 0) { |
|
1414 | + # |
|
1415 | + # Input: some text to obfuscate, e.g. "mailto:[email protected]" |
|
1416 | + # |
|
1417 | + # Output: the same text but with most characters encoded as either a |
|
1418 | + # decimal or hex entity, in the hopes of foiling most address |
|
1419 | + # harvesting spam bots. E.g.: |
|
1420 | + # |
|
1421 | + # mailto:foo |
|
1422 | + # @example.co |
|
1423 | + # m |
|
1424 | + # |
|
1425 | + # Note: the additional output $tail is assigned the same value as the |
|
1426 | + # ouput, minus the number of characters specified by $head_length. |
|
1427 | + # |
|
1428 | + # Based by a filter by Matthew Wickline, posted to BBEdit-Talk. |
|
1429 | + # With some optimizations by Milian Wolff. Forced encoding of HTML |
|
1430 | + # attribute special characters by Allan Odgaard. |
|
1431 | + # |
|
1432 | + if ($text == "") return $tail = ""; |
|
1433 | + |
|
1434 | + $chars = preg_split('/(?<!^)(?!$)/', $text); |
|
1435 | + $seed = (int)abs(crc32($text) / strlen($text)); # Deterministic seed. |
|
1436 | + |
|
1437 | + foreach ($chars as $key => $char) { |
|
1438 | + $ord = ord($char); |
|
1439 | + # Ignore non-ascii chars. |
|
1440 | + if ($ord < 128) { |
|
1441 | + $r = ($seed * (1 + $key)) % 100; # Pseudo-random function. |
|
1442 | + # roughly 10% raw, 45% hex, 45% dec |
|
1443 | + # '@' *must* be encoded. I insist. |
|
1444 | + # '"' and '>' have to be encoded inside the attribute |
|
1445 | + if ($r > 90 && strpos('@"&>', $char) === false) /* do nothing */; |
|
1446 | + else if ($r < 45) $chars[$key] = '&#x'.dechex($ord).';'; |
|
1447 | + else $chars[$key] = '&#'.$ord.';'; |
|
1448 | + } |
|
1449 | + } |
|
1450 | + |
|
1451 | + $text = implode('', $chars); |
|
1452 | + $tail = $head_length ? implode('', array_slice($chars, $head_length)) : $text; |
|
1453 | + |
|
1454 | + return $text; |
|
1455 | + } |
|
1456 | + |
|
1457 | + |
|
1458 | + protected function parseSpan($str) { |
|
1459 | + # |
|
1460 | + # Take the string $str and parse it into tokens, hashing embeded HTML, |
|
1461 | + # escaped characters and handling code spans. |
|
1462 | + # |
|
1463 | + $output = ''; |
|
1464 | 1464 | |
1465 | - $span_re = '{ |
|
1465 | + $span_re = '{ |
|
1466 | 1466 | ( |
1467 | 1467 | \\\\'.$this->escape_chars_re.' |
1468 | 1468 | | |
@@ -1488,122 +1488,122 @@ discard block |
||
1488 | 1488 | ) |
1489 | 1489 | }xs'; |
1490 | 1490 | |
1491 | - while (1) { |
|
1492 | - # |
|
1493 | - # Each loop iteration seach for either the next tag, the next |
|
1494 | - # openning code span marker, or the next escaped character. |
|
1495 | - # Each token is then passed to handleSpanToken. |
|
1496 | - # |
|
1497 | - $parts = preg_split($span_re, $str, 2, PREG_SPLIT_DELIM_CAPTURE); |
|
1491 | + while (1) { |
|
1492 | + # |
|
1493 | + # Each loop iteration seach for either the next tag, the next |
|
1494 | + # openning code span marker, or the next escaped character. |
|
1495 | + # Each token is then passed to handleSpanToken. |
|
1496 | + # |
|
1497 | + $parts = preg_split($span_re, $str, 2, PREG_SPLIT_DELIM_CAPTURE); |
|
1498 | 1498 | |
1499 | - # Create token from text preceding tag. |
|
1500 | - if ($parts[0] != "") { |
|
1501 | - $output .= $parts[0]; |
|
1502 | - } |
|
1499 | + # Create token from text preceding tag. |
|
1500 | + if ($parts[0] != "") { |
|
1501 | + $output .= $parts[0]; |
|
1502 | + } |
|
1503 | 1503 | |
1504 | - # Check if we reach the end. |
|
1505 | - if (isset($parts[1])) { |
|
1506 | - $output .= $this->handleSpanToken($parts[1], $parts[2]); |
|
1507 | - $str = $parts[2]; |
|
1508 | - } |
|
1509 | - else { |
|
1510 | - break; |
|
1511 | - } |
|
1512 | - } |
|
1504 | + # Check if we reach the end. |
|
1505 | + if (isset($parts[1])) { |
|
1506 | + $output .= $this->handleSpanToken($parts[1], $parts[2]); |
|
1507 | + $str = $parts[2]; |
|
1508 | + } |
|
1509 | + else { |
|
1510 | + break; |
|
1511 | + } |
|
1512 | + } |
|
1513 | 1513 | |
1514 | - return $output; |
|
1515 | - } |
|
1514 | + return $output; |
|
1515 | + } |
|
1516 | 1516 | |
1517 | 1517 | |
1518 | - protected function handleSpanToken($token, &$str) { |
|
1519 | - # |
|
1520 | - # Handle $token provided by parseSpan by determining its nature and |
|
1521 | - # returning the corresponding value that should replace it. |
|
1522 | - # |
|
1523 | - switch ($token{0}) { |
|
1524 | - case "\\": |
|
1525 | - return $this->hashPart("&#". ord($token{1}). ";"); |
|
1526 | - case "`": |
|
1527 | - # Search for end marker in remaining text. |
|
1528 | - if (preg_match('/^(.*?[^`])'.preg_quote($token).'(?!`)(.*)$/sm', |
|
1529 | - $str, $matches)) |
|
1530 | - { |
|
1531 | - $str = $matches[2]; |
|
1532 | - $codespan = $this->makeCodeSpan($matches[1]); |
|
1533 | - return $this->hashPart($codespan); |
|
1534 | - } |
|
1535 | - return $token; // return as text since no ending marker found. |
|
1536 | - default: |
|
1537 | - return $this->hashPart($token); |
|
1538 | - } |
|
1539 | - } |
|
1540 | - |
|
1541 | - |
|
1542 | - protected function outdent($text) { |
|
1543 | - # |
|
1544 | - # Remove one level of line-leading tabs or spaces |
|
1545 | - # |
|
1546 | - return preg_replace('/^(\t|[ ]{1,'.$this->tab_width.'})/m', '', $text); |
|
1547 | - } |
|
1548 | - |
|
1549 | - |
|
1550 | - # String length function for detab. `_initDetab` will create a function to |
|
1551 | - # hanlde UTF-8 if the default function does not exist. |
|
1552 | - protected $utf8_strlen = 'mb_strlen'; |
|
1518 | + protected function handleSpanToken($token, &$str) { |
|
1519 | + # |
|
1520 | + # Handle $token provided by parseSpan by determining its nature and |
|
1521 | + # returning the corresponding value that should replace it. |
|
1522 | + # |
|
1523 | + switch ($token{0}) { |
|
1524 | + case "\\": |
|
1525 | + return $this->hashPart("&#". ord($token{1}). ";"); |
|
1526 | + case "`": |
|
1527 | + # Search for end marker in remaining text. |
|
1528 | + if (preg_match('/^(.*?[^`])'.preg_quote($token).'(?!`)(.*)$/sm', |
|
1529 | + $str, $matches)) |
|
1530 | + { |
|
1531 | + $str = $matches[2]; |
|
1532 | + $codespan = $this->makeCodeSpan($matches[1]); |
|
1533 | + return $this->hashPart($codespan); |
|
1534 | + } |
|
1535 | + return $token; // return as text since no ending marker found. |
|
1536 | + default: |
|
1537 | + return $this->hashPart($token); |
|
1538 | + } |
|
1539 | + } |
|
1540 | + |
|
1541 | + |
|
1542 | + protected function outdent($text) { |
|
1543 | + # |
|
1544 | + # Remove one level of line-leading tabs or spaces |
|
1545 | + # |
|
1546 | + return preg_replace('/^(\t|[ ]{1,'.$this->tab_width.'})/m', '', $text); |
|
1547 | + } |
|
1548 | + |
|
1549 | + |
|
1550 | + # String length function for detab. `_initDetab` will create a function to |
|
1551 | + # hanlde UTF-8 if the default function does not exist. |
|
1552 | + protected $utf8_strlen = 'mb_strlen'; |
|
1553 | 1553 | |
1554 | - protected function detab($text) { |
|
1555 | - # |
|
1556 | - # Replace tabs with the appropriate amount of space. |
|
1557 | - # |
|
1558 | - # For each line we separate the line in blocks delemited by |
|
1559 | - # tab characters. Then we reconstruct every line by adding the |
|
1560 | - # appropriate number of space between each blocks. |
|
1554 | + protected function detab($text) { |
|
1555 | + # |
|
1556 | + # Replace tabs with the appropriate amount of space. |
|
1557 | + # |
|
1558 | + # For each line we separate the line in blocks delemited by |
|
1559 | + # tab characters. Then we reconstruct every line by adding the |
|
1560 | + # appropriate number of space between each blocks. |
|
1561 | 1561 | |
1562 | - $text = preg_replace_callback('/^.*\t.*$/m', |
|
1563 | - array($this, '_detab_callback'), $text); |
|
1564 | - |
|
1565 | - return $text; |
|
1566 | - } |
|
1567 | - protected function _detab_callback($matches) { |
|
1568 | - $line = $matches[0]; |
|
1569 | - $strlen = $this->utf8_strlen; # strlen function for UTF-8. |
|
1562 | + $text = preg_replace_callback('/^.*\t.*$/m', |
|
1563 | + array($this, '_detab_callback'), $text); |
|
1564 | + |
|
1565 | + return $text; |
|
1566 | + } |
|
1567 | + protected function _detab_callback($matches) { |
|
1568 | + $line = $matches[0]; |
|
1569 | + $strlen = $this->utf8_strlen; # strlen function for UTF-8. |
|
1570 | 1570 | |
1571 | - # Split in blocks. |
|
1572 | - $blocks = explode("\t", $line); |
|
1573 | - # Add each blocks to the line. |
|
1574 | - $line = $blocks[0]; |
|
1575 | - unset($blocks[0]); # Do not add first block twice. |
|
1576 | - foreach ($blocks as $block) { |
|
1577 | - # Calculate amount of space, insert spaces, insert block. |
|
1578 | - $amount = $this->tab_width - |
|
1579 | - $strlen($line, 'UTF-8') % $this->tab_width; |
|
1580 | - $line .= str_repeat(" ", $amount) . $block; |
|
1581 | - } |
|
1582 | - return $line; |
|
1583 | - } |
|
1584 | - protected function _initDetab() { |
|
1585 | - # |
|
1586 | - # Check for the availability of the function in the `utf8_strlen` property |
|
1587 | - # (initially `mb_strlen`). If the function is not available, create a |
|
1588 | - # function that will loosely count the number of UTF-8 characters with a |
|
1589 | - # regular expression. |
|
1590 | - # |
|
1591 | - if (function_exists($this->utf8_strlen)) return; |
|
1592 | - $this->utf8_strlen = create_function('$text', 'return preg_match_all( |
|
1571 | + # Split in blocks. |
|
1572 | + $blocks = explode("\t", $line); |
|
1573 | + # Add each blocks to the line. |
|
1574 | + $line = $blocks[0]; |
|
1575 | + unset($blocks[0]); # Do not add first block twice. |
|
1576 | + foreach ($blocks as $block) { |
|
1577 | + # Calculate amount of space, insert spaces, insert block. |
|
1578 | + $amount = $this->tab_width - |
|
1579 | + $strlen($line, 'UTF-8') % $this->tab_width; |
|
1580 | + $line .= str_repeat(" ", $amount) . $block; |
|
1581 | + } |
|
1582 | + return $line; |
|
1583 | + } |
|
1584 | + protected function _initDetab() { |
|
1585 | + # |
|
1586 | + # Check for the availability of the function in the `utf8_strlen` property |
|
1587 | + # (initially `mb_strlen`). If the function is not available, create a |
|
1588 | + # function that will loosely count the number of UTF-8 characters with a |
|
1589 | + # regular expression. |
|
1590 | + # |
|
1591 | + if (function_exists($this->utf8_strlen)) return; |
|
1592 | + $this->utf8_strlen = create_function('$text', 'return preg_match_all( |
|
1593 | 1593 | "/[\\\\x00-\\\\xBF]|[\\\\xC0-\\\\xFF][\\\\x80-\\\\xBF]*/", |
1594 | 1594 | $text, $m);'); |
1595 | - } |
|
1596 | - |
|
1597 | - |
|
1598 | - protected function unhash($text) { |
|
1599 | - # |
|
1600 | - # Swap back in all the tags hashed by _HashHTMLBlocks. |
|
1601 | - # |
|
1602 | - return preg_replace_callback('/(.)\x1A[0-9]+\1/', |
|
1603 | - array($this, '_unhash_callback'), $text); |
|
1604 | - } |
|
1605 | - protected function _unhash_callback($matches) { |
|
1606 | - return $this->html_hashes[$matches[0]]; |
|
1607 | - } |
|
1595 | + } |
|
1596 | + |
|
1597 | + |
|
1598 | + protected function unhash($text) { |
|
1599 | + # |
|
1600 | + # Swap back in all the tags hashed by _HashHTMLBlocks. |
|
1601 | + # |
|
1602 | + return preg_replace_callback('/(.)\x1A[0-9]+\1/', |
|
1603 | + array($this, '_unhash_callback'), $text); |
|
1604 | + } |
|
1605 | + protected function _unhash_callback($matches) { |
|
1606 | + return $this->html_hashes[$matches[0]]; |
|
1607 | + } |
|
1608 | 1608 | |
1609 | 1609 | } |
@@ -21,7 +21,7 @@ discard block |
||
21 | 21 | |
22 | 22 | ### Version ### |
23 | 23 | |
24 | - const MARKDOWNLIB_VERSION = "1.5.0"; |
|
24 | + const MARKDOWNLIB_VERSION = "1.5.0"; |
|
25 | 25 | |
26 | 26 | ### Simple Function Interface ### |
27 | 27 | |
@@ -35,7 +35,7 @@ discard block |
||
35 | 35 | |
36 | 36 | # try to take parser from the static parser list |
37 | 37 | static $parser_list; |
38 | - $parser =& $parser_list[$parser_class]; |
|
38 | + $parser = & $parser_list[$parser_class]; |
|
39 | 39 | |
40 | 40 | # create the parser it not already set |
41 | 41 | if (!$parser) |
@@ -186,7 +186,7 @@ discard block |
||
186 | 186 | |
187 | 187 | $this->teardown(); |
188 | 188 | |
189 | - return $text . "\n"; |
|
189 | + return $text."\n"; |
|
190 | 190 | } |
191 | 191 | |
192 | 192 | protected $document_gamut = array( |
@@ -235,7 +235,7 @@ discard block |
||
235 | 235 | $link_id = strtolower($matches[1]); |
236 | 236 | $url = $matches[2] == '' ? $matches[3] : $matches[2]; |
237 | 237 | $this->urls[$link_id] = $url; |
238 | - $this->titles[$link_id] =& $matches[4]; |
|
238 | + $this->titles[$link_id] = & $matches[4]; |
|
239 | 239 | return ''; # String that will replace the block |
240 | 240 | } |
241 | 241 | |
@@ -290,8 +290,8 @@ discard block |
||
290 | 290 | (?> |
291 | 291 | /> |
292 | 292 | | |
293 | - >', $nested_tags_level). # end of opening tag |
|
294 | - '.*?'. # last level nested tag content |
|
293 | + >', $nested_tags_level).# end of opening tag |
|
294 | + '.*?'.# last level nested tag content |
|
295 | 295 | str_repeat(' |
296 | 296 | </\2\s*> # closing nested tag |
297 | 297 | ) |
@@ -403,7 +403,7 @@ discard block |
||
403 | 403 | |
404 | 404 | # Then hash the block. |
405 | 405 | static $i = 0; |
406 | - $key = "$boundary\x1A" . ++$i . $boundary; |
|
406 | + $key = "$boundary\x1A".++$i.$boundary; |
|
407 | 407 | $this->html_hashes[$key] = $text; |
408 | 408 | return $key; # String that will replace the tag. |
409 | 409 | } |
@@ -596,9 +596,9 @@ discard block |
||
596 | 596 | return $text; |
597 | 597 | } |
598 | 598 | protected function _doAnchors_reference_callback($matches) { |
599 | - $whole_match = $matches[1]; |
|
600 | - $link_text = $matches[2]; |
|
601 | - $link_id =& $matches[3]; |
|
599 | + $whole_match = $matches[1]; |
|
600 | + $link_text = $matches[2]; |
|
601 | + $link_id = & $matches[3]; |
|
602 | 602 | |
603 | 603 | if ($link_id == "") { |
604 | 604 | # for shortcut links like [this][] or [this]. |
@@ -614,10 +614,10 @@ discard block |
||
614 | 614 | $url = $this->encodeURLAttribute($url); |
615 | 615 | |
616 | 616 | $result = "<a href=\"$url\""; |
617 | - if ( isset( $this->titles[$link_id] ) ) { |
|
617 | + if (isset($this->titles[$link_id])) { |
|
618 | 618 | $title = $this->titles[$link_id]; |
619 | 619 | $title = $this->encodeAttribute($title); |
620 | - $result .= " title=\"$title\""; |
|
620 | + $result .= " title=\"$title\""; |
|
621 | 621 | } |
622 | 622 | |
623 | 623 | $link_text = $this->runSpanGamut($link_text); |
@@ -630,10 +630,10 @@ discard block |
||
630 | 630 | return $result; |
631 | 631 | } |
632 | 632 | protected function _doAnchors_inline_callback($matches) { |
633 | - $whole_match = $matches[1]; |
|
634 | - $link_text = $this->runSpanGamut($matches[2]); |
|
635 | - $url = $matches[3] == '' ? $matches[4] : $matches[3]; |
|
636 | - $title =& $matches[7]; |
|
633 | + $whole_match = $matches[1]; |
|
634 | + $link_text = $this->runSpanGamut($matches[2]); |
|
635 | + $url = $matches[3] == '' ? $matches[4] : $matches[3]; |
|
636 | + $title = & $matches[7]; |
|
637 | 637 | |
638 | 638 | // if the URL was of the form <s p a c e s> it got caught by the HTML |
639 | 639 | // tag parser and hashed. Need to reverse the process before using the URL. |
@@ -646,7 +646,7 @@ discard block |
||
646 | 646 | $result = "<a href=\"$url\""; |
647 | 647 | if (isset($title)) { |
648 | 648 | $title = $this->encodeAttribute($title); |
649 | - $result .= " title=\"$title\""; |
|
649 | + $result .= " title=\"$title\""; |
|
650 | 650 | } |
651 | 651 | |
652 | 652 | $link_text = $this->runSpanGamut($link_text); |
@@ -727,7 +727,7 @@ discard block |
||
727 | 727 | if (isset($this->titles[$link_id])) { |
728 | 728 | $title = $this->titles[$link_id]; |
729 | 729 | $title = $this->encodeAttribute($title); |
730 | - $result .= " title=\"$title\""; |
|
730 | + $result .= " title=\"$title\""; |
|
731 | 731 | } |
732 | 732 | $result .= $this->empty_element_suffix; |
733 | 733 | $result = $this->hashPart($result); |
@@ -740,17 +740,17 @@ discard block |
||
740 | 740 | return $result; |
741 | 741 | } |
742 | 742 | protected function _doImages_inline_callback($matches) { |
743 | - $whole_match = $matches[1]; |
|
744 | - $alt_text = $matches[2]; |
|
745 | - $url = $matches[3] == '' ? $matches[4] : $matches[3]; |
|
746 | - $title =& $matches[7]; |
|
743 | + $whole_match = $matches[1]; |
|
744 | + $alt_text = $matches[2]; |
|
745 | + $url = $matches[3] == '' ? $matches[4] : $matches[3]; |
|
746 | + $title = & $matches[7]; |
|
747 | 747 | |
748 | 748 | $alt_text = $this->encodeAttribute($alt_text); |
749 | 749 | $url = $this->encodeURLAttribute($url); |
750 | 750 | $result = "<img src=\"$url\" alt=\"$alt_text\""; |
751 | 751 | if (isset($title)) { |
752 | 752 | $title = $this->encodeAttribute($title); |
753 | - $result .= " title=\"$title\""; # $title already quoted |
|
753 | + $result .= " title=\"$title\""; # $title already quoted |
|
754 | 754 | } |
755 | 755 | $result .= $this->empty_element_suffix; |
756 | 756 | |
@@ -800,7 +800,7 @@ discard block |
||
800 | 800 | $idAtt = $this->_generateIdFromHeaderValue($matches[1]); |
801 | 801 | |
802 | 802 | $block = "<h$level$idAtt>".$this->runSpanGamut($matches[1])."</h$level>"; |
803 | - return "\n" . $this->hashBlock($block) . "\n\n"; |
|
803 | + return "\n".$this->hashBlock($block)."\n\n"; |
|
804 | 804 | } |
805 | 805 | protected function _doHeaders_callback_atx($matches) { |
806 | 806 | |
@@ -809,7 +809,7 @@ discard block |
||
809 | 809 | |
810 | 810 | $level = strlen($matches[1]); |
811 | 811 | $block = "<h$level$idAtt>".$this->runSpanGamut($matches[2])."</h$level>"; |
812 | - return "\n" . $this->hashBlock($block) . "\n\n"; |
|
812 | + return "\n".$this->hashBlock($block)."\n\n"; |
|
813 | 813 | } |
814 | 814 | |
815 | 815 | protected function _generateIdFromHeaderValue($headerValue) { |
@@ -825,7 +825,7 @@ discard block |
||
825 | 825 | $idValue = call_user_func($this->header_id_func, $headerValue); |
826 | 826 | if (!$idValue) return ""; |
827 | 827 | |
828 | - return ' id="' . $this->encodeAttribute($idValue) . '"'; |
|
828 | + return ' id="'.$this->encodeAttribute($idValue).'"'; |
|
829 | 829 | |
830 | 830 | } |
831 | 831 | |
@@ -904,7 +904,7 @@ discard block |
||
904 | 904 | $list = $matches[1]; |
905 | 905 | $list_type = preg_match("/$marker_ul_re/", $matches[4]) ? "ul" : "ol"; |
906 | 906 | |
907 | - $marker_any_re = ( $list_type == "ul" ? $marker_ul_re : $marker_ol_re ); |
|
907 | + $marker_any_re = ($list_type == "ul" ? $marker_ul_re : $marker_ol_re); |
|
908 | 908 | |
909 | 909 | $list .= "\n"; |
910 | 910 | $result = $this->processListItems($list, $marker_any_re); |
@@ -915,18 +915,18 @@ discard block |
||
915 | 915 | if ($list_type == 'ol') { |
916 | 916 | $ol_start_array = array(); |
917 | 917 | $ol_start_check = preg_match("/$marker_ol_start_re/", $matches[4], $ol_start_array); |
918 | - if ($ol_start_check){ |
|
918 | + if ($ol_start_check) { |
|
919 | 919 | $ol_start = $ol_start_array[0]; |
920 | 920 | } |
921 | 921 | } |
922 | 922 | } |
923 | 923 | |
924 | - if ($ol_start > 1 && $list_type == 'ol'){ |
|
925 | - $result = $this->hashBlock("<$list_type start=\"$ol_start\">\n" . $result . "</$list_type>"); |
|
924 | + if ($ol_start > 1 && $list_type == 'ol') { |
|
925 | + $result = $this->hashBlock("<$list_type start=\"$ol_start\">\n".$result."</$list_type>"); |
|
926 | 926 | } else { |
927 | - $result = $this->hashBlock("<$list_type>\n" . $result . "</$list_type>"); |
|
927 | + $result = $this->hashBlock("<$list_type>\n".$result."</$list_type>"); |
|
928 | 928 | } |
929 | - return "\n". $result ."\n\n"; |
|
929 | + return "\n".$result."\n\n"; |
|
930 | 930 | } |
931 | 931 | |
932 | 932 | protected $list_level = 0; |
@@ -979,16 +979,16 @@ discard block |
||
979 | 979 | } |
980 | 980 | protected function _processListItems_callback($matches) { |
981 | 981 | $item = $matches[4]; |
982 | - $leading_line =& $matches[1]; |
|
983 | - $leading_space =& $matches[2]; |
|
982 | + $leading_line = & $matches[1]; |
|
983 | + $leading_space = & $matches[2]; |
|
984 | 984 | $marker_space = $matches[3]; |
985 | - $tailing_blank_line =& $matches[5]; |
|
985 | + $tailing_blank_line = & $matches[5]; |
|
986 | 986 | |
987 | 987 | if ($leading_line || $tailing_blank_line || |
988 | 988 | preg_match('/\n{2,}/', $item)) |
989 | 989 | { |
990 | 990 | # Replace marker with the appropriate whitespace indentation |
991 | - $item = $leading_space . str_repeat(' ', strlen($marker_space)) . $item; |
|
991 | + $item = $leading_space.str_repeat(' ', strlen($marker_space)).$item; |
|
992 | 992 | $item = $this->runBlockGamut($this->outdent($item)."\n"); |
993 | 993 | } |
994 | 994 | else { |
@@ -998,7 +998,7 @@ discard block |
||
998 | 998 | $item = $this->runSpanGamut($item); |
999 | 999 | } |
1000 | 1000 | |
1001 | - return "<li>" . $item . "</li>\n"; |
|
1001 | + return "<li>".$item."</li>\n"; |
|
1002 | 1002 | } |
1003 | 1003 | |
1004 | 1004 | |
@@ -1076,7 +1076,7 @@ discard block |
||
1076 | 1076 | $token_relist[] = $strong_re; |
1077 | 1077 | |
1078 | 1078 | # Construct master expression from list. |
1079 | - $token_re = '{('. implode('|', $token_relist) .')}'; |
|
1079 | + $token_re = '{('.implode('|', $token_relist).')}'; |
|
1080 | 1080 | $this->em_strong_prepared_relist["$em$strong"] = $token_re; |
1081 | 1081 | } |
1082 | 1082 | } |
@@ -1102,8 +1102,8 @@ discard block |
||
1102 | 1102 | # |
1103 | 1103 | $parts = preg_split($token_re, $text, 2, PREG_SPLIT_DELIM_CAPTURE); |
1104 | 1104 | $text_stack[0] .= $parts[0]; |
1105 | - $token =& $parts[1]; |
|
1106 | - $text =& $parts[2]; |
|
1105 | + $token = & $parts[1]; |
|
1106 | + $text = & $parts[2]; |
|
1107 | 1107 | |
1108 | 1108 | if (empty($token)) { |
1109 | 1109 | # Reached end of text span: empty stack without emitting. |
@@ -1130,7 +1130,7 @@ discard block |
||
1130 | 1130 | } else { |
1131 | 1131 | # Other closing marker: close one em or strong and |
1132 | 1132 | # change current token state to match the other |
1133 | - $token_stack[0] = str_repeat($token{0}, 3-$token_len); |
|
1133 | + $token_stack[0] = str_repeat($token{0}, 3 - $token_len); |
|
1134 | 1134 | $tag = $token_len == 2 ? "strong" : "em"; |
1135 | 1135 | $span = $text_stack[0]; |
1136 | 1136 | $span = $this->runSpanGamut($span); |
@@ -1224,7 +1224,7 @@ discard block |
||
1224 | 1224 | $bq = $matches[1]; |
1225 | 1225 | # trim one level of quoting - trim whitespace-only lines |
1226 | 1226 | $bq = preg_replace('/^[ ]*>[ ]?|^[ ]+$/m', '', $bq); |
1227 | - $bq = $this->runBlockGamut($bq); # recurse |
|
1227 | + $bq = $this->runBlockGamut($bq); # recurse |
|
1228 | 1228 | |
1229 | 1229 | $bq = preg_replace('/^/m', " ", $bq); |
1230 | 1230 | # These leading spaces cause problem with <pre> content, |
@@ -1232,7 +1232,7 @@ discard block |
||
1232 | 1232 | $bq = preg_replace_callback('{(\s*<pre>.+?</pre>)}sx', |
1233 | 1233 | array($this, '_doBlockQuotes_callback2'), $bq); |
1234 | 1234 | |
1235 | - return "\n". $this->hashBlock("<blockquote>\n$bq\n</blockquote>")."\n\n"; |
|
1235 | + return "\n".$this->hashBlock("<blockquote>\n$bq\n</blockquote>")."\n\n"; |
|
1236 | 1236 | } |
1237 | 1237 | protected function _doBlockQuotes_callback2($matches) { |
1238 | 1238 | $pre = $matches[1]; |
@@ -1432,7 +1432,7 @@ discard block |
||
1432 | 1432 | if ($text == "") return $tail = ""; |
1433 | 1433 | |
1434 | 1434 | $chars = preg_split('/(?<!^)(?!$)/', $text); |
1435 | - $seed = (int)abs(crc32($text) / strlen($text)); # Deterministic seed. |
|
1435 | + $seed = (int) abs(crc32($text) / strlen($text)); # Deterministic seed. |
|
1436 | 1436 | |
1437 | 1437 | foreach ($chars as $key => $char) { |
1438 | 1438 | $ord = ord($char); |
@@ -1468,7 +1468,7 @@ discard block |
||
1468 | 1468 | | |
1469 | 1469 | (?<![`\\\\]) |
1470 | 1470 | `+ # code span marker |
1471 | - '.( $this->no_markup ? '' : ' |
|
1471 | + '.($this->no_markup ? '' : ' |
|
1472 | 1472 | | |
1473 | 1473 | <!-- .*? --> # comment |
1474 | 1474 | | |
@@ -1522,7 +1522,7 @@ discard block |
||
1522 | 1522 | # |
1523 | 1523 | switch ($token{0}) { |
1524 | 1524 | case "\\": |
1525 | - return $this->hashPart("&#". ord($token{1}). ";"); |
|
1525 | + return $this->hashPart("&#".ord($token{1}).";"); |
|
1526 | 1526 | case "`": |
1527 | 1527 | # Search for end marker in remaining text. |
1528 | 1528 | if (preg_match('/^(.*?[^`])'.preg_quote($token).'(?!`)(.*)$/sm', |
@@ -1577,7 +1577,7 @@ discard block |
||
1577 | 1577 | # Calculate amount of space, insert spaces, insert block. |
1578 | 1578 | $amount = $this->tab_width - |
1579 | 1579 | $strlen($line, 'UTF-8') % $this->tab_width; |
1580 | - $line .= str_repeat(" ", $amount) . $block; |
|
1580 | + $line .= str_repeat(" ", $amount).$block; |
|
1581 | 1581 | } |
1582 | 1582 | return $line; |
1583 | 1583 | } |
@@ -38,8 +38,9 @@ discard block |
||
38 | 38 | $parser =& $parser_list[$parser_class]; |
39 | 39 | |
40 | 40 | # create the parser it not already set |
41 | - if (!$parser) |
|
42 | - $parser = new $parser_class; |
|
41 | + if (!$parser) { |
|
42 | + $parser = new $parser_class; |
|
43 | + } |
|
43 | 44 | |
44 | 45 | # Transform text using parser. |
45 | 46 | return $parser->transform($text); |
@@ -241,7 +242,9 @@ discard block |
||
241 | 242 | |
242 | 243 | |
243 | 244 | protected function hashHTMLBlocks($text) { |
244 | - if ($this->no_markup) return $text; |
|
245 | + if ($this->no_markup) { |
|
246 | + return $text; |
|
247 | + } |
|
245 | 248 | |
246 | 249 | $less_than_tab = $this->tab_width - 1; |
247 | 250 | |
@@ -529,7 +532,9 @@ discard block |
||
529 | 532 | # |
530 | 533 | # Turn Markdown link shortcuts into XHTML <a> tags. |
531 | 534 | # |
532 | - if ($this->in_anchor) return $text; |
|
535 | + if ($this->in_anchor) { |
|
536 | + return $text; |
|
537 | + } |
|
533 | 538 | $this->in_anchor = true; |
534 | 539 | |
535 | 540 | # |
@@ -623,8 +628,7 @@ discard block |
||
623 | 628 | $link_text = $this->runSpanGamut($link_text); |
624 | 629 | $result .= ">$link_text</a>"; |
625 | 630 | $result = $this->hashPart($result); |
626 | - } |
|
627 | - else { |
|
631 | + } else { |
|
628 | 632 | $result = $whole_match; |
629 | 633 | } |
630 | 634 | return $result; |
@@ -638,8 +642,9 @@ discard block |
||
638 | 642 | // if the URL was of the form <s p a c e s> it got caught by the HTML |
639 | 643 | // tag parser and hashed. Need to reverse the process before using the URL. |
640 | 644 | $unhashed = $this->unhash($url); |
641 | - if ($unhashed != $url) |
|
642 | - $url = preg_replace('/^<(.*)>$/', '\1', $unhashed); |
|
645 | + if ($unhashed != $url) { |
|
646 | + $url = preg_replace('/^<(.*)>$/', '\1', $unhashed); |
|
647 | + } |
|
643 | 648 | |
644 | 649 | $url = $this->encodeURLAttribute($url); |
645 | 650 | |
@@ -731,8 +736,7 @@ discard block |
||
731 | 736 | } |
732 | 737 | $result .= $this->empty_element_suffix; |
733 | 738 | $result = $this->hashPart($result); |
734 | - } |
|
735 | - else { |
|
739 | + } else { |
|
736 | 740 | # If there's no such link ID, leave intact: |
737 | 741 | $result = $whole_match; |
738 | 742 | } |
@@ -791,8 +795,9 @@ discard block |
||
791 | 795 | |
792 | 796 | protected function _doHeaders_callback_setext($matches) { |
793 | 797 | # Terrible hack to check we haven't found an empty list item. |
794 | - if ($matches[2] == '-' && preg_match('{^-(?: |$)}', $matches[1])) |
|
795 | - return $matches[0]; |
|
798 | + if ($matches[2] == '-' && preg_match('{^-(?: |$)}', $matches[1])) { |
|
799 | + return $matches[0]; |
|
800 | + } |
|
796 | 801 | |
797 | 802 | $level = $matches[2]{0} == '=' ? 1 : 2; |
798 | 803 | |
@@ -823,7 +828,9 @@ discard block |
||
823 | 828 | return ""; |
824 | 829 | } |
825 | 830 | $idValue = call_user_func($this->header_id_func, $headerValue); |
826 | - if (!$idValue) return ""; |
|
831 | + if (!$idValue) { |
|
832 | + return ""; |
|
833 | + } |
|
827 | 834 | |
828 | 835 | return ' id="' . $this->encodeAttribute($idValue) . '"'; |
829 | 836 | |
@@ -882,8 +889,7 @@ discard block |
||
882 | 889 | '.$whole_list_re.' |
883 | 890 | }mx', |
884 | 891 | array($this, '_doLists_callback'), $text); |
885 | - } |
|
886 | - else { |
|
892 | + } else { |
|
887 | 893 | $text = preg_replace_callback('{ |
888 | 894 | (?:(?<=\n)\n|\A\n?) # Must eat the newline |
889 | 895 | '.$whole_list_re.' |
@@ -990,8 +996,7 @@ discard block |
||
990 | 996 | # Replace marker with the appropriate whitespace indentation |
991 | 997 | $item = $leading_space . str_repeat(' ', strlen($marker_space)) . $item; |
992 | 998 | $item = $this->runBlockGamut($this->outdent($item)."\n"); |
993 | - } |
|
994 | - else { |
|
999 | + } else { |
|
995 | 1000 | # Recursion for sub-lists: |
996 | 1001 | $item = $this->doLists($this->outdent($item)); |
997 | 1002 | $item = preg_replace('/\n+$/', '', $item); |
@@ -1261,8 +1266,7 @@ discard block |
||
1261 | 1266 | $value = preg_replace('/^([ ]*)/', "<p>", $value); |
1262 | 1267 | $value .= "</p>"; |
1263 | 1268 | $grafs[$key] = $this->unhash($value); |
1264 | - } |
|
1265 | - else { |
|
1269 | + } else { |
|
1266 | 1270 | # Is a block. |
1267 | 1271 | # Modify elements of @grafs in-place... |
1268 | 1272 | $graf = $value; |
@@ -1329,17 +1333,17 @@ discard block |
||
1329 | 1333 | # representation for the URL (removing mailto: or tel:) storing it in $text. |
1330 | 1334 | # This function is *not* suitable for attributes enclosed in single quotes. |
1331 | 1335 | # |
1332 | - if ($this->url_filter_func) |
|
1333 | - $url = call_user_func($this->url_filter_func, $url); |
|
1336 | + if ($this->url_filter_func) { |
|
1337 | + $url = call_user_func($this->url_filter_func, $url); |
|
1338 | + } |
|
1334 | 1339 | |
1335 | - if (preg_match('{^mailto:}i', $url)) |
|
1336 | - $url = $this->encodeEntityObfuscatedAttribute($url, $text, 7); |
|
1337 | - else if (preg_match('{^tel:}i', $url)) |
|
1340 | + if (preg_match('{^mailto:}i', $url)) { |
|
1341 | + $url = $this->encodeEntityObfuscatedAttribute($url, $text, 7); |
|
1342 | + } else if (preg_match('{^tel:}i', $url)) |
|
1338 | 1343 | { |
1339 | 1344 | $url = $this->encodeAttribute($url); |
1340 | 1345 | $text = substr($url, 4); |
1341 | - } |
|
1342 | - else |
|
1346 | + } else |
|
1343 | 1347 | { |
1344 | 1348 | $url = $this->encodeAttribute($url); |
1345 | 1349 | $text = $url; |
@@ -1429,7 +1433,9 @@ discard block |
||
1429 | 1433 | # With some optimizations by Milian Wolff. Forced encoding of HTML |
1430 | 1434 | # attribute special characters by Allan Odgaard. |
1431 | 1435 | # |
1432 | - if ($text == "") return $tail = ""; |
|
1436 | + if ($text == "") { |
|
1437 | + return $tail = ""; |
|
1438 | + } |
|
1433 | 1439 | |
1434 | 1440 | $chars = preg_split('/(?<!^)(?!$)/', $text); |
1435 | 1441 | $seed = (int)abs(crc32($text) / strlen($text)); # Deterministic seed. |
@@ -1443,8 +1449,11 @@ discard block |
||
1443 | 1449 | # '@' *must* be encoded. I insist. |
1444 | 1450 | # '"' and '>' have to be encoded inside the attribute |
1445 | 1451 | if ($r > 90 && strpos('@"&>', $char) === false) /* do nothing */; |
1446 | - else if ($r < 45) $chars[$key] = '&#x'.dechex($ord).';'; |
|
1447 | - else $chars[$key] = '&#'.$ord.';'; |
|
1452 | + else if ($r < 45) { |
|
1453 | + $chars[$key] = '&#x'.dechex($ord).';'; |
|
1454 | + } else { |
|
1455 | + $chars[$key] = '&#'.$ord.';'; |
|
1456 | + } |
|
1448 | 1457 | } |
1449 | 1458 | } |
1450 | 1459 | |
@@ -1505,8 +1514,7 @@ discard block |
||
1505 | 1514 | if (isset($parts[1])) { |
1506 | 1515 | $output .= $this->handleSpanToken($parts[1], $parts[2]); |
1507 | 1516 | $str = $parts[2]; |
1508 | - } |
|
1509 | - else { |
|
1517 | + } else { |
|
1510 | 1518 | break; |
1511 | 1519 | } |
1512 | 1520 | } |
@@ -1588,7 +1596,9 @@ discard block |
||
1588 | 1596 | # function that will loosely count the number of UTF-8 characters with a |
1589 | 1597 | # regular expression. |
1590 | 1598 | # |
1591 | - if (function_exists($this->utf8_strlen)) return; |
|
1599 | + if (function_exists($this->utf8_strlen)) { |
|
1600 | + return; |
|
1601 | + } |
|
1592 | 1602 | $this->utf8_strlen = create_function('$text', 'return preg_match_all( |
1593 | 1603 | "/[\\\\x00-\\\\xBF]|[\\\\xC0-\\\\xFF][\\\\x80-\\\\xBF]*/", |
1594 | 1604 | $text, $m);'); |