@@ -205,6 +205,7 @@ |
||
| 205 | 205 | /** |
| 206 | 206 | * Adds a module to the current doctype by first registering it, |
| 207 | 207 | * and then tacking it on to the active doctype |
| 208 | + * @param HTMLPurifier_HTMLModule $module |
|
| 208 | 209 | */ |
| 209 | 210 | public function addModule($module) |
| 210 | 211 | { |
@@ -174,7 +174,7 @@ discard block |
||
| 174 | 174 | $original_module = $module; |
| 175 | 175 | $ok = false; |
| 176 | 176 | foreach ($this->prefixes as $prefix) { |
| 177 | - $module = $prefix . $original_module; |
|
| 177 | + $module = $prefix.$original_module; |
|
| 178 | 178 | if (class_exists($module)) { |
| 179 | 179 | $ok = true; |
| 180 | 180 | break; |
@@ -184,7 +184,7 @@ discard block |
||
| 184 | 184 | $module = $original_module; |
| 185 | 185 | if (!class_exists($module)) { |
| 186 | 186 | trigger_error( |
| 187 | - $original_module . ' module does not exist', |
|
| 187 | + $original_module.' module does not exist', |
|
| 188 | 188 | E_USER_ERROR |
| 189 | 189 | ); |
| 190 | 190 | return; |
@@ -193,11 +193,11 @@ discard block |
||
| 193 | 193 | $module = new $module(); |
| 194 | 194 | } |
| 195 | 195 | if (empty($module->name)) { |
| 196 | - trigger_error('Module instance of ' . get_class($module) . ' must have name'); |
|
| 196 | + trigger_error('Module instance of '.get_class($module).' must have name'); |
|
| 197 | 197 | return; |
| 198 | 198 | } |
| 199 | 199 | if (!$overload && isset($this->registeredModules[$module->name])) { |
| 200 | - trigger_error('Overloading ' . $module->name . ' without explicit overload parameter', E_USER_WARNING); |
|
| 200 | + trigger_error('Overloading '.$module->name.' without explicit overload parameter', E_USER_WARNING); |
|
| 201 | 201 | } |
| 202 | 202 | $this->registeredModules[$module->name] = $module; |
| 203 | 203 | } |
@@ -65,7 +65,7 @@ |
||
| 65 | 65 | * deleted a node, and now need to see if this change affected any |
| 66 | 66 | * earlier nodes. Rewinding does not affect other injectors, and can |
| 67 | 67 | * result in infinite loops if not used carefully. |
| 68 | - * @param bool|int $offset |
|
| 68 | + * @param integer $offset |
|
| 69 | 69 | * @warning HTML Purifier will prevent you from fast-forwarding with this |
| 70 | 70 | * function. |
| 71 | 71 | */ |
@@ -104,9 +104,9 @@ |
||
| 104 | 104 | if ($result !== false) { |
| 105 | 105 | return $result; |
| 106 | 106 | } |
| 107 | - $this->currentNesting =& $context->get('CurrentNesting'); |
|
| 108 | - $this->currentToken =& $context->get('CurrentToken'); |
|
| 109 | - $this->inputZipper =& $context->get('InputZipper'); |
|
| 107 | + $this->currentNesting = & $context->get('CurrentNesting'); |
|
| 108 | + $this->currentToken = & $context->get('CurrentToken'); |
|
| 109 | + $this->inputZipper = & $context->get('InputZipper'); |
|
| 110 | 110 | return false; |
| 111 | 111 | } |
| 112 | 112 | |
@@ -328,7 +328,7 @@ |
||
| 328 | 328 | * Determines if a particular token requires an earlier inline token |
| 329 | 329 | * to get a paragraph. This should be used with _forwardUntilEndToken |
| 330 | 330 | * @param HTMLPurifier_Token $current |
| 331 | - * @return bool |
|
| 331 | + * @return boolean|null |
|
| 332 | 332 | */ |
| 333 | 333 | private function _checkNeedsP($current) |
| 334 | 334 | { |
@@ -341,6 +341,7 @@ |
||
| 341 | 341 | /** |
| 342 | 342 | * Takes a string of HTML (fragment or document) and returns the content |
| 343 | 343 | * @todo Consider making protected |
| 344 | + * @param string $html |
|
| 344 | 345 | */ |
| 345 | 346 | public function extractBody($html) |
| 346 | 347 | { |
@@ -124,7 +124,7 @@ discard block |
||
| 124 | 124 | break; |
| 125 | 125 | default: |
| 126 | 126 | throw new HTMLPurifier_Exception( |
| 127 | - "Cannot instantiate unrecognized Lexer type " . |
|
| 127 | + "Cannot instantiate unrecognized Lexer type ". |
|
| 128 | 128 | htmlspecialchars($lexer) |
| 129 | 129 | ); |
| 130 | 130 | } |
@@ -138,7 +138,7 @@ discard block |
||
| 138 | 138 | // hack out something using XSLT, remove this stipulation |
| 139 | 139 | if ($needs_tracking && !$inst->tracksLineNumbers) { |
| 140 | 140 | throw new HTMLPurifier_Exception( |
| 141 | - 'Cannot use lexer that does not support line numbers with ' . |
|
| 141 | + 'Cannot use lexer that does not support line numbers with '. |
|
| 142 | 142 | 'Core.MaintainLineNumbers or Core.CollectErrors (use DirectLex instead)' |
| 143 | 143 | ); |
| 144 | 144 | } |
@@ -313,7 +313,7 @@ discard block |
||
| 313 | 313 | if ($config->get('Core.ConvertDocumentToFragment')) { |
| 314 | 314 | $e = false; |
| 315 | 315 | if ($config->get('Core.CollectErrors')) { |
| 316 | - $e =& $context->get('ErrorCollector'); |
|
| 316 | + $e = & $context->get('ErrorCollector'); |
|
| 317 | 317 | } |
| 318 | 318 | $new_html = $this->extractBody($html); |
| 319 | 319 | if ($e && $new_html != $html) { |
@@ -458,6 +458,9 @@ discard block |
||
| 458 | 458 | const CHARACTR = 4; |
| 459 | 459 | const EOF = 5; |
| 460 | 460 | |
| 461 | + /** |
|
| 462 | + * @param string $data |
|
| 463 | + */ |
|
| 461 | 464 | public function __construct($data) |
| 462 | 465 | { |
| 463 | 466 | $this->data = $data; |
@@ -478,6 +481,9 @@ discard block |
||
| 478 | 481 | return $this->tree->save(); |
| 479 | 482 | } |
| 480 | 483 | |
| 484 | + /** |
|
| 485 | + * @return string |
|
| 486 | + */ |
|
| 481 | 487 | private function char() |
| 482 | 488 | { |
| 483 | 489 | return ($this->char < $this->EOF) |
@@ -485,6 +491,11 @@ discard block |
||
| 485 | 491 | : false; |
| 486 | 492 | } |
| 487 | 493 | |
| 494 | + /** |
|
| 495 | + * @param integer $s |
|
| 496 | + * |
|
| 497 | + * @return string |
|
| 498 | + */ |
|
| 488 | 499 | private function character($s, $l = 0) |
| 489 | 500 | { |
| 490 | 501 | if ($s + $l < $this->EOF) { |
@@ -496,6 +507,10 @@ discard block |
||
| 496 | 507 | } |
| 497 | 508 | } |
| 498 | 509 | |
| 510 | + /** |
|
| 511 | + * @param string $char_class |
|
| 512 | + * @param integer $start |
|
| 513 | + */ |
|
| 499 | 514 | private function characters($char_class, $start) |
| 500 | 515 | { |
| 501 | 516 | return preg_replace('#^([' . $char_class . ']+).*#s', '\\1', substr($this->data, $start)); |
@@ -4645,6 +4660,9 @@ discard block |
||
| 4645 | 4660 | } |
| 4646 | 4661 | } |
| 4647 | 4662 | |
| 4663 | + /** |
|
| 4664 | + * @param string[] $elements |
|
| 4665 | + */ |
|
| 4648 | 4666 | private function clearStackToTableContext($elements) |
| 4649 | 4667 | { |
| 4650 | 4668 | /* When the steps above require the UA to clear the stack back to a |
@@ -469,7 +469,7 @@ discard block |
||
| 469 | 469 | $this->state = 'data'; |
| 470 | 470 | |
| 471 | 471 | while ($this->state !== null) { |
| 472 | - $this->{$this->state . 'State'}(); |
|
| 472 | + $this->{$this->state.'State'}(); |
|
| 473 | 473 | } |
| 474 | 474 | } |
| 475 | 475 | |
@@ -498,7 +498,7 @@ discard block |
||
| 498 | 498 | |
| 499 | 499 | private function characters($char_class, $start) |
| 500 | 500 | { |
| 501 | - return preg_replace('#^([' . $char_class . ']+).*#s', '\\1', substr($this->data, $start)); |
|
| 501 | + return preg_replace('#^(['.$char_class.']+).*#s', '\\1', substr($this->data, $start)); |
|
| 502 | 502 | } |
| 503 | 503 | |
| 504 | 504 | private function dataState() |
@@ -1289,7 +1289,7 @@ discard block |
||
| 1289 | 1289 | } else { |
| 1290 | 1290 | /* Append a U+002D HYPHEN-MINUS (-) character and the input |
| 1291 | 1291 | character to the comment token's data. Switch to the comment state. */ |
| 1292 | - $this->token['data'] .= '-' . $char; |
|
| 1292 | + $this->token['data'] .= '-'.$char; |
|
| 1293 | 1293 | $this->state = 'comment'; |
| 1294 | 1294 | } |
| 1295 | 1295 | } |
@@ -1313,7 +1313,7 @@ discard block |
||
| 1313 | 1313 | $this->state = 'data'; |
| 1314 | 1314 | |
| 1315 | 1315 | } else { |
| 1316 | - $this->token['data'] .= '--' . $char; |
|
| 1316 | + $this->token['data'] .= '--'.$char; |
|
| 1317 | 1317 | $this->state = 'comment'; |
| 1318 | 1318 | } |
| 1319 | 1319 | } |
@@ -1547,7 +1547,7 @@ discard block |
||
| 1547 | 1547 | |
| 1548 | 1548 | // Return a character token for the character corresponding to the |
| 1549 | 1549 | // entity name (as given by the second column of the entities table). |
| 1550 | - return html_entity_decode('&' . $entity . ';', ENT_QUOTES, 'UTF-8'); |
|
| 1550 | + return html_entity_decode('&'.$entity.';', ENT_QUOTES, 'UTF-8'); |
|
| 1551 | 1551 | } |
| 1552 | 1552 | |
| 1553 | 1553 | private function emitToken($token) |
@@ -2656,7 +2656,7 @@ discard block |
||
| 2656 | 2656 | |
| 2657 | 2657 | /* Act as if a stream of character tokens had been seen. */ |
| 2658 | 2658 | $this->insertText( |
| 2659 | - 'This is a searchable index. ' . |
|
| 2659 | + 'This is a searchable index. '. |
|
| 2660 | 2660 | 'Insert your search keywords here: ' |
| 2661 | 2661 | ); |
| 2662 | 2662 | |
@@ -2678,7 +2678,7 @@ discard block |
||
| 2678 | 2678 | /* Act as if a stream of character tokens had been seen |
| 2679 | 2679 | (see below for what they should say). */ |
| 2680 | 2680 | $this->insertText( |
| 2681 | - 'This is a searchable index. ' . |
|
| 2681 | + 'This is a searchable index. '. |
|
| 2682 | 2682 | 'Insert your search keywords here: ' |
| 2683 | 2683 | ); |
| 2684 | 2684 | |
@@ -108,7 +108,7 @@ |
||
| 108 | 108 | /** |
| 109 | 109 | * Prints a simple key/value row in a table. |
| 110 | 110 | * @param string $name Key |
| 111 | - * @param mixed $value Value |
|
| 111 | + * @param string $value Value |
|
| 112 | 112 | * @return string |
| 113 | 113 | */ |
| 114 | 114 | protected function row($name, $value) |
@@ -77,8 +77,8 @@ discard block |
||
| 77 | 77 | */ |
| 78 | 78 | protected function element($tag, $contents, $attr = array(), $escape = true) |
| 79 | 79 | { |
| 80 | - return $this->start($tag, $attr) . |
|
| 81 | - ($escape ? $this->escape($contents) : $contents) . |
|
| 80 | + return $this->start($tag, $attr). |
|
| 81 | + ($escape ? $this->escape($contents) : $contents). |
|
| 82 | 82 | $this->end($tag); |
| 83 | 83 | } |
| 84 | 84 | |
@@ -117,9 +117,9 @@ discard block |
||
| 117 | 117 | $value = $value ? 'On' : 'Off'; |
| 118 | 118 | } |
| 119 | 119 | return |
| 120 | - $this->start('tr') . "\n" . |
|
| 121 | - $this->element('th', $name) . "\n" . |
|
| 122 | - $this->element('td', $value) . "\n" . |
|
| 120 | + $this->start('tr')."\n". |
|
| 121 | + $this->element('th', $name)."\n". |
|
| 122 | + $this->element('td', $value)."\n". |
|
| 123 | 123 | $this->end('tr'); |
| 124 | 124 | } |
| 125 | 125 | |
@@ -173,7 +173,7 @@ discard block |
||
| 173 | 173 | if ($five === null) { |
| 174 | 174 | $five = version_compare(PHP_VERSION, '5', '>='); |
| 175 | 175 | } |
| 176 | - $prefix = 'HTMLPurifier_' . $sec_prefix; |
|
| 176 | + $prefix = 'HTMLPurifier_'.$sec_prefix; |
|
| 177 | 177 | if (!$five) { |
| 178 | 178 | $prefix = strtolower($prefix); |
| 179 | 179 | } |
@@ -196,11 +196,11 @@ discard block |
||
| 196 | 196 | $class .= implode(', ', $values); |
| 197 | 197 | break; |
| 198 | 198 | case 'css_multiple': |
| 199 | - $class .= $this->getClass($obj->single, $sec_prefix) . ', '; |
|
| 199 | + $class .= $this->getClass($obj->single, $sec_prefix).', '; |
|
| 200 | 200 | $class .= $obj->max; |
| 201 | 201 | break; |
| 202 | 202 | case 'css_denyelementdecorator': |
| 203 | - $class .= $this->getClass($obj->def, $sec_prefix) . ', '; |
|
| 203 | + $class .= $this->getClass($obj->def, $sec_prefix).', '; |
|
| 204 | 204 | $class .= $obj->element; |
| 205 | 205 | break; |
| 206 | 206 | case 'css_importantdecorator': |
@@ -53,8 +53,8 @@ discard block |
||
| 53 | 53 | |
| 54 | 54 | /** |
| 55 | 55 | * Sets default column and row size for textareas in sub-printers |
| 56 | - * @param $cols Integer columns of textarea, null to use default |
|
| 57 | - * @param $rows Integer rows of textarea, null to use default |
|
| 56 | + * @param integer $cols Integer columns of textarea, null to use default |
|
| 57 | + * @param integer $rows Integer rows of textarea, null to use default |
|
| 58 | 58 | */ |
| 59 | 59 | public function setTextareaDimensions($cols = null, $rows = null) |
| 60 | 60 | { |
@@ -84,7 +84,7 @@ discard block |
||
| 84 | 84 | |
| 85 | 85 | /** |
| 86 | 86 | * Returns HTML output for a configuration form |
| 87 | - * @param HTMLPurifier_Config|array $config Configuration object of current form state, or an array |
|
| 87 | + * @param HTMLPurifier_Config $config Configuration object of current form state, or an array |
|
| 88 | 88 | * where [0] has an HTML namespace and [1] is being rendered. |
| 89 | 89 | * @param array|bool $allowed Optional namespace(s) and directives to restrict form to. |
| 90 | 90 | * @param bool $render_controls |
@@ -71,7 +71,7 @@ discard block |
||
| 71 | 71 | */ |
| 72 | 72 | public static function getCSS() |
| 73 | 73 | { |
| 74 | - return file_get_contents(HTMLPURIFIER_PREFIX . '/HTMLPurifier/Printer/ConfigForm.css'); |
|
| 74 | + return file_get_contents(HTMLPURIFIER_PREFIX.'/HTMLPurifier/Printer/ConfigForm.css'); |
|
| 75 | 75 | } |
| 76 | 76 | |
| 77 | 77 | /** |
@@ -79,7 +79,7 @@ discard block |
||
| 79 | 79 | */ |
| 80 | 80 | public static function getJavaScript() |
| 81 | 81 | { |
| 82 | - return file_get_contents(HTMLPURIFIER_PREFIX . '/HTMLPurifier/Printer/ConfigForm.js'); |
|
| 82 | + return file_get_contents(HTMLPURIFIER_PREFIX.'/HTMLPurifier/Printer/ConfigForm.js'); |
|
| 83 | 83 | } |
| 84 | 84 | |
| 85 | 85 | /** |
@@ -107,7 +107,7 @@ discard block |
||
| 107 | 107 | $all = array(); |
| 108 | 108 | foreach ($allowed as $key) { |
| 109 | 109 | list($ns, $directive) = $key; |
| 110 | - $all[$ns][$directive] = $config->get($ns . '.' . $directive); |
|
| 110 | + $all[$ns][$directive] = $config->get($ns.'.'.$directive); |
|
| 111 | 111 | } |
| 112 | 112 | |
| 113 | 113 | $ret = ''; |
@@ -163,7 +163,7 @@ discard block |
||
| 163 | 163 | if (!$this->compress || (strlen($directive) < $this->compress)) { |
| 164 | 164 | $directive_disp = $directive; |
| 165 | 165 | } else { |
| 166 | - $directive_disp = substr($directive, 0, $this->compress - 2) . '...'; |
|
| 166 | + $directive_disp = substr($directive, 0, $this->compress - 2).'...'; |
|
| 167 | 167 | $attr['title'] = $directive; |
| 168 | 168 | } |
| 169 | 169 | |
@@ -251,14 +251,14 @@ discard block |
||
| 251 | 251 | 'type' => 'checkbox', |
| 252 | 252 | 'value' => '1', |
| 253 | 253 | 'class' => 'null-toggle', |
| 254 | - 'name' => "$name" . "[Null_$ns.$directive]", |
|
| 254 | + 'name' => "$name"."[Null_$ns.$directive]", |
|
| 255 | 255 | 'id' => "$name:Null_$ns.$directive", |
| 256 | 256 | 'onclick' => "toggleWriteability('$name:$ns.$directive',checked)" // INLINE JAVASCRIPT!!!! |
| 257 | 257 | ); |
| 258 | 258 | if ($this->obj instanceof HTMLPurifier_Printer_ConfigForm_bool) { |
| 259 | 259 | // modify inline javascript slightly |
| 260 | 260 | $attr['onclick'] = |
| 261 | - "toggleWriteability('$name:Yes_$ns.$directive',checked);" . |
|
| 261 | + "toggleWriteability('$name:Yes_$ns.$directive',checked);". |
|
| 262 | 262 | "toggleWriteability('$name:No_$ns.$directive',checked)"; |
| 263 | 263 | } |
| 264 | 264 | if ($value === null) { |
@@ -327,7 +327,7 @@ discard block |
||
| 327 | 327 | case HTMLPurifier_VarParser::HASH: |
| 328 | 328 | $nvalue = ''; |
| 329 | 329 | foreach ($value as $i => $v) { |
| 330 | - $nvalue .= "$i:$v" . PHP_EOL; |
|
| 330 | + $nvalue .= "$i:$v".PHP_EOL; |
|
| 331 | 331 | } |
| 332 | 332 | $value = $nvalue; |
| 333 | 333 | break; |
@@ -340,7 +340,7 @@ discard block |
||
| 340 | 340 | $value = serialize($value); |
| 341 | 341 | } |
| 342 | 342 | $attr = array( |
| 343 | - 'name' => "$name" . "[$ns.$directive]", |
|
| 343 | + 'name' => "$name"."[$ns.$directive]", |
|
| 344 | 344 | 'id' => "$name:$ns.$directive" |
| 345 | 345 | ); |
| 346 | 346 | if ($value === null) { |
@@ -407,7 +407,7 @@ discard block |
||
| 407 | 407 | |
| 408 | 408 | $attr = array( |
| 409 | 409 | 'type' => 'radio', |
| 410 | - 'name' => "$name" . "[$ns.$directive]", |
|
| 410 | + 'name' => "$name"."[$ns.$directive]", |
|
| 411 | 411 | 'id' => "$name:Yes_$ns.$directive", |
| 412 | 412 | 'value' => '1' |
| 413 | 413 | ); |
@@ -426,7 +426,7 @@ discard block |
||
| 426 | 426 | |
| 427 | 427 | $attr = array( |
| 428 | 428 | 'type' => 'radio', |
| 429 | - 'name' => "$name" . "[$ns.$directive]", |
|
| 429 | + 'name' => "$name"."[$ns.$directive]", |
|
| 430 | 430 | 'id' => "$name:No_$ns.$directive", |
| 431 | 431 | 'value' => '0' |
| 432 | 432 | ); |
@@ -528,9 +528,10 @@ discard block |
||
| 528 | 528 | * being the current one) will be deleted. |
| 529 | 529 | * |
| 530 | 530 | * @param HTMLPurifier_Token|array|int|bool $token Token substitution value |
| 531 | - * @param HTMLPurifier_Injector|int $injector Injector that performed the substitution; default is if |
|
| 531 | + * @param integer $injector Injector that performed the substitution; default is if |
|
| 532 | 532 | * this is not an injector related operation. |
| 533 | 533 | * @throws HTMLPurifier_Exception |
| 534 | + * @return HTMLPurifier_Token |
|
| 534 | 535 | */ |
| 535 | 536 | protected function processToken($token, $injector = -1) |
| 536 | 537 | { |
@@ -577,6 +578,7 @@ discard block |
||
| 577 | 578 | * Inserts a token before the current token. Cursor now points to |
| 578 | 579 | * this token. You must reprocess after this. |
| 579 | 580 | * @param HTMLPurifier_Token $token |
| 581 | + * @return HTMLPurifier_Token |
|
| 580 | 582 | */ |
| 581 | 583 | private function insertBefore($token) |
| 582 | 584 | { |
@@ -151,8 +151,8 @@ |
||
| 151 | 151 | |
| 152 | 152 | // isset is in loop because $tokens size changes during loop exec |
| 153 | 153 | for (;; |
| 154 | - // only increment if we don't need to reprocess |
|
| 155 | - $reprocess ? $reprocess = false : $token = $zipper->next($token)) { |
|
| 154 | + // only increment if we don't need to reprocess |
|
| 155 | + $reprocess ? $reprocess = false : $token = $zipper->next($token)) { |
|
| 156 | 156 | |
| 157 | 157 | // check for a rewind |
| 158 | 158 | if (is_int($i)) { |
@@ -82,10 +82,10 @@ |
||
| 82 | 82 | $stack = array(); |
| 83 | 83 | |
| 84 | 84 | // member variables |
| 85 | - $this->stack =& $stack; |
|
| 86 | - $this->tokens =& $tokens; |
|
| 87 | - $this->token =& $token; |
|
| 88 | - $this->zipper =& $zipper; |
|
| 85 | + $this->stack = & $stack; |
|
| 86 | + $this->tokens = & $tokens; |
|
| 87 | + $this->token = & $token; |
|
| 88 | + $this->zipper = & $zipper; |
|
| 89 | 89 | $this->config = $config; |
| 90 | 90 | $this->context = $context; |
| 91 | 91 | |
@@ -162,7 +162,9 @@ |
||
| 162 | 162 | $rewind_offset = $this->injectors[$i]->getRewindOffset(); |
| 163 | 163 | if (is_int($rewind_offset)) { |
| 164 | 164 | for ($j = 0; $j < $rewind_offset; $j++) { |
| 165 | - if (empty($zipper->front)) break; |
|
| 165 | + if (empty($zipper->front)) {
|
|
| 166 | + break; |
|
| 167 | + } |
|
| 166 | 168 | $token = $zipper->prev($token); |
| 167 | 169 | // indicate that other injectors should not process this token, |
| 168 | 170 | // but we need to reprocess it |
@@ -25,6 +25,9 @@ discard block |
||
| 25 | 25 | |
| 26 | 26 | ### Simple Function Interface ### |
| 27 | 27 | |
| 28 | + /** |
|
| 29 | + * @param string $text |
|
| 30 | + */ |
|
| 28 | 31 | public static function defaultTransform($text) { |
| 29 | 32 | # |
| 30 | 33 | # Initialize the parser and return the result of its transform method. |
@@ -931,6 +934,10 @@ discard block |
||
| 931 | 934 | |
| 932 | 935 | protected $list_level = 0; |
| 933 | 936 | |
| 937 | + /** |
|
| 938 | + * @param string $list_str |
|
| 939 | + * @param string $marker_any_re |
|
| 940 | + */ |
|
| 934 | 941 | protected function processListItems($list_str, $marker_any_re) { |
| 935 | 942 | # |
| 936 | 943 | # Process the contents of a single ordered or unordered list, splitting it |
@@ -1034,6 +1041,9 @@ discard block |
||
| 1034 | 1041 | } |
| 1035 | 1042 | |
| 1036 | 1043 | |
| 1044 | + /** |
|
| 1045 | + * @param string $code |
|
| 1046 | + */ |
|
| 1037 | 1047 | protected function makeCodeSpan($code) { |
| 1038 | 1048 | # |
| 1039 | 1049 | # Create a code span markup for $code. Called from handleSpanToken. |
@@ -1311,6 +1321,9 @@ discard block |
||
| 1311 | 1321 | } |
| 1312 | 1322 | |
| 1313 | 1323 | |
| 1324 | + /** |
|
| 1325 | + * @return string |
|
| 1326 | + */ |
|
| 1314 | 1327 | protected function encodeAttribute($text) { |
| 1315 | 1328 | # |
| 1316 | 1329 | # Encode text for a double-quoted HTML attribute. This function |
@@ -1551,6 +1564,9 @@ discard block |
||
| 1551 | 1564 | # hanlde UTF-8 if the default function does not exist. |
| 1552 | 1565 | protected $utf8_strlen = 'mb_strlen'; |
| 1553 | 1566 | |
| 1567 | + /** |
|
| 1568 | + * @param string $text |
|
| 1569 | + */ |
|
| 1554 | 1570 | protected function detab($text) { |
| 1555 | 1571 | # |
| 1556 | 1572 | # Replace tabs with the appropriate amount of space. |
@@ -19,193 +19,193 @@ discard block |
||
| 19 | 19 | |
| 20 | 20 | class Markdown implements MarkdownInterface { |
| 21 | 21 | |
| 22 | - ### Version ### |
|
| 22 | + ### Version ### |
|
| 23 | 23 | |
| 24 | - const MARKDOWNLIB_VERSION = "1.5.0"; |
|
| 24 | + const MARKDOWNLIB_VERSION = "1.5.0"; |
|
| 25 | 25 | |
| 26 | - ### Simple Function Interface ### |
|
| 26 | + ### Simple Function Interface ### |
|
| 27 | 27 | |
| 28 | - public static function defaultTransform($text) { |
|
| 29 | - # |
|
| 30 | - # Initialize the parser and return the result of its transform method. |
|
| 31 | - # This will work fine for derived classes too. |
|
| 32 | - # |
|
| 33 | - # Take parser class on which this function was called. |
|
| 34 | - $parser_class = \get_called_class(); |
|
| 28 | + public static function defaultTransform($text) { |
|
| 29 | + # |
|
| 30 | + # Initialize the parser and return the result of its transform method. |
|
| 31 | + # This will work fine for derived classes too. |
|
| 32 | + # |
|
| 33 | + # Take parser class on which this function was called. |
|
| 34 | + $parser_class = \get_called_class(); |
|
| 35 | 35 | |
| 36 | - # try to take parser from the static parser list |
|
| 37 | - static $parser_list; |
|
| 38 | - $parser =& $parser_list[$parser_class]; |
|
| 36 | + # try to take parser from the static parser list |
|
| 37 | + static $parser_list; |
|
| 38 | + $parser =& $parser_list[$parser_class]; |
|
| 39 | 39 | |
| 40 | - # create the parser it not already set |
|
| 41 | - if (!$parser) |
|
| 42 | - $parser = new $parser_class; |
|
| 40 | + # create the parser it not already set |
|
| 41 | + if (!$parser) |
|
| 42 | + $parser = new $parser_class; |
|
| 43 | 43 | |
| 44 | - # Transform text using parser. |
|
| 45 | - return $parser->transform($text); |
|
| 46 | - } |
|
| 44 | + # Transform text using parser. |
|
| 45 | + return $parser->transform($text); |
|
| 46 | + } |
|
| 47 | 47 | |
| 48 | - ### Configuration Variables ### |
|
| 48 | + ### Configuration Variables ### |
|
| 49 | 49 | |
| 50 | - # Change to ">" for HTML output. |
|
| 51 | - public $empty_element_suffix = " />"; |
|
| 52 | - public $tab_width = 4; |
|
| 50 | + # Change to ">" for HTML output. |
|
| 51 | + public $empty_element_suffix = " />"; |
|
| 52 | + public $tab_width = 4; |
|
| 53 | 53 | |
| 54 | - # Change to `true` to disallow markup or entities. |
|
| 55 | - public $no_markup = false; |
|
| 56 | - public $no_entities = false; |
|
| 54 | + # Change to `true` to disallow markup or entities. |
|
| 55 | + public $no_markup = false; |
|
| 56 | + public $no_entities = false; |
|
| 57 | 57 | |
| 58 | - # Predefined urls and titles for reference links and images. |
|
| 59 | - public $predef_urls = array(); |
|
| 60 | - public $predef_titles = array(); |
|
| 61 | - |
|
| 62 | - # Optional filter function for URLs |
|
| 63 | - public $url_filter_func = null; |
|
| 64 | - |
|
| 65 | - # Optional header id="" generation callback function. |
|
| 66 | - public $header_id_func = null; |
|
| 67 | - |
|
| 68 | - # Class attribute to toggle "enhanced ordered list" behaviour |
|
| 69 | - # setting this to true will allow ordered lists to start from the index |
|
| 70 | - # number that is defined first. For example: |
|
| 71 | - # 2. List item two |
|
| 72 | - # 3. List item three |
|
| 73 | - # |
|
| 74 | - # becomes |
|
| 75 | - # <ol start="2"> |
|
| 76 | - # <li>List item two</li> |
|
| 77 | - # <li>List item three</li> |
|
| 78 | - # </ol> |
|
| 79 | - public $enhanced_ordered_list = false; |
|
| 80 | - |
|
| 81 | - ### Parser Implementation ### |
|
| 82 | - |
|
| 83 | - # Regex to match balanced [brackets]. |
|
| 84 | - # Needed to insert a maximum bracked depth while converting to PHP. |
|
| 85 | - protected $nested_brackets_depth = 6; |
|
| 86 | - protected $nested_brackets_re; |
|
| 58 | + # Predefined urls and titles for reference links and images. |
|
| 59 | + public $predef_urls = array(); |
|
| 60 | + public $predef_titles = array(); |
|
| 61 | + |
|
| 62 | + # Optional filter function for URLs |
|
| 63 | + public $url_filter_func = null; |
|
| 64 | + |
|
| 65 | + # Optional header id="" generation callback function. |
|
| 66 | + public $header_id_func = null; |
|
| 67 | + |
|
| 68 | + # Class attribute to toggle "enhanced ordered list" behaviour |
|
| 69 | + # setting this to true will allow ordered lists to start from the index |
|
| 70 | + # number that is defined first. For example: |
|
| 71 | + # 2. List item two |
|
| 72 | + # 3. List item three |
|
| 73 | + # |
|
| 74 | + # becomes |
|
| 75 | + # <ol start="2"> |
|
| 76 | + # <li>List item two</li> |
|
| 77 | + # <li>List item three</li> |
|
| 78 | + # </ol> |
|
| 79 | + public $enhanced_ordered_list = false; |
|
| 80 | + |
|
| 81 | + ### Parser Implementation ### |
|
| 82 | + |
|
| 83 | + # Regex to match balanced [brackets]. |
|
| 84 | + # Needed to insert a maximum bracked depth while converting to PHP. |
|
| 85 | + protected $nested_brackets_depth = 6; |
|
| 86 | + protected $nested_brackets_re; |
|
| 87 | 87 | |
| 88 | - protected $nested_url_parenthesis_depth = 4; |
|
| 89 | - protected $nested_url_parenthesis_re; |
|
| 88 | + protected $nested_url_parenthesis_depth = 4; |
|
| 89 | + protected $nested_url_parenthesis_re; |
|
| 90 | 90 | |
| 91 | - # Table of hash values for escaped characters: |
|
| 92 | - protected $escape_chars = '\`*_{}[]()>#+-.!'; |
|
| 93 | - protected $escape_chars_re; |
|
| 91 | + # Table of hash values for escaped characters: |
|
| 92 | + protected $escape_chars = '\`*_{}[]()>#+-.!'; |
|
| 93 | + protected $escape_chars_re; |
|
| 94 | 94 | |
| 95 | 95 | |
| 96 | - public function __construct() { |
|
| 97 | - # |
|
| 98 | - # Constructor function. Initialize appropriate member variables. |
|
| 99 | - # |
|
| 100 | - $this->_initDetab(); |
|
| 101 | - $this->prepareItalicsAndBold(); |
|
| 96 | + public function __construct() { |
|
| 97 | + # |
|
| 98 | + # Constructor function. Initialize appropriate member variables. |
|
| 99 | + # |
|
| 100 | + $this->_initDetab(); |
|
| 101 | + $this->prepareItalicsAndBold(); |
|
| 102 | 102 | |
| 103 | - $this->nested_brackets_re = |
|
| 104 | - str_repeat('(?>[^\[\]]+|\[', $this->nested_brackets_depth). |
|
| 105 | - str_repeat('\])*', $this->nested_brackets_depth); |
|
| 103 | + $this->nested_brackets_re = |
|
| 104 | + str_repeat('(?>[^\[\]]+|\[', $this->nested_brackets_depth). |
|
| 105 | + str_repeat('\])*', $this->nested_brackets_depth); |
|
| 106 | 106 | |
| 107 | - $this->nested_url_parenthesis_re = |
|
| 108 | - str_repeat('(?>[^()\s]+|\(', $this->nested_url_parenthesis_depth). |
|
| 109 | - str_repeat('(?>\)))*', $this->nested_url_parenthesis_depth); |
|
| 107 | + $this->nested_url_parenthesis_re = |
|
| 108 | + str_repeat('(?>[^()\s]+|\(', $this->nested_url_parenthesis_depth). |
|
| 109 | + str_repeat('(?>\)))*', $this->nested_url_parenthesis_depth); |
|
| 110 | 110 | |
| 111 | - $this->escape_chars_re = '['.preg_quote($this->escape_chars).']'; |
|
| 111 | + $this->escape_chars_re = '['.preg_quote($this->escape_chars).']'; |
|
| 112 | 112 | |
| 113 | - # Sort document, block, and span gamut in ascendent priority order. |
|
| 114 | - asort($this->document_gamut); |
|
| 115 | - asort($this->block_gamut); |
|
| 116 | - asort($this->span_gamut); |
|
| 117 | - } |
|
| 113 | + # Sort document, block, and span gamut in ascendent priority order. |
|
| 114 | + asort($this->document_gamut); |
|
| 115 | + asort($this->block_gamut); |
|
| 116 | + asort($this->span_gamut); |
|
| 117 | + } |
|
| 118 | 118 | |
| 119 | 119 | |
| 120 | - # Internal hashes used during transformation. |
|
| 121 | - protected $urls = array(); |
|
| 122 | - protected $titles = array(); |
|
| 123 | - protected $html_hashes = array(); |
|
| 120 | + # Internal hashes used during transformation. |
|
| 121 | + protected $urls = array(); |
|
| 122 | + protected $titles = array(); |
|
| 123 | + protected $html_hashes = array(); |
|
| 124 | 124 | |
| 125 | - # Status flag to avoid invalid nesting. |
|
| 126 | - protected $in_anchor = false; |
|
| 125 | + # Status flag to avoid invalid nesting. |
|
| 126 | + protected $in_anchor = false; |
|
| 127 | 127 | |
| 128 | 128 | |
| 129 | - protected function setup() { |
|
| 130 | - # |
|
| 131 | - # Called before the transformation process starts to setup parser |
|
| 132 | - # states. |
|
| 133 | - # |
|
| 134 | - # Clear global hashes. |
|
| 135 | - $this->urls = $this->predef_urls; |
|
| 136 | - $this->titles = $this->predef_titles; |
|
| 137 | - $this->html_hashes = array(); |
|
| 129 | + protected function setup() { |
|
| 130 | + # |
|
| 131 | + # Called before the transformation process starts to setup parser |
|
| 132 | + # states. |
|
| 133 | + # |
|
| 134 | + # Clear global hashes. |
|
| 135 | + $this->urls = $this->predef_urls; |
|
| 136 | + $this->titles = $this->predef_titles; |
|
| 137 | + $this->html_hashes = array(); |
|
| 138 | 138 | |
| 139 | - $this->in_anchor = false; |
|
| 140 | - } |
|
| 139 | + $this->in_anchor = false; |
|
| 140 | + } |
|
| 141 | 141 | |
| 142 | - protected function teardown() { |
|
| 143 | - # |
|
| 144 | - # Called after the transformation process to clear any variable |
|
| 145 | - # which may be taking up memory unnecessarly. |
|
| 146 | - # |
|
| 147 | - $this->urls = array(); |
|
| 148 | - $this->titles = array(); |
|
| 149 | - $this->html_hashes = array(); |
|
| 150 | - } |
|
| 151 | - |
|
| 152 | - |
|
| 153 | - public function transform($text) { |
|
| 154 | - # |
|
| 155 | - # Main function. Performs some preprocessing on the input text |
|
| 156 | - # and pass it through the document gamut. |
|
| 157 | - # |
|
| 158 | - $this->setup(); |
|
| 142 | + protected function teardown() { |
|
| 143 | + # |
|
| 144 | + # Called after the transformation process to clear any variable |
|
| 145 | + # which may be taking up memory unnecessarly. |
|
| 146 | + # |
|
| 147 | + $this->urls = array(); |
|
| 148 | + $this->titles = array(); |
|
| 149 | + $this->html_hashes = array(); |
|
| 150 | + } |
|
| 151 | + |
|
| 152 | + |
|
| 153 | + public function transform($text) { |
|
| 154 | + # |
|
| 155 | + # Main function. Performs some preprocessing on the input text |
|
| 156 | + # and pass it through the document gamut. |
|
| 157 | + # |
|
| 158 | + $this->setup(); |
|
| 159 | 159 | |
| 160 | - # Remove UTF-8 BOM and marker character in input, if present. |
|
| 161 | - $text = preg_replace('{^\xEF\xBB\xBF|\x1A}', '', $text); |
|
| 160 | + # Remove UTF-8 BOM and marker character in input, if present. |
|
| 161 | + $text = preg_replace('{^\xEF\xBB\xBF|\x1A}', '', $text); |
|
| 162 | 162 | |
| 163 | - # Standardize line endings: |
|
| 164 | - # DOS to Unix and Mac to Unix |
|
| 165 | - $text = preg_replace('{\r\n?}', "\n", $text); |
|
| 163 | + # Standardize line endings: |
|
| 164 | + # DOS to Unix and Mac to Unix |
|
| 165 | + $text = preg_replace('{\r\n?}', "\n", $text); |
|
| 166 | 166 | |
| 167 | - # Make sure $text ends with a couple of newlines: |
|
| 168 | - $text .= "\n\n"; |
|
| 167 | + # Make sure $text ends with a couple of newlines: |
|
| 168 | + $text .= "\n\n"; |
|
| 169 | 169 | |
| 170 | - # Convert all tabs to spaces. |
|
| 171 | - $text = $this->detab($text); |
|
| 170 | + # Convert all tabs to spaces. |
|
| 171 | + $text = $this->detab($text); |
|
| 172 | 172 | |
| 173 | - # Turn block-level HTML blocks into hash entries |
|
| 174 | - $text = $this->hashHTMLBlocks($text); |
|
| 173 | + # Turn block-level HTML blocks into hash entries |
|
| 174 | + $text = $this->hashHTMLBlocks($text); |
|
| 175 | 175 | |
| 176 | - # Strip any lines consisting only of spaces and tabs. |
|
| 177 | - # This makes subsequent regexen easier to write, because we can |
|
| 178 | - # match consecutive blank lines with /\n+/ instead of something |
|
| 179 | - # contorted like /[ ]*\n+/ . |
|
| 180 | - $text = preg_replace('/^[ ]+$/m', '', $text); |
|
| 176 | + # Strip any lines consisting only of spaces and tabs. |
|
| 177 | + # This makes subsequent regexen easier to write, because we can |
|
| 178 | + # match consecutive blank lines with /\n+/ instead of something |
|
| 179 | + # contorted like /[ ]*\n+/ . |
|
| 180 | + $text = preg_replace('/^[ ]+$/m', '', $text); |
|
| 181 | 181 | |
| 182 | - # Run document gamut methods. |
|
| 183 | - foreach ($this->document_gamut as $method => $priority) { |
|
| 184 | - $text = $this->$method($text); |
|
| 185 | - } |
|
| 182 | + # Run document gamut methods. |
|
| 183 | + foreach ($this->document_gamut as $method => $priority) { |
|
| 184 | + $text = $this->$method($text); |
|
| 185 | + } |
|
| 186 | 186 | |
| 187 | - $this->teardown(); |
|
| 187 | + $this->teardown(); |
|
| 188 | 188 | |
| 189 | - return $text . "\n"; |
|
| 190 | - } |
|
| 189 | + return $text . "\n"; |
|
| 190 | + } |
|
| 191 | 191 | |
| 192 | - protected $document_gamut = array( |
|
| 193 | - # Strip link definitions, store in hashes. |
|
| 194 | - "stripLinkDefinitions" => 20, |
|
| 192 | + protected $document_gamut = array( |
|
| 193 | + # Strip link definitions, store in hashes. |
|
| 194 | + "stripLinkDefinitions" => 20, |
|
| 195 | 195 | |
| 196 | - "runBasicBlockGamut" => 30, |
|
| 197 | - ); |
|
| 196 | + "runBasicBlockGamut" => 30, |
|
| 197 | + ); |
|
| 198 | 198 | |
| 199 | 199 | |
| 200 | - protected function stripLinkDefinitions($text) { |
|
| 201 | - # |
|
| 202 | - # Strips link definitions from text, stores the URLs and titles in |
|
| 203 | - # hash references. |
|
| 204 | - # |
|
| 205 | - $less_than_tab = $this->tab_width - 1; |
|
| 200 | + protected function stripLinkDefinitions($text) { |
|
| 201 | + # |
|
| 202 | + # Strips link definitions from text, stores the URLs and titles in |
|
| 203 | + # hash references. |
|
| 204 | + # |
|
| 205 | + $less_than_tab = $this->tab_width - 1; |
|
| 206 | 206 | |
| 207 | - # Link defs are in the form: ^[id]: url "optional title" |
|
| 208 | - $text = preg_replace_callback('{ |
|
| 207 | + # Link defs are in the form: ^[id]: url "optional title" |
|
| 208 | + $text = preg_replace_callback('{ |
|
| 209 | 209 | ^[ ]{0,'.$less_than_tab.'}\[(.+)\][ ]?: # id = $1 |
| 210 | 210 | [ ]* |
| 211 | 211 | \n? # maybe *one* newline |
@@ -227,46 +227,46 @@ discard block |
||
| 227 | 227 | )? # title is optional |
| 228 | 228 | (?:\n+|\Z) |
| 229 | 229 | }xm', |
| 230 | - array($this, '_stripLinkDefinitions_callback'), |
|
| 231 | - $text); |
|
| 232 | - return $text; |
|
| 233 | - } |
|
| 234 | - protected function _stripLinkDefinitions_callback($matches) { |
|
| 235 | - $link_id = strtolower($matches[1]); |
|
| 236 | - $url = $matches[2] == '' ? $matches[3] : $matches[2]; |
|
| 237 | - $this->urls[$link_id] = $url; |
|
| 238 | - $this->titles[$link_id] =& $matches[4]; |
|
| 239 | - return ''; # String that will replace the block |
|
| 240 | - } |
|
| 241 | - |
|
| 242 | - |
|
| 243 | - protected function hashHTMLBlocks($text) { |
|
| 244 | - if ($this->no_markup) return $text; |
|
| 245 | - |
|
| 246 | - $less_than_tab = $this->tab_width - 1; |
|
| 247 | - |
|
| 248 | - # Hashify HTML blocks: |
|
| 249 | - # We only want to do this for block-level HTML tags, such as headers, |
|
| 250 | - # lists, and tables. That's because we still want to wrap <p>s around |
|
| 251 | - # "paragraphs" that are wrapped in non-block-level tags, such as anchors, |
|
| 252 | - # phrase emphasis, and spans. The list of tags we're looking for is |
|
| 253 | - # hard-coded: |
|
| 254 | - # |
|
| 255 | - # * List "a" is made of tags which can be both inline or block-level. |
|
| 256 | - # These will be treated block-level when the start tag is alone on |
|
| 257 | - # its line, otherwise they're not matched here and will be taken as |
|
| 258 | - # inline later. |
|
| 259 | - # * List "b" is made of tags which are always block-level; |
|
| 260 | - # |
|
| 261 | - $block_tags_a_re = 'ins|del'; |
|
| 262 | - $block_tags_b_re = 'p|div|h[1-6]|blockquote|pre|table|dl|ol|ul|address|'. |
|
| 263 | - 'script|noscript|style|form|fieldset|iframe|math|svg|'. |
|
| 264 | - 'article|section|nav|aside|hgroup|header|footer|'. |
|
| 265 | - 'figure'; |
|
| 266 | - |
|
| 267 | - # Regular expression for the content of a block tag. |
|
| 268 | - $nested_tags_level = 4; |
|
| 269 | - $attr = ' |
|
| 230 | + array($this, '_stripLinkDefinitions_callback'), |
|
| 231 | + $text); |
|
| 232 | + return $text; |
|
| 233 | + } |
|
| 234 | + protected function _stripLinkDefinitions_callback($matches) { |
|
| 235 | + $link_id = strtolower($matches[1]); |
|
| 236 | + $url = $matches[2] == '' ? $matches[3] : $matches[2]; |
|
| 237 | + $this->urls[$link_id] = $url; |
|
| 238 | + $this->titles[$link_id] =& $matches[4]; |
|
| 239 | + return ''; # String that will replace the block |
|
| 240 | + } |
|
| 241 | + |
|
| 242 | + |
|
| 243 | + protected function hashHTMLBlocks($text) { |
|
| 244 | + if ($this->no_markup) return $text; |
|
| 245 | + |
|
| 246 | + $less_than_tab = $this->tab_width - 1; |
|
| 247 | + |
|
| 248 | + # Hashify HTML blocks: |
|
| 249 | + # We only want to do this for block-level HTML tags, such as headers, |
|
| 250 | + # lists, and tables. That's because we still want to wrap <p>s around |
|
| 251 | + # "paragraphs" that are wrapped in non-block-level tags, such as anchors, |
|
| 252 | + # phrase emphasis, and spans. The list of tags we're looking for is |
|
| 253 | + # hard-coded: |
|
| 254 | + # |
|
| 255 | + # * List "a" is made of tags which can be both inline or block-level. |
|
| 256 | + # These will be treated block-level when the start tag is alone on |
|
| 257 | + # its line, otherwise they're not matched here and will be taken as |
|
| 258 | + # inline later. |
|
| 259 | + # * List "b" is made of tags which are always block-level; |
|
| 260 | + # |
|
| 261 | + $block_tags_a_re = 'ins|del'; |
|
| 262 | + $block_tags_b_re = 'p|div|h[1-6]|blockquote|pre|table|dl|ol|ul|address|'. |
|
| 263 | + 'script|noscript|style|form|fieldset|iframe|math|svg|'. |
|
| 264 | + 'article|section|nav|aside|hgroup|header|footer|'. |
|
| 265 | + 'figure'; |
|
| 266 | + |
|
| 267 | + # Regular expression for the content of a block tag. |
|
| 268 | + $nested_tags_level = 4; |
|
| 269 | + $attr = ' |
|
| 270 | 270 | (?> # optional tag attributes |
| 271 | 271 | \s # starts with whitespace |
| 272 | 272 | (?> |
@@ -280,8 +280,8 @@ discard block |
||
| 280 | 280 | )* |
| 281 | 281 | )? |
| 282 | 282 | '; |
| 283 | - $content = |
|
| 284 | - str_repeat(' |
|
| 283 | + $content = |
|
| 284 | + str_repeat(' |
|
| 285 | 285 | (?> |
| 286 | 286 | [^<]+ # content without tag |
| 287 | 287 | | |
@@ -291,29 +291,29 @@ discard block |
||
| 291 | 291 | /> |
| 292 | 292 | | |
| 293 | 293 | >', $nested_tags_level). # end of opening tag |
| 294 | - '.*?'. # last level nested tag content |
|
| 295 | - str_repeat(' |
|
| 294 | + '.*?'. # last level nested tag content |
|
| 295 | + str_repeat(' |
|
| 296 | 296 | </\2\s*> # closing nested tag |
| 297 | 297 | ) |
| 298 | 298 | | |
| 299 | 299 | <(?!/\2\s*> # other tags with a different name |
| 300 | 300 | ) |
| 301 | 301 | )*', |
| 302 | - $nested_tags_level); |
|
| 303 | - $content2 = str_replace('\2', '\3', $content); |
|
| 304 | - |
|
| 305 | - # First, look for nested blocks, e.g.: |
|
| 306 | - # <div> |
|
| 307 | - # <div> |
|
| 308 | - # tags for inner block must be indented. |
|
| 309 | - # </div> |
|
| 310 | - # </div> |
|
| 311 | - # |
|
| 312 | - # The outermost tags must start at the left margin for this to match, and |
|
| 313 | - # the inner nested divs must be indented. |
|
| 314 | - # We need to do this before the next, more liberal match, because the next |
|
| 315 | - # match will start at the first `<div>` and stop at the first `</div>`. |
|
| 316 | - $text = preg_replace_callback('{(?> |
|
| 302 | + $nested_tags_level); |
|
| 303 | + $content2 = str_replace('\2', '\3', $content); |
|
| 304 | + |
|
| 305 | + # First, look for nested blocks, e.g.: |
|
| 306 | + # <div> |
|
| 307 | + # <div> |
|
| 308 | + # tags for inner block must be indented. |
|
| 309 | + # </div> |
|
| 310 | + # </div> |
|
| 311 | + # |
|
| 312 | + # The outermost tags must start at the left margin for this to match, and |
|
| 313 | + # the inner nested divs must be indented. |
|
| 314 | + # We need to do this before the next, more liberal match, because the next |
|
| 315 | + # match will start at the first `<div>` and stop at the first `</div>`. |
|
| 316 | + $text = preg_replace_callback('{(?> |
|
| 317 | 317 | (?> |
| 318 | 318 | (?<=\n) # Starting on its own line |
| 319 | 319 | | # or |
@@ -374,97 +374,97 @@ discard block |
||
| 374 | 374 | |
| 375 | 375 | ) |
| 376 | 376 | )}Sxmi', |
| 377 | - array($this, '_hashHTMLBlocks_callback'), |
|
| 378 | - $text); |
|
| 379 | - |
|
| 380 | - return $text; |
|
| 381 | - } |
|
| 382 | - protected function _hashHTMLBlocks_callback($matches) { |
|
| 383 | - $text = $matches[1]; |
|
| 384 | - $key = $this->hashBlock($text); |
|
| 385 | - return "\n\n$key\n\n"; |
|
| 386 | - } |
|
| 377 | + array($this, '_hashHTMLBlocks_callback'), |
|
| 378 | + $text); |
|
| 379 | + |
|
| 380 | + return $text; |
|
| 381 | + } |
|
| 382 | + protected function _hashHTMLBlocks_callback($matches) { |
|
| 383 | + $text = $matches[1]; |
|
| 384 | + $key = $this->hashBlock($text); |
|
| 385 | + return "\n\n$key\n\n"; |
|
| 386 | + } |
|
| 387 | 387 | |
| 388 | 388 | |
| 389 | - protected function hashPart($text, $boundary = 'X') { |
|
| 390 | - # |
|
| 391 | - # Called whenever a tag must be hashed when a function insert an atomic |
|
| 392 | - # element in the text stream. Passing $text to through this function gives |
|
| 393 | - # a unique text-token which will be reverted back when calling unhash. |
|
| 394 | - # |
|
| 395 | - # The $boundary argument specify what character should be used to surround |
|
| 396 | - # the token. By convension, "B" is used for block elements that needs not |
|
| 397 | - # to be wrapped into paragraph tags at the end, ":" is used for elements |
|
| 398 | - # that are word separators and "X" is used in the general case. |
|
| 399 | - # |
|
| 400 | - # Swap back any tag hash found in $text so we do not have to `unhash` |
|
| 401 | - # multiple times at the end. |
|
| 402 | - $text = $this->unhash($text); |
|
| 389 | + protected function hashPart($text, $boundary = 'X') { |
|
| 390 | + # |
|
| 391 | + # Called whenever a tag must be hashed when a function insert an atomic |
|
| 392 | + # element in the text stream. Passing $text to through this function gives |
|
| 393 | + # a unique text-token which will be reverted back when calling unhash. |
|
| 394 | + # |
|
| 395 | + # The $boundary argument specify what character should be used to surround |
|
| 396 | + # the token. By convension, "B" is used for block elements that needs not |
|
| 397 | + # to be wrapped into paragraph tags at the end, ":" is used for elements |
|
| 398 | + # that are word separators and "X" is used in the general case. |
|
| 399 | + # |
|
| 400 | + # Swap back any tag hash found in $text so we do not have to `unhash` |
|
| 401 | + # multiple times at the end. |
|
| 402 | + $text = $this->unhash($text); |
|
| 403 | 403 | |
| 404 | - # Then hash the block. |
|
| 405 | - static $i = 0; |
|
| 406 | - $key = "$boundary\x1A" . ++$i . $boundary; |
|
| 407 | - $this->html_hashes[$key] = $text; |
|
| 408 | - return $key; # String that will replace the tag. |
|
| 409 | - } |
|
| 410 | - |
|
| 411 | - |
|
| 412 | - protected function hashBlock($text) { |
|
| 413 | - # |
|
| 414 | - # Shortcut function for hashPart with block-level boundaries. |
|
| 415 | - # |
|
| 416 | - return $this->hashPart($text, 'B'); |
|
| 417 | - } |
|
| 418 | - |
|
| 419 | - |
|
| 420 | - protected $block_gamut = array( |
|
| 421 | - # |
|
| 422 | - # These are all the transformations that form block-level |
|
| 423 | - # tags like paragraphs, headers, and list items. |
|
| 424 | - # |
|
| 425 | - "doHeaders" => 10, |
|
| 426 | - "doHorizontalRules" => 20, |
|
| 404 | + # Then hash the block. |
|
| 405 | + static $i = 0; |
|
| 406 | + $key = "$boundary\x1A" . ++$i . $boundary; |
|
| 407 | + $this->html_hashes[$key] = $text; |
|
| 408 | + return $key; # String that will replace the tag. |
|
| 409 | + } |
|
| 410 | + |
|
| 411 | + |
|
| 412 | + protected function hashBlock($text) { |
|
| 413 | + # |
|
| 414 | + # Shortcut function for hashPart with block-level boundaries. |
|
| 415 | + # |
|
| 416 | + return $this->hashPart($text, 'B'); |
|
| 417 | + } |
|
| 418 | + |
|
| 419 | + |
|
| 420 | + protected $block_gamut = array( |
|
| 421 | + # |
|
| 422 | + # These are all the transformations that form block-level |
|
| 423 | + # tags like paragraphs, headers, and list items. |
|
| 424 | + # |
|
| 425 | + "doHeaders" => 10, |
|
| 426 | + "doHorizontalRules" => 20, |
|
| 427 | 427 | |
| 428 | - "doLists" => 40, |
|
| 429 | - "doCodeBlocks" => 50, |
|
| 430 | - "doBlockQuotes" => 60, |
|
| 431 | - ); |
|
| 432 | - |
|
| 433 | - protected function runBlockGamut($text) { |
|
| 434 | - # |
|
| 435 | - # Run block gamut tranformations. |
|
| 436 | - # |
|
| 437 | - # We need to escape raw HTML in Markdown source before doing anything |
|
| 438 | - # else. This need to be done for each block, and not only at the |
|
| 439 | - # begining in the Markdown function since hashed blocks can be part of |
|
| 440 | - # list items and could have been indented. Indented blocks would have |
|
| 441 | - # been seen as a code block in a previous pass of hashHTMLBlocks. |
|
| 442 | - $text = $this->hashHTMLBlocks($text); |
|
| 428 | + "doLists" => 40, |
|
| 429 | + "doCodeBlocks" => 50, |
|
| 430 | + "doBlockQuotes" => 60, |
|
| 431 | + ); |
|
| 432 | + |
|
| 433 | + protected function runBlockGamut($text) { |
|
| 434 | + # |
|
| 435 | + # Run block gamut tranformations. |
|
| 436 | + # |
|
| 437 | + # We need to escape raw HTML in Markdown source before doing anything |
|
| 438 | + # else. This need to be done for each block, and not only at the |
|
| 439 | + # begining in the Markdown function since hashed blocks can be part of |
|
| 440 | + # list items and could have been indented. Indented blocks would have |
|
| 441 | + # been seen as a code block in a previous pass of hashHTMLBlocks. |
|
| 442 | + $text = $this->hashHTMLBlocks($text); |
|
| 443 | 443 | |
| 444 | - return $this->runBasicBlockGamut($text); |
|
| 445 | - } |
|
| 444 | + return $this->runBasicBlockGamut($text); |
|
| 445 | + } |
|
| 446 | 446 | |
| 447 | - protected function runBasicBlockGamut($text) { |
|
| 448 | - # |
|
| 449 | - # Run block gamut tranformations, without hashing HTML blocks. This is |
|
| 450 | - # useful when HTML blocks are known to be already hashed, like in the first |
|
| 451 | - # whole-document pass. |
|
| 452 | - # |
|
| 453 | - foreach ($this->block_gamut as $method => $priority) { |
|
| 454 | - $text = $this->$method($text); |
|
| 455 | - } |
|
| 447 | + protected function runBasicBlockGamut($text) { |
|
| 448 | + # |
|
| 449 | + # Run block gamut tranformations, without hashing HTML blocks. This is |
|
| 450 | + # useful when HTML blocks are known to be already hashed, like in the first |
|
| 451 | + # whole-document pass. |
|
| 452 | + # |
|
| 453 | + foreach ($this->block_gamut as $method => $priority) { |
|
| 454 | + $text = $this->$method($text); |
|
| 455 | + } |
|
| 456 | 456 | |
| 457 | - # Finally form paragraph and restore hashed blocks. |
|
| 458 | - $text = $this->formParagraphs($text); |
|
| 457 | + # Finally form paragraph and restore hashed blocks. |
|
| 458 | + $text = $this->formParagraphs($text); |
|
| 459 | 459 | |
| 460 | - return $text; |
|
| 461 | - } |
|
| 460 | + return $text; |
|
| 461 | + } |
|
| 462 | 462 | |
| 463 | 463 | |
| 464 | - protected function doHorizontalRules($text) { |
|
| 465 | - # Do Horizontal Rules: |
|
| 466 | - return preg_replace( |
|
| 467 | - '{ |
|
| 464 | + protected function doHorizontalRules($text) { |
|
| 465 | + # Do Horizontal Rules: |
|
| 466 | + return preg_replace( |
|
| 467 | + '{ |
|
| 468 | 468 | ^[ ]{0,3} # Leading space |
| 469 | 469 | ([-*_]) # $1: First marker |
| 470 | 470 | (?> # Repeated marker group |
@@ -474,68 +474,68 @@ discard block |
||
| 474 | 474 | [ ]* # Tailing spaces |
| 475 | 475 | $ # End of line. |
| 476 | 476 | }mx', |
| 477 | - "\n".$this->hashBlock("<hr$this->empty_element_suffix")."\n", |
|
| 478 | - $text); |
|
| 479 | - } |
|
| 480 | - |
|
| 481 | - |
|
| 482 | - protected $span_gamut = array( |
|
| 483 | - # |
|
| 484 | - # These are all the transformations that occur *within* block-level |
|
| 485 | - # tags like paragraphs, headers, and list items. |
|
| 486 | - # |
|
| 487 | - # Process character escapes, code spans, and inline HTML |
|
| 488 | - # in one shot. |
|
| 489 | - "parseSpan" => -30, |
|
| 490 | - |
|
| 491 | - # Process anchor and image tags. Images must come first, |
|
| 492 | - # because ![foo][f] looks like an anchor. |
|
| 493 | - "doImages" => 10, |
|
| 494 | - "doAnchors" => 20, |
|
| 477 | + "\n".$this->hashBlock("<hr$this->empty_element_suffix")."\n", |
|
| 478 | + $text); |
|
| 479 | + } |
|
| 480 | + |
|
| 481 | + |
|
| 482 | + protected $span_gamut = array( |
|
| 483 | + # |
|
| 484 | + # These are all the transformations that occur *within* block-level |
|
| 485 | + # tags like paragraphs, headers, and list items. |
|
| 486 | + # |
|
| 487 | + # Process character escapes, code spans, and inline HTML |
|
| 488 | + # in one shot. |
|
| 489 | + "parseSpan" => -30, |
|
| 490 | + |
|
| 491 | + # Process anchor and image tags. Images must come first, |
|
| 492 | + # because ![foo][f] looks like an anchor. |
|
| 493 | + "doImages" => 10, |
|
| 494 | + "doAnchors" => 20, |
|
| 495 | 495 | |
| 496 | - # Make links out of things like `<http://example.com/>` |
|
| 497 | - # Must come after doAnchors, because you can use < and > |
|
| 498 | - # delimiters in inline links like [this](<url>). |
|
| 499 | - "doAutoLinks" => 30, |
|
| 500 | - "encodeAmpsAndAngles" => 40, |
|
| 501 | - |
|
| 502 | - "doItalicsAndBold" => 50, |
|
| 503 | - "doHardBreaks" => 60, |
|
| 504 | - ); |
|
| 505 | - |
|
| 506 | - protected function runSpanGamut($text) { |
|
| 507 | - # |
|
| 508 | - # Run span gamut tranformations. |
|
| 509 | - # |
|
| 510 | - foreach ($this->span_gamut as $method => $priority) { |
|
| 511 | - $text = $this->$method($text); |
|
| 512 | - } |
|
| 513 | - |
|
| 514 | - return $text; |
|
| 515 | - } |
|
| 496 | + # Make links out of things like `<http://example.com/>` |
|
| 497 | + # Must come after doAnchors, because you can use < and > |
|
| 498 | + # delimiters in inline links like [this](<url>). |
|
| 499 | + "doAutoLinks" => 30, |
|
| 500 | + "encodeAmpsAndAngles" => 40, |
|
| 501 | + |
|
| 502 | + "doItalicsAndBold" => 50, |
|
| 503 | + "doHardBreaks" => 60, |
|
| 504 | + ); |
|
| 505 | + |
|
| 506 | + protected function runSpanGamut($text) { |
|
| 507 | + # |
|
| 508 | + # Run span gamut tranformations. |
|
| 509 | + # |
|
| 510 | + foreach ($this->span_gamut as $method => $priority) { |
|
| 511 | + $text = $this->$method($text); |
|
| 512 | + } |
|
| 513 | + |
|
| 514 | + return $text; |
|
| 515 | + } |
|
| 516 | 516 | |
| 517 | 517 | |
| 518 | - protected function doHardBreaks($text) { |
|
| 519 | - # Do hard breaks: |
|
| 520 | - return preg_replace_callback('/ {2,}\n/', |
|
| 521 | - array($this, '_doHardBreaks_callback'), $text); |
|
| 522 | - } |
|
| 523 | - protected function _doHardBreaks_callback($matches) { |
|
| 524 | - return $this->hashPart("<br$this->empty_element_suffix\n"); |
|
| 525 | - } |
|
| 526 | - |
|
| 527 | - |
|
| 528 | - protected function doAnchors($text) { |
|
| 529 | - # |
|
| 530 | - # Turn Markdown link shortcuts into XHTML <a> tags. |
|
| 531 | - # |
|
| 532 | - if ($this->in_anchor) return $text; |
|
| 533 | - $this->in_anchor = true; |
|
| 518 | + protected function doHardBreaks($text) { |
|
| 519 | + # Do hard breaks: |
|
| 520 | + return preg_replace_callback('/ {2,}\n/', |
|
| 521 | + array($this, '_doHardBreaks_callback'), $text); |
|
| 522 | + } |
|
| 523 | + protected function _doHardBreaks_callback($matches) { |
|
| 524 | + return $this->hashPart("<br$this->empty_element_suffix\n"); |
|
| 525 | + } |
|
| 526 | + |
|
| 527 | + |
|
| 528 | + protected function doAnchors($text) { |
|
| 529 | + # |
|
| 530 | + # Turn Markdown link shortcuts into XHTML <a> tags. |
|
| 531 | + # |
|
| 532 | + if ($this->in_anchor) return $text; |
|
| 533 | + $this->in_anchor = true; |
|
| 534 | 534 | |
| 535 | - # |
|
| 536 | - # First, handle reference-style links: [link text] [id] |
|
| 537 | - # |
|
| 538 | - $text = preg_replace_callback('{ |
|
| 535 | + # |
|
| 536 | + # First, handle reference-style links: [link text] [id] |
|
| 537 | + # |
|
| 538 | + $text = preg_replace_callback('{ |
|
| 539 | 539 | ( # wrap whole match in $1 |
| 540 | 540 | \[ |
| 541 | 541 | ('.$this->nested_brackets_re.') # link text = $2 |
@@ -549,12 +549,12 @@ discard block |
||
| 549 | 549 | \] |
| 550 | 550 | ) |
| 551 | 551 | }xs', |
| 552 | - array($this, '_doAnchors_reference_callback'), $text); |
|
| 552 | + array($this, '_doAnchors_reference_callback'), $text); |
|
| 553 | 553 | |
| 554 | - # |
|
| 555 | - # Next, inline-style links: [link text](url "optional title") |
|
| 556 | - # |
|
| 557 | - $text = preg_replace_callback('{ |
|
| 554 | + # |
|
| 555 | + # Next, inline-style links: [link text](url "optional title") |
|
| 556 | + # |
|
| 557 | + $text = preg_replace_callback('{ |
|
| 558 | 558 | ( # wrap whole match in $1 |
| 559 | 559 | \[ |
| 560 | 560 | ('.$this->nested_brackets_re.') # link text = $2 |
@@ -576,94 +576,94 @@ discard block |
||
| 576 | 576 | \) |
| 577 | 577 | ) |
| 578 | 578 | }xs', |
| 579 | - array($this, '_doAnchors_inline_callback'), $text); |
|
| 580 | - |
|
| 581 | - # |
|
| 582 | - # Last, handle reference-style shortcuts: [link text] |
|
| 583 | - # These must come last in case you've also got [link text][1] |
|
| 584 | - # or [link text](/foo) |
|
| 585 | - # |
|
| 586 | - $text = preg_replace_callback('{ |
|
| 579 | + array($this, '_doAnchors_inline_callback'), $text); |
|
| 580 | + |
|
| 581 | + # |
|
| 582 | + # Last, handle reference-style shortcuts: [link text] |
|
| 583 | + # These must come last in case you've also got [link text][1] |
|
| 584 | + # or [link text](/foo) |
|
| 585 | + # |
|
| 586 | + $text = preg_replace_callback('{ |
|
| 587 | 587 | ( # wrap whole match in $1 |
| 588 | 588 | \[ |
| 589 | 589 | ([^\[\]]+) # link text = $2; can\'t contain [ or ] |
| 590 | 590 | \] |
| 591 | 591 | ) |
| 592 | 592 | }xs', |
| 593 | - array($this, '_doAnchors_reference_callback'), $text); |
|
| 594 | - |
|
| 595 | - $this->in_anchor = false; |
|
| 596 | - return $text; |
|
| 597 | - } |
|
| 598 | - protected function _doAnchors_reference_callback($matches) { |
|
| 599 | - $whole_match = $matches[1]; |
|
| 600 | - $link_text = $matches[2]; |
|
| 601 | - $link_id =& $matches[3]; |
|
| 602 | - |
|
| 603 | - if ($link_id == "") { |
|
| 604 | - # for shortcut links like [this][] or [this]. |
|
| 605 | - $link_id = $link_text; |
|
| 606 | - } |
|
| 593 | + array($this, '_doAnchors_reference_callback'), $text); |
|
| 594 | + |
|
| 595 | + $this->in_anchor = false; |
|
| 596 | + return $text; |
|
| 597 | + } |
|
| 598 | + protected function _doAnchors_reference_callback($matches) { |
|
| 599 | + $whole_match = $matches[1]; |
|
| 600 | + $link_text = $matches[2]; |
|
| 601 | + $link_id =& $matches[3]; |
|
| 602 | + |
|
| 603 | + if ($link_id == "") { |
|
| 604 | + # for shortcut links like [this][] or [this]. |
|
| 605 | + $link_id = $link_text; |
|
| 606 | + } |
|
| 607 | 607 | |
| 608 | - # lower-case and turn embedded newlines into spaces |
|
| 609 | - $link_id = strtolower($link_id); |
|
| 610 | - $link_id = preg_replace('{[ ]?\n}', ' ', $link_id); |
|
| 608 | + # lower-case and turn embedded newlines into spaces |
|
| 609 | + $link_id = strtolower($link_id); |
|
| 610 | + $link_id = preg_replace('{[ ]?\n}', ' ', $link_id); |
|
| 611 | 611 | |
| 612 | - if (isset($this->urls[$link_id])) { |
|
| 613 | - $url = $this->urls[$link_id]; |
|
| 614 | - $url = $this->encodeURLAttribute($url); |
|
| 612 | + if (isset($this->urls[$link_id])) { |
|
| 613 | + $url = $this->urls[$link_id]; |
|
| 614 | + $url = $this->encodeURLAttribute($url); |
|
| 615 | 615 | |
| 616 | - $result = "<a href=\"$url\""; |
|
| 617 | - if ( isset( $this->titles[$link_id] ) ) { |
|
| 618 | - $title = $this->titles[$link_id]; |
|
| 619 | - $title = $this->encodeAttribute($title); |
|
| 620 | - $result .= " title=\"$title\""; |
|
| 621 | - } |
|
| 616 | + $result = "<a href=\"$url\""; |
|
| 617 | + if ( isset( $this->titles[$link_id] ) ) { |
|
| 618 | + $title = $this->titles[$link_id]; |
|
| 619 | + $title = $this->encodeAttribute($title); |
|
| 620 | + $result .= " title=\"$title\""; |
|
| 621 | + } |
|
| 622 | 622 | |
| 623 | - $link_text = $this->runSpanGamut($link_text); |
|
| 624 | - $result .= ">$link_text</a>"; |
|
| 625 | - $result = $this->hashPart($result); |
|
| 626 | - } |
|
| 627 | - else { |
|
| 628 | - $result = $whole_match; |
|
| 629 | - } |
|
| 630 | - return $result; |
|
| 631 | - } |
|
| 632 | - protected function _doAnchors_inline_callback($matches) { |
|
| 633 | - $whole_match = $matches[1]; |
|
| 634 | - $link_text = $this->runSpanGamut($matches[2]); |
|
| 635 | - $url = $matches[3] == '' ? $matches[4] : $matches[3]; |
|
| 636 | - $title =& $matches[7]; |
|
| 637 | - |
|
| 638 | - // if the URL was of the form <s p a c e s> it got caught by the HTML |
|
| 639 | - // tag parser and hashed. Need to reverse the process before using the URL. |
|
| 640 | - $unhashed = $this->unhash($url); |
|
| 641 | - if ($unhashed != $url) |
|
| 642 | - $url = preg_replace('/^<(.*)>$/', '\1', $unhashed); |
|
| 643 | - |
|
| 644 | - $url = $this->encodeURLAttribute($url); |
|
| 645 | - |
|
| 646 | - $result = "<a href=\"$url\""; |
|
| 647 | - if (isset($title)) { |
|
| 648 | - $title = $this->encodeAttribute($title); |
|
| 649 | - $result .= " title=\"$title\""; |
|
| 650 | - } |
|
| 623 | + $link_text = $this->runSpanGamut($link_text); |
|
| 624 | + $result .= ">$link_text</a>"; |
|
| 625 | + $result = $this->hashPart($result); |
|
| 626 | + } |
|
| 627 | + else { |
|
| 628 | + $result = $whole_match; |
|
| 629 | + } |
|
| 630 | + return $result; |
|
| 631 | + } |
|
| 632 | + protected function _doAnchors_inline_callback($matches) { |
|
| 633 | + $whole_match = $matches[1]; |
|
| 634 | + $link_text = $this->runSpanGamut($matches[2]); |
|
| 635 | + $url = $matches[3] == '' ? $matches[4] : $matches[3]; |
|
| 636 | + $title =& $matches[7]; |
|
| 637 | + |
|
| 638 | + // if the URL was of the form <s p a c e s> it got caught by the HTML |
|
| 639 | + // tag parser and hashed. Need to reverse the process before using the URL. |
|
| 640 | + $unhashed = $this->unhash($url); |
|
| 641 | + if ($unhashed != $url) |
|
| 642 | + $url = preg_replace('/^<(.*)>$/', '\1', $unhashed); |
|
| 643 | + |
|
| 644 | + $url = $this->encodeURLAttribute($url); |
|
| 645 | + |
|
| 646 | + $result = "<a href=\"$url\""; |
|
| 647 | + if (isset($title)) { |
|
| 648 | + $title = $this->encodeAttribute($title); |
|
| 649 | + $result .= " title=\"$title\""; |
|
| 650 | + } |
|
| 651 | 651 | |
| 652 | - $link_text = $this->runSpanGamut($link_text); |
|
| 653 | - $result .= ">$link_text</a>"; |
|
| 652 | + $link_text = $this->runSpanGamut($link_text); |
|
| 653 | + $result .= ">$link_text</a>"; |
|
| 654 | 654 | |
| 655 | - return $this->hashPart($result); |
|
| 656 | - } |
|
| 655 | + return $this->hashPart($result); |
|
| 656 | + } |
|
| 657 | 657 | |
| 658 | 658 | |
| 659 | - protected function doImages($text) { |
|
| 660 | - # |
|
| 661 | - # Turn Markdown image shortcuts into <img> tags. |
|
| 662 | - # |
|
| 663 | - # |
|
| 664 | - # First, handle reference-style labeled images: ![alt text][id] |
|
| 665 | - # |
|
| 666 | - $text = preg_replace_callback('{ |
|
| 659 | + protected function doImages($text) { |
|
| 660 | + # |
|
| 661 | + # Turn Markdown image shortcuts into <img> tags. |
|
| 662 | + # |
|
| 663 | + # |
|
| 664 | + # First, handle reference-style labeled images: ![alt text][id] |
|
| 665 | + # |
|
| 666 | + $text = preg_replace_callback('{ |
|
| 667 | 667 | ( # wrap whole match in $1 |
| 668 | 668 | !\[ |
| 669 | 669 | ('.$this->nested_brackets_re.') # alt text = $2 |
@@ -678,13 +678,13 @@ discard block |
||
| 678 | 678 | |
| 679 | 679 | ) |
| 680 | 680 | }xs', |
| 681 | - array($this, '_doImages_reference_callback'), $text); |
|
| 681 | + array($this, '_doImages_reference_callback'), $text); |
|
| 682 | 682 | |
| 683 | - # |
|
| 684 | - # Next, handle inline images:  |
|
| 685 | - # Don't forget: encode * and _ |
|
| 686 | - # |
|
| 687 | - $text = preg_replace_callback('{ |
|
| 683 | + # |
|
| 684 | + # Next, handle inline images:  |
|
| 685 | + # Don't forget: encode * and _ |
|
| 686 | + # |
|
| 687 | + $text = preg_replace_callback('{ |
|
| 688 | 688 | ( # wrap whole match in $1 |
| 689 | 689 | !\[ |
| 690 | 690 | ('.$this->nested_brackets_re.') # alt text = $2 |
@@ -707,76 +707,76 @@ discard block |
||
| 707 | 707 | \) |
| 708 | 708 | ) |
| 709 | 709 | }xs', |
| 710 | - array($this, '_doImages_inline_callback'), $text); |
|
| 711 | - |
|
| 712 | - return $text; |
|
| 713 | - } |
|
| 714 | - protected function _doImages_reference_callback($matches) { |
|
| 715 | - $whole_match = $matches[1]; |
|
| 716 | - $alt_text = $matches[2]; |
|
| 717 | - $link_id = strtolower($matches[3]); |
|
| 718 | - |
|
| 719 | - if ($link_id == "") { |
|
| 720 | - $link_id = strtolower($alt_text); # for shortcut links like ![this][]. |
|
| 721 | - } |
|
| 722 | - |
|
| 723 | - $alt_text = $this->encodeAttribute($alt_text); |
|
| 724 | - if (isset($this->urls[$link_id])) { |
|
| 725 | - $url = $this->encodeURLAttribute($this->urls[$link_id]); |
|
| 726 | - $result = "<img src=\"$url\" alt=\"$alt_text\""; |
|
| 727 | - if (isset($this->titles[$link_id])) { |
|
| 728 | - $title = $this->titles[$link_id]; |
|
| 729 | - $title = $this->encodeAttribute($title); |
|
| 730 | - $result .= " title=\"$title\""; |
|
| 731 | - } |
|
| 732 | - $result .= $this->empty_element_suffix; |
|
| 733 | - $result = $this->hashPart($result); |
|
| 734 | - } |
|
| 735 | - else { |
|
| 736 | - # If there's no such link ID, leave intact: |
|
| 737 | - $result = $whole_match; |
|
| 738 | - } |
|
| 739 | - |
|
| 740 | - return $result; |
|
| 741 | - } |
|
| 742 | - protected function _doImages_inline_callback($matches) { |
|
| 743 | - $whole_match = $matches[1]; |
|
| 744 | - $alt_text = $matches[2]; |
|
| 745 | - $url = $matches[3] == '' ? $matches[4] : $matches[3]; |
|
| 746 | - $title =& $matches[7]; |
|
| 747 | - |
|
| 748 | - $alt_text = $this->encodeAttribute($alt_text); |
|
| 749 | - $url = $this->encodeURLAttribute($url); |
|
| 750 | - $result = "<img src=\"$url\" alt=\"$alt_text\""; |
|
| 751 | - if (isset($title)) { |
|
| 752 | - $title = $this->encodeAttribute($title); |
|
| 753 | - $result .= " title=\"$title\""; # $title already quoted |
|
| 754 | - } |
|
| 755 | - $result .= $this->empty_element_suffix; |
|
| 756 | - |
|
| 757 | - return $this->hashPart($result); |
|
| 758 | - } |
|
| 759 | - |
|
| 760 | - |
|
| 761 | - protected function doHeaders($text) { |
|
| 762 | - # Setext-style headers: |
|
| 763 | - # Header 1 |
|
| 764 | - # ======== |
|
| 765 | - # |
|
| 766 | - # Header 2 |
|
| 767 | - # -------- |
|
| 768 | - # |
|
| 769 | - $text = preg_replace_callback('{ ^(.+?)[ ]*\n(=+|-+)[ ]*\n+ }mx', |
|
| 770 | - array($this, '_doHeaders_callback_setext'), $text); |
|
| 771 | - |
|
| 772 | - # atx-style headers: |
|
| 773 | - # # Header 1 |
|
| 774 | - # ## Header 2 |
|
| 775 | - # ## Header 2 with closing hashes ## |
|
| 776 | - # ... |
|
| 777 | - # ###### Header 6 |
|
| 778 | - # |
|
| 779 | - $text = preg_replace_callback('{ |
|
| 710 | + array($this, '_doImages_inline_callback'), $text); |
|
| 711 | + |
|
| 712 | + return $text; |
|
| 713 | + } |
|
| 714 | + protected function _doImages_reference_callback($matches) { |
|
| 715 | + $whole_match = $matches[1]; |
|
| 716 | + $alt_text = $matches[2]; |
|
| 717 | + $link_id = strtolower($matches[3]); |
|
| 718 | + |
|
| 719 | + if ($link_id == "") { |
|
| 720 | + $link_id = strtolower($alt_text); # for shortcut links like ![this][]. |
|
| 721 | + } |
|
| 722 | + |
|
| 723 | + $alt_text = $this->encodeAttribute($alt_text); |
|
| 724 | + if (isset($this->urls[$link_id])) { |
|
| 725 | + $url = $this->encodeURLAttribute($this->urls[$link_id]); |
|
| 726 | + $result = "<img src=\"$url\" alt=\"$alt_text\""; |
|
| 727 | + if (isset($this->titles[$link_id])) { |
|
| 728 | + $title = $this->titles[$link_id]; |
|
| 729 | + $title = $this->encodeAttribute($title); |
|
| 730 | + $result .= " title=\"$title\""; |
|
| 731 | + } |
|
| 732 | + $result .= $this->empty_element_suffix; |
|
| 733 | + $result = $this->hashPart($result); |
|
| 734 | + } |
|
| 735 | + else { |
|
| 736 | + # If there's no such link ID, leave intact: |
|
| 737 | + $result = $whole_match; |
|
| 738 | + } |
|
| 739 | + |
|
| 740 | + return $result; |
|
| 741 | + } |
|
| 742 | + protected function _doImages_inline_callback($matches) { |
|
| 743 | + $whole_match = $matches[1]; |
|
| 744 | + $alt_text = $matches[2]; |
|
| 745 | + $url = $matches[3] == '' ? $matches[4] : $matches[3]; |
|
| 746 | + $title =& $matches[7]; |
|
| 747 | + |
|
| 748 | + $alt_text = $this->encodeAttribute($alt_text); |
|
| 749 | + $url = $this->encodeURLAttribute($url); |
|
| 750 | + $result = "<img src=\"$url\" alt=\"$alt_text\""; |
|
| 751 | + if (isset($title)) { |
|
| 752 | + $title = $this->encodeAttribute($title); |
|
| 753 | + $result .= " title=\"$title\""; # $title already quoted |
|
| 754 | + } |
|
| 755 | + $result .= $this->empty_element_suffix; |
|
| 756 | + |
|
| 757 | + return $this->hashPart($result); |
|
| 758 | + } |
|
| 759 | + |
|
| 760 | + |
|
| 761 | + protected function doHeaders($text) { |
|
| 762 | + # Setext-style headers: |
|
| 763 | + # Header 1 |
|
| 764 | + # ======== |
|
| 765 | + # |
|
| 766 | + # Header 2 |
|
| 767 | + # -------- |
|
| 768 | + # |
|
| 769 | + $text = preg_replace_callback('{ ^(.+?)[ ]*\n(=+|-+)[ ]*\n+ }mx', |
|
| 770 | + array($this, '_doHeaders_callback_setext'), $text); |
|
| 771 | + |
|
| 772 | + # atx-style headers: |
|
| 773 | + # # Header 1 |
|
| 774 | + # ## Header 2 |
|
| 775 | + # ## Header 2 with closing hashes ## |
|
| 776 | + # ... |
|
| 777 | + # ###### Header 6 |
|
| 778 | + # |
|
| 779 | + $text = preg_replace_callback('{ |
|
| 780 | 780 | ^(\#{1,6}) # $1 = string of #\'s |
| 781 | 781 | [ ]* |
| 782 | 782 | (.+?) # $2 = Header text |
@@ -784,69 +784,69 @@ discard block |
||
| 784 | 784 | \#* # optional closing #\'s (not counted) |
| 785 | 785 | \n+ |
| 786 | 786 | }xm', |
| 787 | - array($this, '_doHeaders_callback_atx'), $text); |
|
| 787 | + array($this, '_doHeaders_callback_atx'), $text); |
|
| 788 | 788 | |
| 789 | - return $text; |
|
| 790 | - } |
|
| 789 | + return $text; |
|
| 790 | + } |
|
| 791 | 791 | |
| 792 | - protected function _doHeaders_callback_setext($matches) { |
|
| 793 | - # Terrible hack to check we haven't found an empty list item. |
|
| 794 | - if ($matches[2] == '-' && preg_match('{^-(?: |$)}', $matches[1])) |
|
| 795 | - return $matches[0]; |
|
| 792 | + protected function _doHeaders_callback_setext($matches) { |
|
| 793 | + # Terrible hack to check we haven't found an empty list item. |
|
| 794 | + if ($matches[2] == '-' && preg_match('{^-(?: |$)}', $matches[1])) |
|
| 795 | + return $matches[0]; |
|
| 796 | 796 | |
| 797 | - $level = $matches[2]{0} == '=' ? 1 : 2; |
|
| 798 | - |
|
| 799 | - # id attribute generation |
|
| 800 | - $idAtt = $this->_generateIdFromHeaderValue($matches[1]); |
|
| 801 | - |
|
| 802 | - $block = "<h$level$idAtt>".$this->runSpanGamut($matches[1])."</h$level>"; |
|
| 803 | - return "\n" . $this->hashBlock($block) . "\n\n"; |
|
| 804 | - } |
|
| 805 | - protected function _doHeaders_callback_atx($matches) { |
|
| 806 | - |
|
| 807 | - # id attribute generation |
|
| 808 | - $idAtt = $this->_generateIdFromHeaderValue($matches[2]); |
|
| 809 | - |
|
| 810 | - $level = strlen($matches[1]); |
|
| 811 | - $block = "<h$level$idAtt>".$this->runSpanGamut($matches[2])."</h$level>"; |
|
| 812 | - return "\n" . $this->hashBlock($block) . "\n\n"; |
|
| 813 | - } |
|
| 814 | - |
|
| 815 | - protected function _generateIdFromHeaderValue($headerValue) { |
|
| 816 | - |
|
| 817 | - # if a header_id_func property is set, we can use it to automatically |
|
| 818 | - # generate an id attribute. |
|
| 819 | - # |
|
| 820 | - # This method returns a string in the form id="foo", or an empty string |
|
| 821 | - # otherwise. |
|
| 822 | - if (!is_callable($this->header_id_func)) { |
|
| 823 | - return ""; |
|
| 824 | - } |
|
| 825 | - $idValue = call_user_func($this->header_id_func, $headerValue); |
|
| 826 | - if (!$idValue) return ""; |
|
| 827 | - |
|
| 828 | - return ' id="' . $this->encodeAttribute($idValue) . '"'; |
|
| 829 | - |
|
| 830 | - } |
|
| 831 | - |
|
| 832 | - protected function doLists($text) { |
|
| 833 | - # |
|
| 834 | - # Form HTML ordered (numbered) and unordered (bulleted) lists. |
|
| 835 | - # |
|
| 836 | - $less_than_tab = $this->tab_width - 1; |
|
| 837 | - |
|
| 838 | - # Re-usable patterns to match list item bullets and number markers: |
|
| 839 | - $marker_ul_re = '[*+-]'; |
|
| 840 | - $marker_ol_re = '\d+[\.]'; |
|
| 841 | - |
|
| 842 | - $markers_relist = array( |
|
| 843 | - $marker_ul_re => $marker_ol_re, |
|
| 844 | - $marker_ol_re => $marker_ul_re, |
|
| 845 | - ); |
|
| 846 | - |
|
| 847 | - foreach ($markers_relist as $marker_re => $other_marker_re) { |
|
| 848 | - # Re-usable pattern to match any entirel ul or ol list: |
|
| 849 | - $whole_list_re = ' |
|
| 797 | + $level = $matches[2]{0} == '=' ? 1 : 2; |
|
| 798 | + |
|
| 799 | + # id attribute generation |
|
| 800 | + $idAtt = $this->_generateIdFromHeaderValue($matches[1]); |
|
| 801 | + |
|
| 802 | + $block = "<h$level$idAtt>".$this->runSpanGamut($matches[1])."</h$level>"; |
|
| 803 | + return "\n" . $this->hashBlock($block) . "\n\n"; |
|
| 804 | + } |
|
| 805 | + protected function _doHeaders_callback_atx($matches) { |
|
| 806 | + |
|
| 807 | + # id attribute generation |
|
| 808 | + $idAtt = $this->_generateIdFromHeaderValue($matches[2]); |
|
| 809 | + |
|
| 810 | + $level = strlen($matches[1]); |
|
| 811 | + $block = "<h$level$idAtt>".$this->runSpanGamut($matches[2])."</h$level>"; |
|
| 812 | + return "\n" . $this->hashBlock($block) . "\n\n"; |
|
| 813 | + } |
|
| 814 | + |
|
| 815 | + protected function _generateIdFromHeaderValue($headerValue) { |
|
| 816 | + |
|
| 817 | + # if a header_id_func property is set, we can use it to automatically |
|
| 818 | + # generate an id attribute. |
|
| 819 | + # |
|
| 820 | + # This method returns a string in the form id="foo", or an empty string |
|
| 821 | + # otherwise. |
|
| 822 | + if (!is_callable($this->header_id_func)) { |
|
| 823 | + return ""; |
|
| 824 | + } |
|
| 825 | + $idValue = call_user_func($this->header_id_func, $headerValue); |
|
| 826 | + if (!$idValue) return ""; |
|
| 827 | + |
|
| 828 | + return ' id="' . $this->encodeAttribute($idValue) . '"'; |
|
| 829 | + |
|
| 830 | + } |
|
| 831 | + |
|
| 832 | + protected function doLists($text) { |
|
| 833 | + # |
|
| 834 | + # Form HTML ordered (numbered) and unordered (bulleted) lists. |
|
| 835 | + # |
|
| 836 | + $less_than_tab = $this->tab_width - 1; |
|
| 837 | + |
|
| 838 | + # Re-usable patterns to match list item bullets and number markers: |
|
| 839 | + $marker_ul_re = '[*+-]'; |
|
| 840 | + $marker_ol_re = '\d+[\.]'; |
|
| 841 | + |
|
| 842 | + $markers_relist = array( |
|
| 843 | + $marker_ul_re => $marker_ol_re, |
|
| 844 | + $marker_ol_re => $marker_ul_re, |
|
| 845 | + ); |
|
| 846 | + |
|
| 847 | + foreach ($markers_relist as $marker_re => $other_marker_re) { |
|
| 848 | + # Re-usable pattern to match any entirel ul or ol list: |
|
| 849 | + $whole_list_re = ' |
|
| 850 | 850 | ( # $1 = whole list |
| 851 | 851 | ( # $2 |
| 852 | 852 | ([ ]{0,'.$less_than_tab.'}) # $3 = number of spaces |
@@ -873,96 +873,96 @@ discard block |
||
| 873 | 873 | ) |
| 874 | 874 | '; // mx |
| 875 | 875 | |
| 876 | - # We use a different prefix before nested lists than top-level lists. |
|
| 877 | - # See extended comment in _ProcessListItems(). |
|
| 876 | + # We use a different prefix before nested lists than top-level lists. |
|
| 877 | + # See extended comment in _ProcessListItems(). |
|
| 878 | 878 | |
| 879 | - if ($this->list_level) { |
|
| 880 | - $text = preg_replace_callback('{ |
|
| 879 | + if ($this->list_level) { |
|
| 880 | + $text = preg_replace_callback('{ |
|
| 881 | 881 | ^ |
| 882 | 882 | '.$whole_list_re.' |
| 883 | 883 | }mx', |
| 884 | - array($this, '_doLists_callback'), $text); |
|
| 885 | - } |
|
| 886 | - else { |
|
| 887 | - $text = preg_replace_callback('{ |
|
| 884 | + array($this, '_doLists_callback'), $text); |
|
| 885 | + } |
|
| 886 | + else { |
|
| 887 | + $text = preg_replace_callback('{ |
|
| 888 | 888 | (?:(?<=\n)\n|\A\n?) # Must eat the newline |
| 889 | 889 | '.$whole_list_re.' |
| 890 | 890 | }mx', |
| 891 | - array($this, '_doLists_callback'), $text); |
|
| 892 | - } |
|
| 893 | - } |
|
| 894 | - |
|
| 895 | - return $text; |
|
| 896 | - } |
|
| 897 | - protected function _doLists_callback($matches) { |
|
| 898 | - # Re-usable patterns to match list item bullets and number markers: |
|
| 899 | - $marker_ul_re = '[*+-]'; |
|
| 900 | - $marker_ol_re = '\d+[\.]'; |
|
| 901 | - $marker_any_re = "(?:$marker_ul_re|$marker_ol_re)"; |
|
| 902 | - $marker_ol_start_re = '[0-9]+'; |
|
| 903 | - |
|
| 904 | - $list = $matches[1]; |
|
| 905 | - $list_type = preg_match("/$marker_ul_re/", $matches[4]) ? "ul" : "ol"; |
|
| 906 | - |
|
| 907 | - $marker_any_re = ( $list_type == "ul" ? $marker_ul_re : $marker_ol_re ); |
|
| 908 | - |
|
| 909 | - $list .= "\n"; |
|
| 910 | - $result = $this->processListItems($list, $marker_any_re); |
|
| 911 | - |
|
| 912 | - $ol_start = 1; |
|
| 913 | - if ($this->enhanced_ordered_list) { |
|
| 914 | - # Get the start number for ordered list. |
|
| 915 | - if ($list_type == 'ol') { |
|
| 916 | - $ol_start_array = array(); |
|
| 917 | - $ol_start_check = preg_match("/$marker_ol_start_re/", $matches[4], $ol_start_array); |
|
| 918 | - if ($ol_start_check){ |
|
| 919 | - $ol_start = $ol_start_array[0]; |
|
| 920 | - } |
|
| 921 | - } |
|
| 922 | - } |
|
| 923 | - |
|
| 924 | - if ($ol_start > 1 && $list_type == 'ol'){ |
|
| 925 | - $result = $this->hashBlock("<$list_type start=\"$ol_start\">\n" . $result . "</$list_type>"); |
|
| 926 | - } else { |
|
| 927 | - $result = $this->hashBlock("<$list_type>\n" . $result . "</$list_type>"); |
|
| 928 | - } |
|
| 929 | - return "\n". $result ."\n\n"; |
|
| 930 | - } |
|
| 931 | - |
|
| 932 | - protected $list_level = 0; |
|
| 933 | - |
|
| 934 | - protected function processListItems($list_str, $marker_any_re) { |
|
| 935 | - # |
|
| 936 | - # Process the contents of a single ordered or unordered list, splitting it |
|
| 937 | - # into individual list items. |
|
| 938 | - # |
|
| 939 | - # The $this->list_level global keeps track of when we're inside a list. |
|
| 940 | - # Each time we enter a list, we increment it; when we leave a list, |
|
| 941 | - # we decrement. If it's zero, we're not in a list anymore. |
|
| 942 | - # |
|
| 943 | - # We do this because when we're not inside a list, we want to treat |
|
| 944 | - # something like this: |
|
| 945 | - # |
|
| 946 | - # I recommend upgrading to version |
|
| 947 | - # 8. Oops, now this line is treated |
|
| 948 | - # as a sub-list. |
|
| 949 | - # |
|
| 950 | - # As a single paragraph, despite the fact that the second line starts |
|
| 951 | - # with a digit-period-space sequence. |
|
| 952 | - # |
|
| 953 | - # Whereas when we're inside a list (or sub-list), that line will be |
|
| 954 | - # treated as the start of a sub-list. What a kludge, huh? This is |
|
| 955 | - # an aspect of Markdown's syntax that's hard to parse perfectly |
|
| 956 | - # without resorting to mind-reading. Perhaps the solution is to |
|
| 957 | - # change the syntax rules such that sub-lists must start with a |
|
| 958 | - # starting cardinal number; e.g. "1." or "a.". |
|
| 891 | + array($this, '_doLists_callback'), $text); |
|
| 892 | + } |
|
| 893 | + } |
|
| 894 | + |
|
| 895 | + return $text; |
|
| 896 | + } |
|
| 897 | + protected function _doLists_callback($matches) { |
|
| 898 | + # Re-usable patterns to match list item bullets and number markers: |
|
| 899 | + $marker_ul_re = '[*+-]'; |
|
| 900 | + $marker_ol_re = '\d+[\.]'; |
|
| 901 | + $marker_any_re = "(?:$marker_ul_re|$marker_ol_re)"; |
|
| 902 | + $marker_ol_start_re = '[0-9]+'; |
|
| 903 | + |
|
| 904 | + $list = $matches[1]; |
|
| 905 | + $list_type = preg_match("/$marker_ul_re/", $matches[4]) ? "ul" : "ol"; |
|
| 906 | + |
|
| 907 | + $marker_any_re = ( $list_type == "ul" ? $marker_ul_re : $marker_ol_re ); |
|
| 908 | + |
|
| 909 | + $list .= "\n"; |
|
| 910 | + $result = $this->processListItems($list, $marker_any_re); |
|
| 911 | + |
|
| 912 | + $ol_start = 1; |
|
| 913 | + if ($this->enhanced_ordered_list) { |
|
| 914 | + # Get the start number for ordered list. |
|
| 915 | + if ($list_type == 'ol') { |
|
| 916 | + $ol_start_array = array(); |
|
| 917 | + $ol_start_check = preg_match("/$marker_ol_start_re/", $matches[4], $ol_start_array); |
|
| 918 | + if ($ol_start_check){ |
|
| 919 | + $ol_start = $ol_start_array[0]; |
|
| 920 | + } |
|
| 921 | + } |
|
| 922 | + } |
|
| 923 | + |
|
| 924 | + if ($ol_start > 1 && $list_type == 'ol'){ |
|
| 925 | + $result = $this->hashBlock("<$list_type start=\"$ol_start\">\n" . $result . "</$list_type>"); |
|
| 926 | + } else { |
|
| 927 | + $result = $this->hashBlock("<$list_type>\n" . $result . "</$list_type>"); |
|
| 928 | + } |
|
| 929 | + return "\n". $result ."\n\n"; |
|
| 930 | + } |
|
| 931 | + |
|
| 932 | + protected $list_level = 0; |
|
| 933 | + |
|
| 934 | + protected function processListItems($list_str, $marker_any_re) { |
|
| 935 | + # |
|
| 936 | + # Process the contents of a single ordered or unordered list, splitting it |
|
| 937 | + # into individual list items. |
|
| 938 | + # |
|
| 939 | + # The $this->list_level global keeps track of when we're inside a list. |
|
| 940 | + # Each time we enter a list, we increment it; when we leave a list, |
|
| 941 | + # we decrement. If it's zero, we're not in a list anymore. |
|
| 942 | + # |
|
| 943 | + # We do this because when we're not inside a list, we want to treat |
|
| 944 | + # something like this: |
|
| 945 | + # |
|
| 946 | + # I recommend upgrading to version |
|
| 947 | + # 8. Oops, now this line is treated |
|
| 948 | + # as a sub-list. |
|
| 949 | + # |
|
| 950 | + # As a single paragraph, despite the fact that the second line starts |
|
| 951 | + # with a digit-period-space sequence. |
|
| 952 | + # |
|
| 953 | + # Whereas when we're inside a list (or sub-list), that line will be |
|
| 954 | + # treated as the start of a sub-list. What a kludge, huh? This is |
|
| 955 | + # an aspect of Markdown's syntax that's hard to parse perfectly |
|
| 956 | + # without resorting to mind-reading. Perhaps the solution is to |
|
| 957 | + # change the syntax rules such that sub-lists must start with a |
|
| 958 | + # starting cardinal number; e.g. "1." or "a.". |
|
| 959 | 959 | |
| 960 | - $this->list_level++; |
|
| 960 | + $this->list_level++; |
|
| 961 | 961 | |
| 962 | - # trim trailing blank lines: |
|
| 963 | - $list_str = preg_replace("/\n{2,}\\z/", "\n", $list_str); |
|
| 962 | + # trim trailing blank lines: |
|
| 963 | + $list_str = preg_replace("/\n{2,}\\z/", "\n", $list_str); |
|
| 964 | 964 | |
| 965 | - $list_str = preg_replace_callback('{ |
|
| 965 | + $list_str = preg_replace_callback('{ |
|
| 966 | 966 | (\n)? # leading line = $1 |
| 967 | 967 | (^[ ]*) # leading whitespace = $2 |
| 968 | 968 | ('.$marker_any_re.' # list marker and space = $3 |
@@ -972,41 +972,41 @@ discard block |
||
| 972 | 972 | (?:(\n+(?=\n))|\n) # tailing blank line = $5 |
| 973 | 973 | (?= \n* (\z | \2 ('.$marker_any_re.') (?:[ ]+|(?=\n)))) |
| 974 | 974 | }xm', |
| 975 | - array($this, '_processListItems_callback'), $list_str); |
|
| 976 | - |
|
| 977 | - $this->list_level--; |
|
| 978 | - return $list_str; |
|
| 979 | - } |
|
| 980 | - protected function _processListItems_callback($matches) { |
|
| 981 | - $item = $matches[4]; |
|
| 982 | - $leading_line =& $matches[1]; |
|
| 983 | - $leading_space =& $matches[2]; |
|
| 984 | - $marker_space = $matches[3]; |
|
| 985 | - $tailing_blank_line =& $matches[5]; |
|
| 986 | - |
|
| 987 | - if ($leading_line || $tailing_blank_line || |
|
| 988 | - preg_match('/\n{2,}/', $item)) |
|
| 989 | - { |
|
| 990 | - # Replace marker with the appropriate whitespace indentation |
|
| 991 | - $item = $leading_space . str_repeat(' ', strlen($marker_space)) . $item; |
|
| 992 | - $item = $this->runBlockGamut($this->outdent($item)."\n"); |
|
| 993 | - } |
|
| 994 | - else { |
|
| 995 | - # Recursion for sub-lists: |
|
| 996 | - $item = $this->doLists($this->outdent($item)); |
|
| 997 | - $item = preg_replace('/\n+$/', '', $item); |
|
| 998 | - $item = $this->runSpanGamut($item); |
|
| 999 | - } |
|
| 1000 | - |
|
| 1001 | - return "<li>" . $item . "</li>\n"; |
|
| 1002 | - } |
|
| 1003 | - |
|
| 1004 | - |
|
| 1005 | - protected function doCodeBlocks($text) { |
|
| 1006 | - # |
|
| 1007 | - # Process Markdown `<pre><code>` blocks. |
|
| 1008 | - # |
|
| 1009 | - $text = preg_replace_callback('{ |
|
| 975 | + array($this, '_processListItems_callback'), $list_str); |
|
| 976 | + |
|
| 977 | + $this->list_level--; |
|
| 978 | + return $list_str; |
|
| 979 | + } |
|
| 980 | + protected function _processListItems_callback($matches) { |
|
| 981 | + $item = $matches[4]; |
|
| 982 | + $leading_line =& $matches[1]; |
|
| 983 | + $leading_space =& $matches[2]; |
|
| 984 | + $marker_space = $matches[3]; |
|
| 985 | + $tailing_blank_line =& $matches[5]; |
|
| 986 | + |
|
| 987 | + if ($leading_line || $tailing_blank_line || |
|
| 988 | + preg_match('/\n{2,}/', $item)) |
|
| 989 | + { |
|
| 990 | + # Replace marker with the appropriate whitespace indentation |
|
| 991 | + $item = $leading_space . str_repeat(' ', strlen($marker_space)) . $item; |
|
| 992 | + $item = $this->runBlockGamut($this->outdent($item)."\n"); |
|
| 993 | + } |
|
| 994 | + else { |
|
| 995 | + # Recursion for sub-lists: |
|
| 996 | + $item = $this->doLists($this->outdent($item)); |
|
| 997 | + $item = preg_replace('/\n+$/', '', $item); |
|
| 998 | + $item = $this->runSpanGamut($item); |
|
| 999 | + } |
|
| 1000 | + |
|
| 1001 | + return "<li>" . $item . "</li>\n"; |
|
| 1002 | + } |
|
| 1003 | + |
|
| 1004 | + |
|
| 1005 | + protected function doCodeBlocks($text) { |
|
| 1006 | + # |
|
| 1007 | + # Process Markdown `<pre><code>` blocks. |
|
| 1008 | + # |
|
| 1009 | + $text = preg_replace_callback('{ |
|
| 1010 | 1010 | (?:\n\n|\A\n?) |
| 1011 | 1011 | ( # $1 = the code block -- one or more lines, starting with a space/tab |
| 1012 | 1012 | (?> |
@@ -1016,197 +1016,197 @@ discard block |
||
| 1016 | 1016 | ) |
| 1017 | 1017 | ((?=^[ ]{0,'.$this->tab_width.'}\S)|\Z) # Lookahead for non-space at line-start, or end of doc |
| 1018 | 1018 | }xm', |
| 1019 | - array($this, '_doCodeBlocks_callback'), $text); |
|
| 1020 | - |
|
| 1021 | - return $text; |
|
| 1022 | - } |
|
| 1023 | - protected function _doCodeBlocks_callback($matches) { |
|
| 1024 | - $codeblock = $matches[1]; |
|
| 1025 | - |
|
| 1026 | - $codeblock = $this->outdent($codeblock); |
|
| 1027 | - $codeblock = htmlspecialchars($codeblock, ENT_NOQUOTES); |
|
| 1028 | - |
|
| 1029 | - # trim leading newlines and trailing newlines |
|
| 1030 | - $codeblock = preg_replace('/\A\n+|\n+\z/', '', $codeblock); |
|
| 1031 | - |
|
| 1032 | - $codeblock = "<pre><code>$codeblock\n</code></pre>"; |
|
| 1033 | - return "\n\n".$this->hashBlock($codeblock)."\n\n"; |
|
| 1034 | - } |
|
| 1035 | - |
|
| 1036 | - |
|
| 1037 | - protected function makeCodeSpan($code) { |
|
| 1038 | - # |
|
| 1039 | - # Create a code span markup for $code. Called from handleSpanToken. |
|
| 1040 | - # |
|
| 1041 | - $code = htmlspecialchars(trim($code), ENT_NOQUOTES); |
|
| 1042 | - return $this->hashPart("<code>$code</code>"); |
|
| 1043 | - } |
|
| 1044 | - |
|
| 1045 | - |
|
| 1046 | - protected $em_relist = array( |
|
| 1047 | - '' => '(?:(?<!\*)\*(?!\*)|(?<!_)_(?!_))(?![\.,:;]?\s)', |
|
| 1048 | - '*' => '(?<![\s*])\*(?!\*)', |
|
| 1049 | - '_' => '(?<![\s_])_(?!_)', |
|
| 1050 | - ); |
|
| 1051 | - protected $strong_relist = array( |
|
| 1052 | - '' => '(?:(?<!\*)\*\*(?!\*)|(?<!_)__(?!_))(?![\.,:;]?\s)', |
|
| 1053 | - '**' => '(?<![\s*])\*\*(?!\*)', |
|
| 1054 | - '__' => '(?<![\s_])__(?!_)', |
|
| 1055 | - ); |
|
| 1056 | - protected $em_strong_relist = array( |
|
| 1057 | - '' => '(?:(?<!\*)\*\*\*(?!\*)|(?<!_)___(?!_))(?![\.,:;]?\s)', |
|
| 1058 | - '***' => '(?<![\s*])\*\*\*(?!\*)', |
|
| 1059 | - '___' => '(?<![\s_])___(?!_)', |
|
| 1060 | - ); |
|
| 1061 | - protected $em_strong_prepared_relist; |
|
| 1019 | + array($this, '_doCodeBlocks_callback'), $text); |
|
| 1020 | + |
|
| 1021 | + return $text; |
|
| 1022 | + } |
|
| 1023 | + protected function _doCodeBlocks_callback($matches) { |
|
| 1024 | + $codeblock = $matches[1]; |
|
| 1025 | + |
|
| 1026 | + $codeblock = $this->outdent($codeblock); |
|
| 1027 | + $codeblock = htmlspecialchars($codeblock, ENT_NOQUOTES); |
|
| 1028 | + |
|
| 1029 | + # trim leading newlines and trailing newlines |
|
| 1030 | + $codeblock = preg_replace('/\A\n+|\n+\z/', '', $codeblock); |
|
| 1031 | + |
|
| 1032 | + $codeblock = "<pre><code>$codeblock\n</code></pre>"; |
|
| 1033 | + return "\n\n".$this->hashBlock($codeblock)."\n\n"; |
|
| 1034 | + } |
|
| 1035 | + |
|
| 1036 | + |
|
| 1037 | + protected function makeCodeSpan($code) { |
|
| 1038 | + # |
|
| 1039 | + # Create a code span markup for $code. Called from handleSpanToken. |
|
| 1040 | + # |
|
| 1041 | + $code = htmlspecialchars(trim($code), ENT_NOQUOTES); |
|
| 1042 | + return $this->hashPart("<code>$code</code>"); |
|
| 1043 | + } |
|
| 1044 | + |
|
| 1045 | + |
|
| 1046 | + protected $em_relist = array( |
|
| 1047 | + '' => '(?:(?<!\*)\*(?!\*)|(?<!_)_(?!_))(?![\.,:;]?\s)', |
|
| 1048 | + '*' => '(?<![\s*])\*(?!\*)', |
|
| 1049 | + '_' => '(?<![\s_])_(?!_)', |
|
| 1050 | + ); |
|
| 1051 | + protected $strong_relist = array( |
|
| 1052 | + '' => '(?:(?<!\*)\*\*(?!\*)|(?<!_)__(?!_))(?![\.,:;]?\s)', |
|
| 1053 | + '**' => '(?<![\s*])\*\*(?!\*)', |
|
| 1054 | + '__' => '(?<![\s_])__(?!_)', |
|
| 1055 | + ); |
|
| 1056 | + protected $em_strong_relist = array( |
|
| 1057 | + '' => '(?:(?<!\*)\*\*\*(?!\*)|(?<!_)___(?!_))(?![\.,:;]?\s)', |
|
| 1058 | + '***' => '(?<![\s*])\*\*\*(?!\*)', |
|
| 1059 | + '___' => '(?<![\s_])___(?!_)', |
|
| 1060 | + ); |
|
| 1061 | + protected $em_strong_prepared_relist; |
|
| 1062 | 1062 | |
| 1063 | - protected function prepareItalicsAndBold() { |
|
| 1064 | - # |
|
| 1065 | - # Prepare regular expressions for searching emphasis tokens in any |
|
| 1066 | - # context. |
|
| 1067 | - # |
|
| 1068 | - foreach ($this->em_relist as $em => $em_re) { |
|
| 1069 | - foreach ($this->strong_relist as $strong => $strong_re) { |
|
| 1070 | - # Construct list of allowed token expressions. |
|
| 1071 | - $token_relist = array(); |
|
| 1072 | - if (isset($this->em_strong_relist["$em$strong"])) { |
|
| 1073 | - $token_relist[] = $this->em_strong_relist["$em$strong"]; |
|
| 1074 | - } |
|
| 1075 | - $token_relist[] = $em_re; |
|
| 1076 | - $token_relist[] = $strong_re; |
|
| 1063 | + protected function prepareItalicsAndBold() { |
|
| 1064 | + # |
|
| 1065 | + # Prepare regular expressions for searching emphasis tokens in any |
|
| 1066 | + # context. |
|
| 1067 | + # |
|
| 1068 | + foreach ($this->em_relist as $em => $em_re) { |
|
| 1069 | + foreach ($this->strong_relist as $strong => $strong_re) { |
|
| 1070 | + # Construct list of allowed token expressions. |
|
| 1071 | + $token_relist = array(); |
|
| 1072 | + if (isset($this->em_strong_relist["$em$strong"])) { |
|
| 1073 | + $token_relist[] = $this->em_strong_relist["$em$strong"]; |
|
| 1074 | + } |
|
| 1075 | + $token_relist[] = $em_re; |
|
| 1076 | + $token_relist[] = $strong_re; |
|
| 1077 | 1077 | |
| 1078 | - # Construct master expression from list. |
|
| 1079 | - $token_re = '{('. implode('|', $token_relist) .')}'; |
|
| 1080 | - $this->em_strong_prepared_relist["$em$strong"] = $token_re; |
|
| 1081 | - } |
|
| 1082 | - } |
|
| 1083 | - } |
|
| 1078 | + # Construct master expression from list. |
|
| 1079 | + $token_re = '{('. implode('|', $token_relist) .')}'; |
|
| 1080 | + $this->em_strong_prepared_relist["$em$strong"] = $token_re; |
|
| 1081 | + } |
|
| 1082 | + } |
|
| 1083 | + } |
|
| 1084 | 1084 | |
| 1085 | - protected function doItalicsAndBold($text) { |
|
| 1086 | - $token_stack = array(''); |
|
| 1087 | - $text_stack = array(''); |
|
| 1088 | - $em = ''; |
|
| 1089 | - $strong = ''; |
|
| 1090 | - $tree_char_em = false; |
|
| 1085 | + protected function doItalicsAndBold($text) { |
|
| 1086 | + $token_stack = array(''); |
|
| 1087 | + $text_stack = array(''); |
|
| 1088 | + $em = ''; |
|
| 1089 | + $strong = ''; |
|
| 1090 | + $tree_char_em = false; |
|
| 1091 | 1091 | |
| 1092 | - while (1) { |
|
| 1093 | - # |
|
| 1094 | - # Get prepared regular expression for seraching emphasis tokens |
|
| 1095 | - # in current context. |
|
| 1096 | - # |
|
| 1097 | - $token_re = $this->em_strong_prepared_relist["$em$strong"]; |
|
| 1092 | + while (1) { |
|
| 1093 | + # |
|
| 1094 | + # Get prepared regular expression for seraching emphasis tokens |
|
| 1095 | + # in current context. |
|
| 1096 | + # |
|
| 1097 | + $token_re = $this->em_strong_prepared_relist["$em$strong"]; |
|
| 1098 | 1098 | |
| 1099 | - # |
|
| 1100 | - # Each loop iteration search for the next emphasis token. |
|
| 1101 | - # Each token is then passed to handleSpanToken. |
|
| 1102 | - # |
|
| 1103 | - $parts = preg_split($token_re, $text, 2, PREG_SPLIT_DELIM_CAPTURE); |
|
| 1104 | - $text_stack[0] .= $parts[0]; |
|
| 1105 | - $token =& $parts[1]; |
|
| 1106 | - $text =& $parts[2]; |
|
| 1099 | + # |
|
| 1100 | + # Each loop iteration search for the next emphasis token. |
|
| 1101 | + # Each token is then passed to handleSpanToken. |
|
| 1102 | + # |
|
| 1103 | + $parts = preg_split($token_re, $text, 2, PREG_SPLIT_DELIM_CAPTURE); |
|
| 1104 | + $text_stack[0] .= $parts[0]; |
|
| 1105 | + $token =& $parts[1]; |
|
| 1106 | + $text =& $parts[2]; |
|
| 1107 | 1107 | |
| 1108 | - if (empty($token)) { |
|
| 1109 | - # Reached end of text span: empty stack without emitting. |
|
| 1110 | - # any more emphasis. |
|
| 1111 | - while ($token_stack[0]) { |
|
| 1112 | - $text_stack[1] .= array_shift($token_stack); |
|
| 1113 | - $text_stack[0] .= array_shift($text_stack); |
|
| 1114 | - } |
|
| 1115 | - break; |
|
| 1116 | - } |
|
| 1108 | + if (empty($token)) { |
|
| 1109 | + # Reached end of text span: empty stack without emitting. |
|
| 1110 | + # any more emphasis. |
|
| 1111 | + while ($token_stack[0]) { |
|
| 1112 | + $text_stack[1] .= array_shift($token_stack); |
|
| 1113 | + $text_stack[0] .= array_shift($text_stack); |
|
| 1114 | + } |
|
| 1115 | + break; |
|
| 1116 | + } |
|
| 1117 | 1117 | |
| 1118 | - $token_len = strlen($token); |
|
| 1119 | - if ($tree_char_em) { |
|
| 1120 | - # Reached closing marker while inside a three-char emphasis. |
|
| 1121 | - if ($token_len == 3) { |
|
| 1122 | - # Three-char closing marker, close em and strong. |
|
| 1123 | - array_shift($token_stack); |
|
| 1124 | - $span = array_shift($text_stack); |
|
| 1125 | - $span = $this->runSpanGamut($span); |
|
| 1126 | - $span = "<strong><em>$span</em></strong>"; |
|
| 1127 | - $text_stack[0] .= $this->hashPart($span); |
|
| 1128 | - $em = ''; |
|
| 1129 | - $strong = ''; |
|
| 1130 | - } else { |
|
| 1131 | - # Other closing marker: close one em or strong and |
|
| 1132 | - # change current token state to match the other |
|
| 1133 | - $token_stack[0] = str_repeat($token{0}, 3-$token_len); |
|
| 1134 | - $tag = $token_len == 2 ? "strong" : "em"; |
|
| 1135 | - $span = $text_stack[0]; |
|
| 1136 | - $span = $this->runSpanGamut($span); |
|
| 1137 | - $span = "<$tag>$span</$tag>"; |
|
| 1138 | - $text_stack[0] = $this->hashPart($span); |
|
| 1139 | - $$tag = ''; # $$tag stands for $em or $strong |
|
| 1140 | - } |
|
| 1141 | - $tree_char_em = false; |
|
| 1142 | - } else if ($token_len == 3) { |
|
| 1143 | - if ($em) { |
|
| 1144 | - # Reached closing marker for both em and strong. |
|
| 1145 | - # Closing strong marker: |
|
| 1146 | - for ($i = 0; $i < 2; ++$i) { |
|
| 1147 | - $shifted_token = array_shift($token_stack); |
|
| 1148 | - $tag = strlen($shifted_token) == 2 ? "strong" : "em"; |
|
| 1149 | - $span = array_shift($text_stack); |
|
| 1150 | - $span = $this->runSpanGamut($span); |
|
| 1151 | - $span = "<$tag>$span</$tag>"; |
|
| 1152 | - $text_stack[0] .= $this->hashPart($span); |
|
| 1153 | - $$tag = ''; # $$tag stands for $em or $strong |
|
| 1154 | - } |
|
| 1155 | - } else { |
|
| 1156 | - # Reached opening three-char emphasis marker. Push on token |
|
| 1157 | - # stack; will be handled by the special condition above. |
|
| 1158 | - $em = $token{0}; |
|
| 1159 | - $strong = "$em$em"; |
|
| 1160 | - array_unshift($token_stack, $token); |
|
| 1161 | - array_unshift($text_stack, ''); |
|
| 1162 | - $tree_char_em = true; |
|
| 1163 | - } |
|
| 1164 | - } else if ($token_len == 2) { |
|
| 1165 | - if ($strong) { |
|
| 1166 | - # Unwind any dangling emphasis marker: |
|
| 1167 | - if (strlen($token_stack[0]) == 1) { |
|
| 1168 | - $text_stack[1] .= array_shift($token_stack); |
|
| 1169 | - $text_stack[0] .= array_shift($text_stack); |
|
| 1170 | - } |
|
| 1171 | - # Closing strong marker: |
|
| 1172 | - array_shift($token_stack); |
|
| 1173 | - $span = array_shift($text_stack); |
|
| 1174 | - $span = $this->runSpanGamut($span); |
|
| 1175 | - $span = "<strong>$span</strong>"; |
|
| 1176 | - $text_stack[0] .= $this->hashPart($span); |
|
| 1177 | - $strong = ''; |
|
| 1178 | - } else { |
|
| 1179 | - array_unshift($token_stack, $token); |
|
| 1180 | - array_unshift($text_stack, ''); |
|
| 1181 | - $strong = $token; |
|
| 1182 | - } |
|
| 1183 | - } else { |
|
| 1184 | - # Here $token_len == 1 |
|
| 1185 | - if ($em) { |
|
| 1186 | - if (strlen($token_stack[0]) == 1) { |
|
| 1187 | - # Closing emphasis marker: |
|
| 1188 | - array_shift($token_stack); |
|
| 1189 | - $span = array_shift($text_stack); |
|
| 1190 | - $span = $this->runSpanGamut($span); |
|
| 1191 | - $span = "<em>$span</em>"; |
|
| 1192 | - $text_stack[0] .= $this->hashPart($span); |
|
| 1193 | - $em = ''; |
|
| 1194 | - } else { |
|
| 1195 | - $text_stack[0] .= $token; |
|
| 1196 | - } |
|
| 1197 | - } else { |
|
| 1198 | - array_unshift($token_stack, $token); |
|
| 1199 | - array_unshift($text_stack, ''); |
|
| 1200 | - $em = $token; |
|
| 1201 | - } |
|
| 1202 | - } |
|
| 1203 | - } |
|
| 1204 | - return $text_stack[0]; |
|
| 1205 | - } |
|
| 1206 | - |
|
| 1207 | - |
|
| 1208 | - protected function doBlockQuotes($text) { |
|
| 1209 | - $text = preg_replace_callback('/ |
|
| 1118 | + $token_len = strlen($token); |
|
| 1119 | + if ($tree_char_em) { |
|
| 1120 | + # Reached closing marker while inside a three-char emphasis. |
|
| 1121 | + if ($token_len == 3) { |
|
| 1122 | + # Three-char closing marker, close em and strong. |
|
| 1123 | + array_shift($token_stack); |
|
| 1124 | + $span = array_shift($text_stack); |
|
| 1125 | + $span = $this->runSpanGamut($span); |
|
| 1126 | + $span = "<strong><em>$span</em></strong>"; |
|
| 1127 | + $text_stack[0] .= $this->hashPart($span); |
|
| 1128 | + $em = ''; |
|
| 1129 | + $strong = ''; |
|
| 1130 | + } else { |
|
| 1131 | + # Other closing marker: close one em or strong and |
|
| 1132 | + # change current token state to match the other |
|
| 1133 | + $token_stack[0] = str_repeat($token{0}, 3-$token_len); |
|
| 1134 | + $tag = $token_len == 2 ? "strong" : "em"; |
|
| 1135 | + $span = $text_stack[0]; |
|
| 1136 | + $span = $this->runSpanGamut($span); |
|
| 1137 | + $span = "<$tag>$span</$tag>"; |
|
| 1138 | + $text_stack[0] = $this->hashPart($span); |
|
| 1139 | + $$tag = ''; # $$tag stands for $em or $strong |
|
| 1140 | + } |
|
| 1141 | + $tree_char_em = false; |
|
| 1142 | + } else if ($token_len == 3) { |
|
| 1143 | + if ($em) { |
|
| 1144 | + # Reached closing marker for both em and strong. |
|
| 1145 | + # Closing strong marker: |
|
| 1146 | + for ($i = 0; $i < 2; ++$i) { |
|
| 1147 | + $shifted_token = array_shift($token_stack); |
|
| 1148 | + $tag = strlen($shifted_token) == 2 ? "strong" : "em"; |
|
| 1149 | + $span = array_shift($text_stack); |
|
| 1150 | + $span = $this->runSpanGamut($span); |
|
| 1151 | + $span = "<$tag>$span</$tag>"; |
|
| 1152 | + $text_stack[0] .= $this->hashPart($span); |
|
| 1153 | + $$tag = ''; # $$tag stands for $em or $strong |
|
| 1154 | + } |
|
| 1155 | + } else { |
|
| 1156 | + # Reached opening three-char emphasis marker. Push on token |
|
| 1157 | + # stack; will be handled by the special condition above. |
|
| 1158 | + $em = $token{0}; |
|
| 1159 | + $strong = "$em$em"; |
|
| 1160 | + array_unshift($token_stack, $token); |
|
| 1161 | + array_unshift($text_stack, ''); |
|
| 1162 | + $tree_char_em = true; |
|
| 1163 | + } |
|
| 1164 | + } else if ($token_len == 2) { |
|
| 1165 | + if ($strong) { |
|
| 1166 | + # Unwind any dangling emphasis marker: |
|
| 1167 | + if (strlen($token_stack[0]) == 1) { |
|
| 1168 | + $text_stack[1] .= array_shift($token_stack); |
|
| 1169 | + $text_stack[0] .= array_shift($text_stack); |
|
| 1170 | + } |
|
| 1171 | + # Closing strong marker: |
|
| 1172 | + array_shift($token_stack); |
|
| 1173 | + $span = array_shift($text_stack); |
|
| 1174 | + $span = $this->runSpanGamut($span); |
|
| 1175 | + $span = "<strong>$span</strong>"; |
|
| 1176 | + $text_stack[0] .= $this->hashPart($span); |
|
| 1177 | + $strong = ''; |
|
| 1178 | + } else { |
|
| 1179 | + array_unshift($token_stack, $token); |
|
| 1180 | + array_unshift($text_stack, ''); |
|
| 1181 | + $strong = $token; |
|
| 1182 | + } |
|
| 1183 | + } else { |
|
| 1184 | + # Here $token_len == 1 |
|
| 1185 | + if ($em) { |
|
| 1186 | + if (strlen($token_stack[0]) == 1) { |
|
| 1187 | + # Closing emphasis marker: |
|
| 1188 | + array_shift($token_stack); |
|
| 1189 | + $span = array_shift($text_stack); |
|
| 1190 | + $span = $this->runSpanGamut($span); |
|
| 1191 | + $span = "<em>$span</em>"; |
|
| 1192 | + $text_stack[0] .= $this->hashPart($span); |
|
| 1193 | + $em = ''; |
|
| 1194 | + } else { |
|
| 1195 | + $text_stack[0] .= $token; |
|
| 1196 | + } |
|
| 1197 | + } else { |
|
| 1198 | + array_unshift($token_stack, $token); |
|
| 1199 | + array_unshift($text_stack, ''); |
|
| 1200 | + $em = $token; |
|
| 1201 | + } |
|
| 1202 | + } |
|
| 1203 | + } |
|
| 1204 | + return $text_stack[0]; |
|
| 1205 | + } |
|
| 1206 | + |
|
| 1207 | + |
|
| 1208 | + protected function doBlockQuotes($text) { |
|
| 1209 | + $text = preg_replace_callback('/ |
|
| 1210 | 1210 | ( # Wrap whole match in $1 |
| 1211 | 1211 | (?> |
| 1212 | 1212 | ^[ ]*>[ ]? # ">" at the start of a line |
@@ -1216,58 +1216,58 @@ discard block |
||
| 1216 | 1216 | )+ |
| 1217 | 1217 | ) |
| 1218 | 1218 | /xm', |
| 1219 | - array($this, '_doBlockQuotes_callback'), $text); |
|
| 1220 | - |
|
| 1221 | - return $text; |
|
| 1222 | - } |
|
| 1223 | - protected function _doBlockQuotes_callback($matches) { |
|
| 1224 | - $bq = $matches[1]; |
|
| 1225 | - # trim one level of quoting - trim whitespace-only lines |
|
| 1226 | - $bq = preg_replace('/^[ ]*>[ ]?|^[ ]+$/m', '', $bq); |
|
| 1227 | - $bq = $this->runBlockGamut($bq); # recurse |
|
| 1228 | - |
|
| 1229 | - $bq = preg_replace('/^/m', " ", $bq); |
|
| 1230 | - # These leading spaces cause problem with <pre> content, |
|
| 1231 | - # so we need to fix that: |
|
| 1232 | - $bq = preg_replace_callback('{(\s*<pre>.+?</pre>)}sx', |
|
| 1233 | - array($this, '_doBlockQuotes_callback2'), $bq); |
|
| 1234 | - |
|
| 1235 | - return "\n". $this->hashBlock("<blockquote>\n$bq\n</blockquote>")."\n\n"; |
|
| 1236 | - } |
|
| 1237 | - protected function _doBlockQuotes_callback2($matches) { |
|
| 1238 | - $pre = $matches[1]; |
|
| 1239 | - $pre = preg_replace('/^ /m', '', $pre); |
|
| 1240 | - return $pre; |
|
| 1241 | - } |
|
| 1242 | - |
|
| 1243 | - |
|
| 1244 | - protected function formParagraphs($text) { |
|
| 1245 | - # |
|
| 1246 | - # Params: |
|
| 1247 | - # $text - string to process with html <p> tags |
|
| 1248 | - # |
|
| 1249 | - # Strip leading and trailing lines: |
|
| 1250 | - $text = preg_replace('/\A\n+|\n+\z/', '', $text); |
|
| 1251 | - |
|
| 1252 | - $grafs = preg_split('/\n{2,}/', $text, -1, PREG_SPLIT_NO_EMPTY); |
|
| 1253 | - |
|
| 1254 | - # |
|
| 1255 | - # Wrap <p> tags and unhashify HTML blocks |
|
| 1256 | - # |
|
| 1257 | - foreach ($grafs as $key => $value) { |
|
| 1258 | - if (!preg_match('/^B\x1A[0-9]+B$/', $value)) { |
|
| 1259 | - # Is a paragraph. |
|
| 1260 | - $value = $this->runSpanGamut($value); |
|
| 1261 | - $value = preg_replace('/^([ ]*)/', "<p>", $value); |
|
| 1262 | - $value .= "</p>"; |
|
| 1263 | - $grafs[$key] = $this->unhash($value); |
|
| 1264 | - } |
|
| 1265 | - else { |
|
| 1266 | - # Is a block. |
|
| 1267 | - # Modify elements of @grafs in-place... |
|
| 1268 | - $graf = $value; |
|
| 1269 | - $block = $this->html_hashes[$graf]; |
|
| 1270 | - $graf = $block; |
|
| 1219 | + array($this, '_doBlockQuotes_callback'), $text); |
|
| 1220 | + |
|
| 1221 | + return $text; |
|
| 1222 | + } |
|
| 1223 | + protected function _doBlockQuotes_callback($matches) { |
|
| 1224 | + $bq = $matches[1]; |
|
| 1225 | + # trim one level of quoting - trim whitespace-only lines |
|
| 1226 | + $bq = preg_replace('/^[ ]*>[ ]?|^[ ]+$/m', '', $bq); |
|
| 1227 | + $bq = $this->runBlockGamut($bq); # recurse |
|
| 1228 | + |
|
| 1229 | + $bq = preg_replace('/^/m', " ", $bq); |
|
| 1230 | + # These leading spaces cause problem with <pre> content, |
|
| 1231 | + # so we need to fix that: |
|
| 1232 | + $bq = preg_replace_callback('{(\s*<pre>.+?</pre>)}sx', |
|
| 1233 | + array($this, '_doBlockQuotes_callback2'), $bq); |
|
| 1234 | + |
|
| 1235 | + return "\n". $this->hashBlock("<blockquote>\n$bq\n</blockquote>")."\n\n"; |
|
| 1236 | + } |
|
| 1237 | + protected function _doBlockQuotes_callback2($matches) { |
|
| 1238 | + $pre = $matches[1]; |
|
| 1239 | + $pre = preg_replace('/^ /m', '', $pre); |
|
| 1240 | + return $pre; |
|
| 1241 | + } |
|
| 1242 | + |
|
| 1243 | + |
|
| 1244 | + protected function formParagraphs($text) { |
|
| 1245 | + # |
|
| 1246 | + # Params: |
|
| 1247 | + # $text - string to process with html <p> tags |
|
| 1248 | + # |
|
| 1249 | + # Strip leading and trailing lines: |
|
| 1250 | + $text = preg_replace('/\A\n+|\n+\z/', '', $text); |
|
| 1251 | + |
|
| 1252 | + $grafs = preg_split('/\n{2,}/', $text, -1, PREG_SPLIT_NO_EMPTY); |
|
| 1253 | + |
|
| 1254 | + # |
|
| 1255 | + # Wrap <p> tags and unhashify HTML blocks |
|
| 1256 | + # |
|
| 1257 | + foreach ($grafs as $key => $value) { |
|
| 1258 | + if (!preg_match('/^B\x1A[0-9]+B$/', $value)) { |
|
| 1259 | + # Is a paragraph. |
|
| 1260 | + $value = $this->runSpanGamut($value); |
|
| 1261 | + $value = preg_replace('/^([ ]*)/', "<p>", $value); |
|
| 1262 | + $value .= "</p>"; |
|
| 1263 | + $grafs[$key] = $this->unhash($value); |
|
| 1264 | + } |
|
| 1265 | + else { |
|
| 1266 | + # Is a block. |
|
| 1267 | + # Modify elements of @grafs in-place... |
|
| 1268 | + $graf = $value; |
|
| 1269 | + $block = $this->html_hashes[$graf]; |
|
| 1270 | + $graf = $block; |
|
| 1271 | 1271 | // if (preg_match('{ |
| 1272 | 1272 | // \A |
| 1273 | 1273 | // ( # $1 = <div> tag |
@@ -1303,79 +1303,79 @@ discard block |
||
| 1303 | 1303 | // |
| 1304 | 1304 | // $graf = $div_open . "\n" . $div_content . "\n" . $div_close; |
| 1305 | 1305 | // } |
| 1306 | - $grafs[$key] = $graf; |
|
| 1307 | - } |
|
| 1308 | - } |
|
| 1309 | - |
|
| 1310 | - return implode("\n\n", $grafs); |
|
| 1311 | - } |
|
| 1312 | - |
|
| 1313 | - |
|
| 1314 | - protected function encodeAttribute($text) { |
|
| 1315 | - # |
|
| 1316 | - # Encode text for a double-quoted HTML attribute. This function |
|
| 1317 | - # is *not* suitable for attributes enclosed in single quotes. |
|
| 1318 | - # |
|
| 1319 | - $text = $this->encodeAmpsAndAngles($text); |
|
| 1320 | - $text = str_replace('"', '&quot;', $text); |
|
| 1321 | - return $text; |
|
| 1322 | - } |
|
| 1323 | - |
|
| 1324 | - |
|
| 1325 | - protected function encodeURLAttribute($url, &$text = null) { |
|
| 1326 | - # |
|
| 1327 | - # Encode text for a double-quoted HTML attribute containing a URL, |
|
| 1328 | - # applying the URL filter if set. Also generates the textual |
|
| 1329 | - # representation for the URL (removing mailto: or tel:) storing it in $text. |
|
| 1330 | - # This function is *not* suitable for attributes enclosed in single quotes. |
|
| 1331 | - # |
|
| 1332 | - if ($this->url_filter_func) |
|
| 1333 | - $url = call_user_func($this->url_filter_func, $url); |
|
| 1334 | - |
|
| 1335 | - if (preg_match('{^mailto:}i', $url)) |
|
| 1336 | - $url = $this->encodeEntityObfuscatedAttribute($url, $text, 7); |
|
| 1337 | - else if (preg_match('{^tel:}i', $url)) |
|
| 1338 | - { |
|
| 1339 | - $url = $this->encodeAttribute($url); |
|
| 1340 | - $text = substr($url, 4); |
|
| 1341 | - } |
|
| 1342 | - else |
|
| 1343 | - { |
|
| 1344 | - $url = $this->encodeAttribute($url); |
|
| 1345 | - $text = $url; |
|
| 1346 | - } |
|
| 1347 | - |
|
| 1348 | - return $url; |
|
| 1349 | - } |
|
| 1306 | + $grafs[$key] = $graf; |
|
| 1307 | + } |
|
| 1308 | + } |
|
| 1309 | + |
|
| 1310 | + return implode("\n\n", $grafs); |
|
| 1311 | + } |
|
| 1312 | + |
|
| 1313 | + |
|
| 1314 | + protected function encodeAttribute($text) { |
|
| 1315 | + # |
|
| 1316 | + # Encode text for a double-quoted HTML attribute. This function |
|
| 1317 | + # is *not* suitable for attributes enclosed in single quotes. |
|
| 1318 | + # |
|
| 1319 | + $text = $this->encodeAmpsAndAngles($text); |
|
| 1320 | + $text = str_replace('"', '&quot;', $text); |
|
| 1321 | + return $text; |
|
| 1322 | + } |
|
| 1323 | + |
|
| 1324 | + |
|
| 1325 | + protected function encodeURLAttribute($url, &$text = null) { |
|
| 1326 | + # |
|
| 1327 | + # Encode text for a double-quoted HTML attribute containing a URL, |
|
| 1328 | + # applying the URL filter if set. Also generates the textual |
|
| 1329 | + # representation for the URL (removing mailto: or tel:) storing it in $text. |
|
| 1330 | + # This function is *not* suitable for attributes enclosed in single quotes. |
|
| 1331 | + # |
|
| 1332 | + if ($this->url_filter_func) |
|
| 1333 | + $url = call_user_func($this->url_filter_func, $url); |
|
| 1334 | + |
|
| 1335 | + if (preg_match('{^mailto:}i', $url)) |
|
| 1336 | + $url = $this->encodeEntityObfuscatedAttribute($url, $text, 7); |
|
| 1337 | + else if (preg_match('{^tel:}i', $url)) |
|
| 1338 | + { |
|
| 1339 | + $url = $this->encodeAttribute($url); |
|
| 1340 | + $text = substr($url, 4); |
|
| 1341 | + } |
|
| 1342 | + else |
|
| 1343 | + { |
|
| 1344 | + $url = $this->encodeAttribute($url); |
|
| 1345 | + $text = $url; |
|
| 1346 | + } |
|
| 1347 | + |
|
| 1348 | + return $url; |
|
| 1349 | + } |
|
| 1350 | 1350 | |
| 1351 | 1351 | |
| 1352 | - protected function encodeAmpsAndAngles($text) { |
|
| 1353 | - # |
|
| 1354 | - # Smart processing for ampersands and angle brackets that need to |
|
| 1355 | - # be encoded. Valid character entities are left alone unless the |
|
| 1356 | - # no-entities mode is set. |
|
| 1357 | - # |
|
| 1358 | - if ($this->no_entities) { |
|
| 1359 | - $text = str_replace('&', '&', $text); |
|
| 1360 | - } else { |
|
| 1361 | - # Ampersand-encoding based entirely on Nat Irons's Amputator |
|
| 1362 | - # MT plugin: <http://bumppo.net/projects/amputator/> |
|
| 1363 | - $text = preg_replace('/&(?!#?[xX]?(?:[0-9a-fA-F]+|\w+);)/', |
|
| 1364 | - '&amp;', $text); |
|
| 1365 | - } |
|
| 1366 | - # Encode remaining <'s |
|
| 1367 | - $text = str_replace('<', '&lt;', $text); |
|
| 1368 | - |
|
| 1369 | - return $text; |
|
| 1370 | - } |
|
| 1371 | - |
|
| 1372 | - |
|
| 1373 | - protected function doAutoLinks($text) { |
|
| 1374 | - $text = preg_replace_callback('{<((https?|ftp|dict|tel):[^\'">\s]+)>}i', |
|
| 1375 | - array($this, '_doAutoLinks_url_callback'), $text); |
|
| 1376 | - |
|
| 1377 | - # Email addresses: <address@domain.foo> |
|
| 1378 | - $text = preg_replace_callback('{ |
|
| 1352 | + protected function encodeAmpsAndAngles($text) { |
|
| 1353 | + # |
|
| 1354 | + # Smart processing for ampersands and angle brackets that need to |
|
| 1355 | + # be encoded. Valid character entities are left alone unless the |
|
| 1356 | + # no-entities mode is set. |
|
| 1357 | + # |
|
| 1358 | + if ($this->no_entities) { |
|
| 1359 | + $text = str_replace('&', '&amp;', $text); |
|
| 1360 | + } else { |
|
| 1361 | + # Ampersand-encoding based entirely on Nat Irons's Amputator |
|
| 1362 | + # MT plugin: <http://bumppo.net/projects/amputator/> |
|
| 1363 | + $text = preg_replace('/&(?!#?[xX]?(?:[0-9a-fA-F]+|\w+);)/', |
|
| 1364 | + '&amp;', $text); |
|
| 1365 | + } |
|
| 1366 | + # Encode remaining <'s |
|
| 1367 | + $text = str_replace('<', '&lt;', $text); |
|
| 1368 | + |
|
| 1369 | + return $text; |
|
| 1370 | + } |
|
| 1371 | + |
|
| 1372 | + |
|
| 1373 | + protected function doAutoLinks($text) { |
|
| 1374 | + $text = preg_replace_callback('{<((https?|ftp|dict|tel):[^\'">\s]+)>}i', |
|
| 1375 | + array($this, '_doAutoLinks_url_callback'), $text); |
|
| 1376 | + |
|
| 1377 | + # Email addresses: <address@domain.foo> |
|
| 1378 | + $text = preg_replace_callback('{ |
|
| 1379 | 1379 | < |
| 1380 | 1380 | (?:mailto:)? |
| 1381 | 1381 | ( |
@@ -1393,76 +1393,76 @@ discard block |
||
| 1393 | 1393 | ) |
| 1394 | 1394 | > |
| 1395 | 1395 | }xi', |
| 1396 | - array($this, '_doAutoLinks_email_callback'), $text); |
|
| 1397 | - |
|
| 1398 | - return $text; |
|
| 1399 | - } |
|
| 1400 | - protected function _doAutoLinks_url_callback($matches) { |
|
| 1401 | - $url = $this->encodeURLAttribute($matches[1], $text); |
|
| 1402 | - $link = "<a href=\"$url\">$text</a>"; |
|
| 1403 | - return $this->hashPart($link); |
|
| 1404 | - } |
|
| 1405 | - protected function _doAutoLinks_email_callback($matches) { |
|
| 1406 | - $addr = $matches[1]; |
|
| 1407 | - $url = $this->encodeURLAttribute("mailto:$addr", $text); |
|
| 1408 | - $link = "<a href=\"$url\">$text</a>"; |
|
| 1409 | - return $this->hashPart($link); |
|
| 1410 | - } |
|
| 1411 | - |
|
| 1412 | - |
|
| 1413 | - protected function encodeEntityObfuscatedAttribute($text, &$tail = null, $head_length = 0) { |
|
| 1414 | - # |
|
| 1415 | - # Input: some text to obfuscate, e.g. "mailto:foo@example.com" |
|
| 1416 | - # |
|
| 1417 | - # Output: the same text but with most characters encoded as either a |
|
| 1418 | - # decimal or hex entity, in the hopes of foiling most address |
|
| 1419 | - # harvesting spam bots. E.g.: |
|
| 1420 | - # |
|
| 1421 | - # &#109;&#x61;&#105;&#x6c;&#x74;&#x6f;&#58;&#x66;o&#111; |

| 1422 | - # &#x40;&#101;&#x78;&#97;&#x6d;&#112;&#x6c;&#101;&#46;&#x63;&#111; |

| 1423 | - # &#x6d; |
|
| 1424 | - # |
|
| 1425 | - # Note: the additional output $tail is assigned the same value as the |
|
| 1426 | - # ouput, minus the number of characters specified by $head_length. |
|
| 1427 | - # |
|
| 1428 | - # Based by a filter by Matthew Wickline, posted to BBEdit-Talk. |
|
| 1429 | - # With some optimizations by Milian Wolff. Forced encoding of HTML |
|
| 1430 | - # attribute special characters by Allan Odgaard. |
|
| 1431 | - # |
|
| 1432 | - if ($text == "") return $tail = ""; |
|
| 1433 | - |
|
| 1434 | - $chars = preg_split('/(?<!^)(?!$)/', $text); |
|
| 1435 | - $seed = (int)abs(crc32($text) / strlen($text)); # Deterministic seed. |
|
| 1436 | - |
|
| 1437 | - foreach ($chars as $key => $char) { |
|
| 1438 | - $ord = ord($char); |
|
| 1439 | - # Ignore non-ascii chars. |
|
| 1440 | - if ($ord < 128) { |
|
| 1441 | - $r = ($seed * (1 + $key)) % 100; # Pseudo-random function. |
|
| 1442 | - # roughly 10% raw, 45% hex, 45% dec |
|
| 1443 | - # '@' *must* be encoded. I insist. |
|
| 1444 | - # '"' and '>' have to be encoded inside the attribute |
|
| 1445 | - if ($r > 90 && strpos('@"&>', $char) === false) /* do nothing */; |
|
| 1446 | - else if ($r < 45) $chars[$key] = '&#x'.dechex($ord).';'; |
|
| 1447 | - else $chars[$key] = '&#'.$ord.';'; |
|
| 1448 | - } |
|
| 1449 | - } |
|
| 1450 | - |
|
| 1451 | - $text = implode('', $chars); |
|
| 1452 | - $tail = $head_length ? implode('', array_slice($chars, $head_length)) : $text; |
|
| 1453 | - |
|
| 1454 | - return $text; |
|
| 1455 | - } |
|
| 1456 | - |
|
| 1457 | - |
|
| 1458 | - protected function parseSpan($str) { |
|
| 1459 | - # |
|
| 1460 | - # Take the string $str and parse it into tokens, hashing embeded HTML, |
|
| 1461 | - # escaped characters and handling code spans. |
|
| 1462 | - # |
|
| 1463 | - $output = ''; |
|
| 1396 | + array($this, '_doAutoLinks_email_callback'), $text); |
|
| 1397 | + |
|
| 1398 | + return $text; |
|
| 1399 | + } |
|
| 1400 | + protected function _doAutoLinks_url_callback($matches) { |
|
| 1401 | + $url = $this->encodeURLAttribute($matches[1], $text); |
|
| 1402 | + $link = "<a href=\"$url\">$text</a>"; |
|
| 1403 | + return $this->hashPart($link); |
|
| 1404 | + } |
|
| 1405 | + protected function _doAutoLinks_email_callback($matches) { |
|
| 1406 | + $addr = $matches[1]; |
|
| 1407 | + $url = $this->encodeURLAttribute("mailto:$addr", $text); |
|
| 1408 | + $link = "<a href=\"$url\">$text</a>"; |
|
| 1409 | + return $this->hashPart($link); |
|
| 1410 | + } |
|
| 1411 | + |
|
| 1412 | + |
|
| 1413 | + protected function encodeEntityObfuscatedAttribute($text, &$tail = null, $head_length = 0) { |
|
| 1414 | + # |
|
| 1415 | + # Input: some text to obfuscate, e.g. "mailto:foo@example.com" |
|
| 1416 | + # |
|
| 1417 | + # Output: the same text but with most characters encoded as either a |
|
| 1418 | + # decimal or hex entity, in the hopes of foiling most address |
|
| 1419 | + # harvesting spam bots. E.g.: |
|
| 1420 | + # |
|
| 1421 | + # &#109;&#x61;&#105;&#x6c;&#x74;&#x6f;&#58;&#x66;o&#111; |

| 1422 | + # &#x40;&#101;&#x78;&#97;&#x6d;&#112;&#x6c;&#101;&#46;&#x63;&#111; |

| 1423 | + # &#x6d; |
|
| 1424 | + # |
|
| 1425 | + # Note: the additional output $tail is assigned the same value as the |
|
| 1426 | + # ouput, minus the number of characters specified by $head_length. |
|
| 1427 | + # |
|
| 1428 | + # Based by a filter by Matthew Wickline, posted to BBEdit-Talk. |
|
| 1429 | + # With some optimizations by Milian Wolff. Forced encoding of HTML |
|
| 1430 | + # attribute special characters by Allan Odgaard. |
|
| 1431 | + # |
|
| 1432 | + if ($text == "") return $tail = ""; |
|
| 1433 | + |
|
| 1434 | + $chars = preg_split('/(?<!^)(?!$)/', $text); |
|
| 1435 | + $seed = (int)abs(crc32($text) / strlen($text)); # Deterministic seed. |
|
| 1436 | + |
|
| 1437 | + foreach ($chars as $key => $char) { |
|
| 1438 | + $ord = ord($char); |
|
| 1439 | + # Ignore non-ascii chars. |
|
| 1440 | + if ($ord < 128) { |
|
| 1441 | + $r = ($seed * (1 + $key)) % 100; # Pseudo-random function. |
|
| 1442 | + # roughly 10% raw, 45% hex, 45% dec |
|
| 1443 | + # '@' *must* be encoded. I insist. |
|
| 1444 | + # '"' and '>' have to be encoded inside the attribute |
|
| 1445 | + if ($r > 90 && strpos('@"&>', $char) === false) /* do nothing */; |
|
| 1446 | + else if ($r < 45) $chars[$key] = '&#x'.dechex($ord).';'; |
|
| 1447 | + else $chars[$key] = '&#'.$ord.';'; |
|
| 1448 | + } |
|
| 1449 | + } |
|
| 1450 | + |
|
| 1451 | + $text = implode('', $chars); |
|
| 1452 | + $tail = $head_length ? implode('', array_slice($chars, $head_length)) : $text; |
|
| 1453 | + |
|
| 1454 | + return $text; |
|
| 1455 | + } |
|
| 1456 | + |
|
| 1457 | + |
|
| 1458 | + protected function parseSpan($str) { |
|
| 1459 | + # |
|
| 1460 | + # Take the string $str and parse it into tokens, hashing embeded HTML, |
|
| 1461 | + # escaped characters and handling code spans. |
|
| 1462 | + # |
|
| 1463 | + $output = ''; |
|
| 1464 | 1464 | |
| 1465 | - $span_re = '{ |
|
| 1465 | + $span_re = '{ |
|
| 1466 | 1466 | ( |
| 1467 | 1467 | \\\\'.$this->escape_chars_re.' |
| 1468 | 1468 | | |
@@ -1488,122 +1488,122 @@ discard block |
||
| 1488 | 1488 | ) |
| 1489 | 1489 | }xs'; |
| 1490 | 1490 | |
| 1491 | - while (1) { |
|
| 1492 | - # |
|
| 1493 | - # Each loop iteration seach for either the next tag, the next |
|
| 1494 | - # openning code span marker, or the next escaped character. |
|
| 1495 | - # Each token is then passed to handleSpanToken. |
|
| 1496 | - # |
|
| 1497 | - $parts = preg_split($span_re, $str, 2, PREG_SPLIT_DELIM_CAPTURE); |
|
| 1491 | + while (1) { |
|
| 1492 | + # |
|
| 1493 | + # Each loop iteration seach for either the next tag, the next |
|
| 1494 | + # openning code span marker, or the next escaped character. |
|
| 1495 | + # Each token is then passed to handleSpanToken. |
|
| 1496 | + # |
|
| 1497 | + $parts = preg_split($span_re, $str, 2, PREG_SPLIT_DELIM_CAPTURE); |
|
| 1498 | 1498 | |
| 1499 | - # Create token from text preceding tag. |
|
| 1500 | - if ($parts[0] != "") { |
|
| 1501 | - $output .= $parts[0]; |
|
| 1502 | - } |
|
| 1499 | + # Create token from text preceding tag. |
|
| 1500 | + if ($parts[0] != "") { |
|
| 1501 | + $output .= $parts[0]; |
|
| 1502 | + } |
|
| 1503 | 1503 | |
| 1504 | - # Check if we reach the end. |
|
| 1505 | - if (isset($parts[1])) { |
|
| 1506 | - $output .= $this->handleSpanToken($parts[1], $parts[2]); |
|
| 1507 | - $str = $parts[2]; |
|
| 1508 | - } |
|
| 1509 | - else { |
|
| 1510 | - break; |
|
| 1511 | - } |
|
| 1512 | - } |
|
| 1504 | + # Check if we reach the end. |
|
| 1505 | + if (isset($parts[1])) { |
|
| 1506 | + $output .= $this->handleSpanToken($parts[1], $parts[2]); |
|
| 1507 | + $str = $parts[2]; |
|
| 1508 | + } |
|
| 1509 | + else { |
|
| 1510 | + break; |
|
| 1511 | + } |
|
| 1512 | + } |
|
| 1513 | 1513 | |
| 1514 | - return $output; |
|
| 1515 | - } |
|
| 1514 | + return $output; |
|
| 1515 | + } |
|
| 1516 | 1516 | |
| 1517 | 1517 | |
| 1518 | - protected function handleSpanToken($token, &$str) { |
|
| 1519 | - # |
|
| 1520 | - # Handle $token provided by parseSpan by determining its nature and |
|
| 1521 | - # returning the corresponding value that should replace it. |
|
| 1522 | - # |
|
| 1523 | - switch ($token{0}) { |
|
| 1524 | - case "\\": |
|
| 1525 | - return $this->hashPart("&#". ord($token{1}). ";"); |
|
| 1526 | - case "`": |
|
| 1527 | - # Search for end marker in remaining text. |
|
| 1528 | - if (preg_match('/^(.*?[^`])'.preg_quote($token).'(?!`)(.*)$/sm', |
|
| 1529 | - $str, $matches)) |
|
| 1530 | - { |
|
| 1531 | - $str = $matches[2]; |
|
| 1532 | - $codespan = $this->makeCodeSpan($matches[1]); |
|
| 1533 | - return $this->hashPart($codespan); |
|
| 1534 | - } |
|
| 1535 | - return $token; // return as text since no ending marker found. |
|
| 1536 | - default: |
|
| 1537 | - return $this->hashPart($token); |
|
| 1538 | - } |
|
| 1539 | - } |
|
| 1540 | - |
|
| 1541 | - |
|
| 1542 | - protected function outdent($text) { |
|
| 1543 | - # |
|
| 1544 | - # Remove one level of line-leading tabs or spaces |
|
| 1545 | - # |
|
| 1546 | - return preg_replace('/^(\t|[ ]{1,'.$this->tab_width.'})/m', '', $text); |
|
| 1547 | - } |
|
| 1548 | - |
|
| 1549 | - |
|
| 1550 | - # String length function for detab. `_initDetab` will create a function to |
|
| 1551 | - # hanlde UTF-8 if the default function does not exist. |
|
| 1552 | - protected $utf8_strlen = 'mb_strlen'; |
|
| 1518 | + protected function handleSpanToken($token, &$str) { |
|
| 1519 | + # |
|
| 1520 | + # Handle $token provided by parseSpan by determining its nature and |
|
| 1521 | + # returning the corresponding value that should replace it. |
|
| 1522 | + # |
|
| 1523 | + switch ($token{0}) { |
|
| 1524 | + case "\\": |
|
| 1525 | + return $this->hashPart("&#". ord($token{1}). ";"); |
|
| 1526 | + case "`": |
|
| 1527 | + # Search for end marker in remaining text. |
|
| 1528 | + if (preg_match('/^(.*?[^`])'.preg_quote($token).'(?!`)(.*)$/sm', |
|
| 1529 | + $str, $matches)) |
|
| 1530 | + { |
|
| 1531 | + $str = $matches[2]; |
|
| 1532 | + $codespan = $this->makeCodeSpan($matches[1]); |
|
| 1533 | + return $this->hashPart($codespan); |
|
| 1534 | + } |
|
| 1535 | + return $token; // return as text since no ending marker found. |
|
| 1536 | + default: |
|
| 1537 | + return $this->hashPart($token); |
|
| 1538 | + } |
|
| 1539 | + } |
|
| 1540 | + |
|
| 1541 | + |
|
| 1542 | + protected function outdent($text) { |
|
| 1543 | + # |
|
| 1544 | + # Remove one level of line-leading tabs or spaces |
|
| 1545 | + # |
|
| 1546 | + return preg_replace('/^(\t|[ ]{1,'.$this->tab_width.'})/m', '', $text); |
|
| 1547 | + } |
|
| 1548 | + |
|
| 1549 | + |
|
| 1550 | + # String length function for detab. `_initDetab` will create a function to |
|
| 1551 | + # hanlde UTF-8 if the default function does not exist. |
|
| 1552 | + protected $utf8_strlen = 'mb_strlen'; |
|
| 1553 | 1553 | |
| 1554 | - protected function detab($text) { |
|
| 1555 | - # |
|
| 1556 | - # Replace tabs with the appropriate amount of space. |
|
| 1557 | - # |
|
| 1558 | - # For each line we separate the line in blocks delemited by |
|
| 1559 | - # tab characters. Then we reconstruct every line by adding the |
|
| 1560 | - # appropriate number of space between each blocks. |
|
| 1554 | + protected function detab($text) { |
|
| 1555 | + # |
|
| 1556 | + # Replace tabs with the appropriate amount of space. |
|
| 1557 | + # |
|
| 1558 | + # For each line we separate the line in blocks delemited by |
|
| 1559 | + # tab characters. Then we reconstruct every line by adding the |
|
| 1560 | + # appropriate number of space between each blocks. |
|
| 1561 | 1561 | |
| 1562 | - $text = preg_replace_callback('/^.*\t.*$/m', |
|
| 1563 | - array($this, '_detab_callback'), $text); |
|
| 1564 | - |
|
| 1565 | - return $text; |
|
| 1566 | - } |
|
| 1567 | - protected function _detab_callback($matches) { |
|
| 1568 | - $line = $matches[0]; |
|
| 1569 | - $strlen = $this->utf8_strlen; # strlen function for UTF-8. |
|
| 1562 | + $text = preg_replace_callback('/^.*\t.*$/m', |
|
| 1563 | + array($this, '_detab_callback'), $text); |
|
| 1564 | + |
|
| 1565 | + return $text; |
|
| 1566 | + } |
|
| 1567 | + protected function _detab_callback($matches) { |
|
| 1568 | + $line = $matches[0]; |
|
| 1569 | + $strlen = $this->utf8_strlen; # strlen function for UTF-8. |
|
| 1570 | 1570 | |
| 1571 | - # Split in blocks. |
|
| 1572 | - $blocks = explode("\t", $line); |
|
| 1573 | - # Add each blocks to the line. |
|
| 1574 | - $line = $blocks[0]; |
|
| 1575 | - unset($blocks[0]); # Do not add first block twice. |
|
| 1576 | - foreach ($blocks as $block) { |
|
| 1577 | - # Calculate amount of space, insert spaces, insert block. |
|
| 1578 | - $amount = $this->tab_width - |
|
| 1579 | - $strlen($line, 'UTF-8') % $this->tab_width; |
|
| 1580 | - $line .= str_repeat(" ", $amount) . $block; |
|
| 1581 | - } |
|
| 1582 | - return $line; |
|
| 1583 | - } |
|
| 1584 | - protected function _initDetab() { |
|
| 1585 | - # |
|
| 1586 | - # Check for the availability of the function in the `utf8_strlen` property |
|
| 1587 | - # (initially `mb_strlen`). If the function is not available, create a |
|
| 1588 | - # function that will loosely count the number of UTF-8 characters with a |
|
| 1589 | - # regular expression. |
|
| 1590 | - # |
|
| 1591 | - if (function_exists($this->utf8_strlen)) return; |
|
| 1592 | - $this->utf8_strlen = create_function('$text', 'return preg_match_all( |
|
| 1571 | + # Split in blocks. |
|
| 1572 | + $blocks = explode("\t", $line); |
|
| 1573 | + # Add each blocks to the line. |
|
| 1574 | + $line = $blocks[0]; |
|
| 1575 | + unset($blocks[0]); # Do not add first block twice. |
|
| 1576 | + foreach ($blocks as $block) { |
|
| 1577 | + # Calculate amount of space, insert spaces, insert block. |
|
| 1578 | + $amount = $this->tab_width - |
|
| 1579 | + $strlen($line, 'UTF-8') % $this->tab_width; |
|
| 1580 | + $line .= str_repeat(" ", $amount) . $block; |
|
| 1581 | + } |
|
| 1582 | + return $line; |
|
| 1583 | + } |
|
| 1584 | + protected function _initDetab() { |
|
| 1585 | + # |
|
| 1586 | + # Check for the availability of the function in the `utf8_strlen` property |
|
| 1587 | + # (initially `mb_strlen`). If the function is not available, create a |
|
| 1588 | + # function that will loosely count the number of UTF-8 characters with a |
|
| 1589 | + # regular expression. |
|
| 1590 | + # |
|
| 1591 | + if (function_exists($this->utf8_strlen)) return; |
|
| 1592 | + $this->utf8_strlen = create_function('$text', 'return preg_match_all( |
|
| 1593 | 1593 | "/[\\\\x00-\\\\xBF]|[\\\\xC0-\\\\xFF][\\\\x80-\\\\xBF]*/", |
| 1594 | 1594 | $text, $m);'); |
| 1595 | - } |
|
| 1596 | - |
|
| 1597 | - |
|
| 1598 | - protected function unhash($text) { |
|
| 1599 | - # |
|
| 1600 | - # Swap back in all the tags hashed by _HashHTMLBlocks. |
|
| 1601 | - # |
|
| 1602 | - return preg_replace_callback('/(.)\x1A[0-9]+\1/', |
|
| 1603 | - array($this, '_unhash_callback'), $text); |
|
| 1604 | - } |
|
| 1605 | - protected function _unhash_callback($matches) { |
|
| 1606 | - return $this->html_hashes[$matches[0]]; |
|
| 1607 | - } |
|
| 1595 | + } |
|
| 1596 | + |
|
| 1597 | + |
|
| 1598 | + protected function unhash($text) { |
|
| 1599 | + # |
|
| 1600 | + # Swap back in all the tags hashed by _HashHTMLBlocks. |
|
| 1601 | + # |
|
| 1602 | + return preg_replace_callback('/(.)\x1A[0-9]+\1/', |
|
| 1603 | + array($this, '_unhash_callback'), $text); |
|
| 1604 | + } |
|
| 1605 | + protected function _unhash_callback($matches) { |
|
| 1606 | + return $this->html_hashes[$matches[0]]; |
|
| 1607 | + } |
|
| 1608 | 1608 | |
| 1609 | 1609 | } |
@@ -21,7 +21,7 @@ discard block |
||
| 21 | 21 | |
| 22 | 22 | ### Version ### |
| 23 | 23 | |
| 24 | - const MARKDOWNLIB_VERSION = "1.5.0"; |
|
| 24 | + const MARKDOWNLIB_VERSION = "1.5.0"; |
|
| 25 | 25 | |
| 26 | 26 | ### Simple Function Interface ### |
| 27 | 27 | |
@@ -35,7 +35,7 @@ discard block |
||
| 35 | 35 | |
| 36 | 36 | # try to take parser from the static parser list |
| 37 | 37 | static $parser_list; |
| 38 | - $parser =& $parser_list[$parser_class]; |
|
| 38 | + $parser = & $parser_list[$parser_class]; |
|
| 39 | 39 | |
| 40 | 40 | # create the parser it not already set |
| 41 | 41 | if (!$parser) |
@@ -186,7 +186,7 @@ discard block |
||
| 186 | 186 | |
| 187 | 187 | $this->teardown(); |
| 188 | 188 | |
| 189 | - return $text . "\n"; |
|
| 189 | + return $text."\n"; |
|
| 190 | 190 | } |
| 191 | 191 | |
| 192 | 192 | protected $document_gamut = array( |
@@ -235,7 +235,7 @@ discard block |
||
| 235 | 235 | $link_id = strtolower($matches[1]); |
| 236 | 236 | $url = $matches[2] == '' ? $matches[3] : $matches[2]; |
| 237 | 237 | $this->urls[$link_id] = $url; |
| 238 | - $this->titles[$link_id] =& $matches[4]; |
|
| 238 | + $this->titles[$link_id] = & $matches[4]; |
|
| 239 | 239 | return ''; # String that will replace the block |
| 240 | 240 | } |
| 241 | 241 | |
@@ -290,8 +290,8 @@ discard block |
||
| 290 | 290 | (?> |
| 291 | 291 | /> |
| 292 | 292 | | |
| 293 | - >', $nested_tags_level). # end of opening tag |
|
| 294 | - '.*?'. # last level nested tag content |
|
| 293 | + >', $nested_tags_level).# end of opening tag |
|
| 294 | + '.*?'.# last level nested tag content |
|
| 295 | 295 | str_repeat(' |
| 296 | 296 | </\2\s*> # closing nested tag |
| 297 | 297 | ) |
@@ -403,7 +403,7 @@ discard block |
||
| 403 | 403 | |
| 404 | 404 | # Then hash the block. |
| 405 | 405 | static $i = 0; |
| 406 | - $key = "$boundary\x1A" . ++$i . $boundary; |
|
| 406 | + $key = "$boundary\x1A".++$i.$boundary; |
|
| 407 | 407 | $this->html_hashes[$key] = $text; |
| 408 | 408 | return $key; # String that will replace the tag. |
| 409 | 409 | } |
@@ -596,9 +596,9 @@ discard block |
||
| 596 | 596 | return $text; |
| 597 | 597 | } |
| 598 | 598 | protected function _doAnchors_reference_callback($matches) { |
| 599 | - $whole_match = $matches[1]; |
|
| 600 | - $link_text = $matches[2]; |
|
| 601 | - $link_id =& $matches[3]; |
|
| 599 | + $whole_match = $matches[1]; |
|
| 600 | + $link_text = $matches[2]; |
|
| 601 | + $link_id = & $matches[3]; |
|
| 602 | 602 | |
| 603 | 603 | if ($link_id == "") { |
| 604 | 604 | # for shortcut links like [this][] or [this]. |
@@ -614,10 +614,10 @@ discard block |
||
| 614 | 614 | $url = $this->encodeURLAttribute($url); |
| 615 | 615 | |
| 616 | 616 | $result = "<a href=\"$url\""; |
| 617 | - if ( isset( $this->titles[$link_id] ) ) { |
|
| 617 | + if (isset($this->titles[$link_id])) { |
|
| 618 | 618 | $title = $this->titles[$link_id]; |
| 619 | 619 | $title = $this->encodeAttribute($title); |
| 620 | - $result .= " title=\"$title\""; |
|
| 620 | + $result .= " title=\"$title\""; |
|
| 621 | 621 | } |
| 622 | 622 | |
| 623 | 623 | $link_text = $this->runSpanGamut($link_text); |
@@ -630,10 +630,10 @@ discard block |
||
| 630 | 630 | return $result; |
| 631 | 631 | } |
| 632 | 632 | protected function _doAnchors_inline_callback($matches) { |
| 633 | - $whole_match = $matches[1]; |
|
| 634 | - $link_text = $this->runSpanGamut($matches[2]); |
|
| 635 | - $url = $matches[3] == '' ? $matches[4] : $matches[3]; |
|
| 636 | - $title =& $matches[7]; |
|
| 633 | + $whole_match = $matches[1]; |
|
| 634 | + $link_text = $this->runSpanGamut($matches[2]); |
|
| 635 | + $url = $matches[3] == '' ? $matches[4] : $matches[3]; |
|
| 636 | + $title = & $matches[7]; |
|
| 637 | 637 | |
| 638 | 638 | // if the URL was of the form <s p a c e s> it got caught by the HTML |
| 639 | 639 | // tag parser and hashed. Need to reverse the process before using the URL. |
@@ -646,7 +646,7 @@ discard block |
||
| 646 | 646 | $result = "<a href=\"$url\""; |
| 647 | 647 | if (isset($title)) { |
| 648 | 648 | $title = $this->encodeAttribute($title); |
| 649 | - $result .= " title=\"$title\""; |
|
| 649 | + $result .= " title=\"$title\""; |
|
| 650 | 650 | } |
| 651 | 651 | |
| 652 | 652 | $link_text = $this->runSpanGamut($link_text); |
@@ -727,7 +727,7 @@ discard block |
||
| 727 | 727 | if (isset($this->titles[$link_id])) { |
| 728 | 728 | $title = $this->titles[$link_id]; |
| 729 | 729 | $title = $this->encodeAttribute($title); |
| 730 | - $result .= " title=\"$title\""; |
|
| 730 | + $result .= " title=\"$title\""; |
|
| 731 | 731 | } |
| 732 | 732 | $result .= $this->empty_element_suffix; |
| 733 | 733 | $result = $this->hashPart($result); |
@@ -740,17 +740,17 @@ discard block |
||
| 740 | 740 | return $result; |
| 741 | 741 | } |
| 742 | 742 | protected function _doImages_inline_callback($matches) { |
| 743 | - $whole_match = $matches[1]; |
|
| 744 | - $alt_text = $matches[2]; |
|
| 745 | - $url = $matches[3] == '' ? $matches[4] : $matches[3]; |
|
| 746 | - $title =& $matches[7]; |
|
| 743 | + $whole_match = $matches[1]; |
|
| 744 | + $alt_text = $matches[2]; |
|
| 745 | + $url = $matches[3] == '' ? $matches[4] : $matches[3]; |
|
| 746 | + $title = & $matches[7]; |
|
| 747 | 747 | |
| 748 | 748 | $alt_text = $this->encodeAttribute($alt_text); |
| 749 | 749 | $url = $this->encodeURLAttribute($url); |
| 750 | 750 | $result = "<img src=\"$url\" alt=\"$alt_text\""; |
| 751 | 751 | if (isset($title)) { |
| 752 | 752 | $title = $this->encodeAttribute($title); |
| 753 | - $result .= " title=\"$title\""; # $title already quoted |
|
| 753 | + $result .= " title=\"$title\""; # $title already quoted |
|
| 754 | 754 | } |
| 755 | 755 | $result .= $this->empty_element_suffix; |
| 756 | 756 | |
@@ -800,7 +800,7 @@ discard block |
||
| 800 | 800 | $idAtt = $this->_generateIdFromHeaderValue($matches[1]); |
| 801 | 801 | |
| 802 | 802 | $block = "<h$level$idAtt>".$this->runSpanGamut($matches[1])."</h$level>"; |
| 803 | - return "\n" . $this->hashBlock($block) . "\n\n"; |
|
| 803 | + return "\n".$this->hashBlock($block)."\n\n"; |
|
| 804 | 804 | } |
| 805 | 805 | protected function _doHeaders_callback_atx($matches) { |
| 806 | 806 | |
@@ -809,7 +809,7 @@ discard block |
||
| 809 | 809 | |
| 810 | 810 | $level = strlen($matches[1]); |
| 811 | 811 | $block = "<h$level$idAtt>".$this->runSpanGamut($matches[2])."</h$level>"; |
| 812 | - return "\n" . $this->hashBlock($block) . "\n\n"; |
|
| 812 | + return "\n".$this->hashBlock($block)."\n\n"; |
|
| 813 | 813 | } |
| 814 | 814 | |
| 815 | 815 | protected function _generateIdFromHeaderValue($headerValue) { |
@@ -825,7 +825,7 @@ discard block |
||
| 825 | 825 | $idValue = call_user_func($this->header_id_func, $headerValue); |
| 826 | 826 | if (!$idValue) return ""; |
| 827 | 827 | |
| 828 | - return ' id="' . $this->encodeAttribute($idValue) . '"'; |
|
| 828 | + return ' id="'.$this->encodeAttribute($idValue).'"'; |
|
| 829 | 829 | |
| 830 | 830 | } |
| 831 | 831 | |
@@ -904,7 +904,7 @@ discard block |
||
| 904 | 904 | $list = $matches[1]; |
| 905 | 905 | $list_type = preg_match("/$marker_ul_re/", $matches[4]) ? "ul" : "ol"; |
| 906 | 906 | |
| 907 | - $marker_any_re = ( $list_type == "ul" ? $marker_ul_re : $marker_ol_re ); |
|
| 907 | + $marker_any_re = ($list_type == "ul" ? $marker_ul_re : $marker_ol_re); |
|
| 908 | 908 | |
| 909 | 909 | $list .= "\n"; |
| 910 | 910 | $result = $this->processListItems($list, $marker_any_re); |
@@ -915,18 +915,18 @@ discard block |
||
| 915 | 915 | if ($list_type == 'ol') { |
| 916 | 916 | $ol_start_array = array(); |
| 917 | 917 | $ol_start_check = preg_match("/$marker_ol_start_re/", $matches[4], $ol_start_array); |
| 918 | - if ($ol_start_check){ |
|
| 918 | + if ($ol_start_check) { |
|
| 919 | 919 | $ol_start = $ol_start_array[0]; |
| 920 | 920 | } |
| 921 | 921 | } |
| 922 | 922 | } |
| 923 | 923 | |
| 924 | - if ($ol_start > 1 && $list_type == 'ol'){ |
|
| 925 | - $result = $this->hashBlock("<$list_type start=\"$ol_start\">\n" . $result . "</$list_type>"); |
|
| 924 | + if ($ol_start > 1 && $list_type == 'ol') { |
|
| 925 | + $result = $this->hashBlock("<$list_type start=\"$ol_start\">\n".$result."</$list_type>"); |
|
| 926 | 926 | } else { |
| 927 | - $result = $this->hashBlock("<$list_type>\n" . $result . "</$list_type>"); |
|
| 927 | + $result = $this->hashBlock("<$list_type>\n".$result."</$list_type>"); |
|
| 928 | 928 | } |
| 929 | - return "\n". $result ."\n\n"; |
|
| 929 | + return "\n".$result."\n\n"; |
|
| 930 | 930 | } |
| 931 | 931 | |
| 932 | 932 | protected $list_level = 0; |
@@ -979,16 +979,16 @@ discard block |
||
| 979 | 979 | } |
| 980 | 980 | protected function _processListItems_callback($matches) { |
| 981 | 981 | $item = $matches[4]; |
| 982 | - $leading_line =& $matches[1]; |
|
| 983 | - $leading_space =& $matches[2]; |
|
| 982 | + $leading_line = & $matches[1]; |
|
| 983 | + $leading_space = & $matches[2]; |
|
| 984 | 984 | $marker_space = $matches[3]; |
| 985 | - $tailing_blank_line =& $matches[5]; |
|
| 985 | + $tailing_blank_line = & $matches[5]; |
|
| 986 | 986 | |
| 987 | 987 | if ($leading_line || $tailing_blank_line || |
| 988 | 988 | preg_match('/\n{2,}/', $item)) |
| 989 | 989 | { |
| 990 | 990 | # Replace marker with the appropriate whitespace indentation |
| 991 | - $item = $leading_space . str_repeat(' ', strlen($marker_space)) . $item; |
|
| 991 | + $item = $leading_space.str_repeat(' ', strlen($marker_space)).$item; |
|
| 992 | 992 | $item = $this->runBlockGamut($this->outdent($item)."\n"); |
| 993 | 993 | } |
| 994 | 994 | else { |
@@ -998,7 +998,7 @@ discard block |
||
| 998 | 998 | $item = $this->runSpanGamut($item); |
| 999 | 999 | } |
| 1000 | 1000 | |
| 1001 | - return "<li>" . $item . "</li>\n"; |
|
| 1001 | + return "<li>".$item."</li>\n"; |
|
| 1002 | 1002 | } |
| 1003 | 1003 | |
| 1004 | 1004 | |
@@ -1076,7 +1076,7 @@ discard block |
||
| 1076 | 1076 | $token_relist[] = $strong_re; |
| 1077 | 1077 | |
| 1078 | 1078 | # Construct master expression from list. |
| 1079 | - $token_re = '{('. implode('|', $token_relist) .')}'; |
|
| 1079 | + $token_re = '{('.implode('|', $token_relist).')}'; |
|
| 1080 | 1080 | $this->em_strong_prepared_relist["$em$strong"] = $token_re; |
| 1081 | 1081 | } |
| 1082 | 1082 | } |
@@ -1102,8 +1102,8 @@ discard block |
||
| 1102 | 1102 | # |
| 1103 | 1103 | $parts = preg_split($token_re, $text, 2, PREG_SPLIT_DELIM_CAPTURE); |
| 1104 | 1104 | $text_stack[0] .= $parts[0]; |
| 1105 | - $token =& $parts[1]; |
|
| 1106 | - $text =& $parts[2]; |
|
| 1105 | + $token = & $parts[1]; |
|
| 1106 | + $text = & $parts[2]; |
|
| 1107 | 1107 | |
| 1108 | 1108 | if (empty($token)) { |
| 1109 | 1109 | # Reached end of text span: empty stack without emitting. |
@@ -1130,7 +1130,7 @@ discard block |
||
| 1130 | 1130 | } else { |
| 1131 | 1131 | # Other closing marker: close one em or strong and |
| 1132 | 1132 | # change current token state to match the other |
| 1133 | - $token_stack[0] = str_repeat($token{0}, 3-$token_len); |
|
| 1133 | + $token_stack[0] = str_repeat($token{0}, 3 - $token_len); |
|
| 1134 | 1134 | $tag = $token_len == 2 ? "strong" : "em"; |
| 1135 | 1135 | $span = $text_stack[0]; |
| 1136 | 1136 | $span = $this->runSpanGamut($span); |
@@ -1224,7 +1224,7 @@ discard block |
||
| 1224 | 1224 | $bq = $matches[1]; |
| 1225 | 1225 | # trim one level of quoting - trim whitespace-only lines |
| 1226 | 1226 | $bq = preg_replace('/^[ ]*>[ ]?|^[ ]+$/m', '', $bq); |
| 1227 | - $bq = $this->runBlockGamut($bq); # recurse |
|
| 1227 | + $bq = $this->runBlockGamut($bq); # recurse |
|
| 1228 | 1228 | |
| 1229 | 1229 | $bq = preg_replace('/^/m', " ", $bq); |
| 1230 | 1230 | # These leading spaces cause problem with <pre> content, |
@@ -1232,7 +1232,7 @@ discard block |
||
| 1232 | 1232 | $bq = preg_replace_callback('{(\s*<pre>.+?</pre>)}sx', |
| 1233 | 1233 | array($this, '_doBlockQuotes_callback2'), $bq); |
| 1234 | 1234 | |
| 1235 | - return "\n". $this->hashBlock("<blockquote>\n$bq\n</blockquote>")."\n\n"; |
|
| 1235 | + return "\n".$this->hashBlock("<blockquote>\n$bq\n</blockquote>")."\n\n"; |
|
| 1236 | 1236 | } |
| 1237 | 1237 | protected function _doBlockQuotes_callback2($matches) { |
| 1238 | 1238 | $pre = $matches[1]; |
@@ -1432,7 +1432,7 @@ discard block |
||
| 1432 | 1432 | if ($text == "") return $tail = ""; |
| 1433 | 1433 | |
| 1434 | 1434 | $chars = preg_split('/(?<!^)(?!$)/', $text); |
| 1435 | - $seed = (int)abs(crc32($text) / strlen($text)); # Deterministic seed. |
|
| 1435 | + $seed = (int) abs(crc32($text) / strlen($text)); # Deterministic seed. |
|
| 1436 | 1436 | |
| 1437 | 1437 | foreach ($chars as $key => $char) { |
| 1438 | 1438 | $ord = ord($char); |
@@ -1468,7 +1468,7 @@ discard block |
||
| 1468 | 1468 | | |
| 1469 | 1469 | (?<![`\\\\]) |
| 1470 | 1470 | `+ # code span marker |
| 1471 | - '.( $this->no_markup ? '' : ' |
|
| 1471 | + '.($this->no_markup ? '' : ' |
|
| 1472 | 1472 | | |
| 1473 | 1473 | <!-- .*? --> # comment |
| 1474 | 1474 | | |
@@ -1522,7 +1522,7 @@ discard block |
||
| 1522 | 1522 | # |
| 1523 | 1523 | switch ($token{0}) { |
| 1524 | 1524 | case "\\": |
| 1525 | - return $this->hashPart("&#". ord($token{1}). ";"); |
|
| 1525 | + return $this->hashPart("&#".ord($token{1}).";"); |
|
| 1526 | 1526 | case "`": |
| 1527 | 1527 | # Search for end marker in remaining text. |
| 1528 | 1528 | if (preg_match('/^(.*?[^`])'.preg_quote($token).'(?!`)(.*)$/sm', |
@@ -1577,7 +1577,7 @@ discard block |
||
| 1577 | 1577 | # Calculate amount of space, insert spaces, insert block. |
| 1578 | 1578 | $amount = $this->tab_width - |
| 1579 | 1579 | $strlen($line, 'UTF-8') % $this->tab_width; |
| 1580 | - $line .= str_repeat(" ", $amount) . $block; |
|
| 1580 | + $line .= str_repeat(" ", $amount).$block; |
|
| 1581 | 1581 | } |
| 1582 | 1582 | return $line; |
| 1583 | 1583 | } |
@@ -38,8 +38,9 @@ discard block |
||
| 38 | 38 | $parser =& $parser_list[$parser_class]; |
| 39 | 39 | |
| 40 | 40 | # create the parser it not already set |
| 41 | - if (!$parser) |
|
| 42 | - $parser = new $parser_class; |
|
| 41 | + if (!$parser) {
|
|
| 42 | + $parser = new $parser_class; |
|
| 43 | + } |
|
| 43 | 44 | |
| 44 | 45 | # Transform text using parser. |
| 45 | 46 | return $parser->transform($text); |
@@ -241,7 +242,9 @@ discard block |
||
| 241 | 242 | |
| 242 | 243 | |
| 243 | 244 | protected function hashHTMLBlocks($text) { |
| 244 | - if ($this->no_markup) return $text; |
|
| 245 | + if ($this->no_markup) {
|
|
| 246 | + return $text; |
|
| 247 | + } |
|
| 245 | 248 | |
| 246 | 249 | $less_than_tab = $this->tab_width - 1; |
| 247 | 250 | |
@@ -529,7 +532,9 @@ discard block |
||
| 529 | 532 | # |
| 530 | 533 | # Turn Markdown link shortcuts into XHTML <a> tags. |
| 531 | 534 | # |
| 532 | - if ($this->in_anchor) return $text; |
|
| 535 | + if ($this->in_anchor) {
|
|
| 536 | + return $text; |
|
| 537 | + } |
|
| 533 | 538 | $this->in_anchor = true; |
| 534 | 539 | |
| 535 | 540 | # |
@@ -623,8 +628,7 @@ discard block |
||
| 623 | 628 | $link_text = $this->runSpanGamut($link_text); |
| 624 | 629 | $result .= ">$link_text</a>"; |
| 625 | 630 | $result = $this->hashPart($result); |
| 626 | - } |
|
| 627 | - else { |
|
| 631 | + } else { |
|
| 628 | 632 | $result = $whole_match; |
| 629 | 633 | } |
| 630 | 634 | return $result; |
@@ -638,8 +642,9 @@ discard block |
||
| 638 | 642 | // if the URL was of the form <s p a c e s> it got caught by the HTML |
| 639 | 643 | // tag parser and hashed. Need to reverse the process before using the URL. |
| 640 | 644 | $unhashed = $this->unhash($url); |
| 641 | - if ($unhashed != $url) |
|
| 642 | - $url = preg_replace('/^<(.*)>$/', '\1', $unhashed); |
|
| 645 | + if ($unhashed != $url) {
|
|
| 646 | + $url = preg_replace('/^<(.*)>$/', '\1', $unhashed);
|
|
| 647 | + } |
|
| 643 | 648 | |
| 644 | 649 | $url = $this->encodeURLAttribute($url); |
| 645 | 650 | |
@@ -731,8 +736,7 @@ discard block |
||
| 731 | 736 | } |
| 732 | 737 | $result .= $this->empty_element_suffix; |
| 733 | 738 | $result = $this->hashPart($result); |
| 734 | - } |
|
| 735 | - else { |
|
| 739 | + } else { |
|
| 736 | 740 | # If there's no such link ID, leave intact: |
| 737 | 741 | $result = $whole_match; |
| 738 | 742 | } |
@@ -791,8 +795,9 @@ discard block |
||
| 791 | 795 | |
| 792 | 796 | protected function _doHeaders_callback_setext($matches) { |
| 793 | 797 | # Terrible hack to check we haven't found an empty list item. |
| 794 | - if ($matches[2] == '-' && preg_match('{^-(?: |$)}', $matches[1])) |
|
| 795 | - return $matches[0]; |
|
| 798 | + if ($matches[2] == '-' && preg_match('{^-(?: |$)}', $matches[1])) {
|
|
| 799 | + return $matches[0]; |
|
| 800 | + } |
|
| 796 | 801 | |
| 797 | 802 | $level = $matches[2]{0} == '=' ? 1 : 2; |
| 798 | 803 | |
@@ -823,7 +828,9 @@ discard block |
||
| 823 | 828 | return ""; |
| 824 | 829 | } |
| 825 | 830 | $idValue = call_user_func($this->header_id_func, $headerValue); |
| 826 | - if (!$idValue) return ""; |
|
| 831 | + if (!$idValue) {
|
|
| 832 | + return ""; |
|
| 833 | + } |
|
| 827 | 834 | |
| 828 | 835 | return ' id="' . $this->encodeAttribute($idValue) . '"'; |
| 829 | 836 | |
@@ -882,8 +889,7 @@ discard block |
||
| 882 | 889 | '.$whole_list_re.' |
| 883 | 890 | }mx', |
| 884 | 891 | array($this, '_doLists_callback'), $text); |
| 885 | - } |
|
| 886 | - else { |
|
| 892 | + } else { |
|
| 887 | 893 | $text = preg_replace_callback('{ |
| 888 | 894 | (?:(?<=\n)\n|\A\n?) # Must eat the newline |
| 889 | 895 | '.$whole_list_re.' |
@@ -990,8 +996,7 @@ discard block |
||
| 990 | 996 | # Replace marker with the appropriate whitespace indentation |
| 991 | 997 | $item = $leading_space . str_repeat(' ', strlen($marker_space)) . $item; |
| 992 | 998 | $item = $this->runBlockGamut($this->outdent($item)."\n"); |
| 993 | - } |
|
| 994 | - else { |
|
| 999 | + } else { |
|
| 995 | 1000 | # Recursion for sub-lists: |
| 996 | 1001 | $item = $this->doLists($this->outdent($item)); |
| 997 | 1002 | $item = preg_replace('/\n+$/', '', $item); |
@@ -1261,8 +1266,7 @@ discard block |
||
| 1261 | 1266 | $value = preg_replace('/^([ ]*)/', "<p>", $value); |
| 1262 | 1267 | $value .= "</p>"; |
| 1263 | 1268 | $grafs[$key] = $this->unhash($value); |
| 1264 | - } |
|
| 1265 | - else { |
|
| 1269 | + } else { |
|
| 1266 | 1270 | # Is a block. |
| 1267 | 1271 | # Modify elements of @grafs in-place... |
| 1268 | 1272 | $graf = $value; |
@@ -1329,17 +1333,17 @@ discard block |
||
| 1329 | 1333 | # representation for the URL (removing mailto: or tel:) storing it in $text. |
| 1330 | 1334 | # This function is *not* suitable for attributes enclosed in single quotes. |
| 1331 | 1335 | # |
| 1332 | - if ($this->url_filter_func) |
|
| 1333 | - $url = call_user_func($this->url_filter_func, $url); |
|
| 1336 | + if ($this->url_filter_func) {
|
|
| 1337 | + $url = call_user_func($this->url_filter_func, $url); |
|
| 1338 | + } |
|
| 1334 | 1339 | |
| 1335 | - if (preg_match('{^mailto:}i', $url)) |
|
| 1336 | - $url = $this->encodeEntityObfuscatedAttribute($url, $text, 7); |
|
| 1337 | - else if (preg_match('{^tel:}i', $url)) |
|
| 1340 | + if (preg_match('{^mailto:}i', $url)) {
|
|
| 1341 | + $url = $this->encodeEntityObfuscatedAttribute($url, $text, 7); |
|
| 1342 | + } else if (preg_match('{^tel:}i', $url)) |
|
| 1338 | 1343 | { |
| 1339 | 1344 | $url = $this->encodeAttribute($url); |
| 1340 | 1345 | $text = substr($url, 4); |
| 1341 | - } |
|
| 1342 | - else |
|
| 1346 | + } else |
|
| 1343 | 1347 | { |
| 1344 | 1348 | $url = $this->encodeAttribute($url); |
| 1345 | 1349 | $text = $url; |
@@ -1429,7 +1433,9 @@ discard block |
||
| 1429 | 1433 | # With some optimizations by Milian Wolff. Forced encoding of HTML |
| 1430 | 1434 | # attribute special characters by Allan Odgaard. |
| 1431 | 1435 | # |
| 1432 | - if ($text == "") return $tail = ""; |
|
| 1436 | + if ($text == "") {
|
|
| 1437 | + return $tail = ""; |
|
| 1438 | + } |
|
| 1433 | 1439 | |
| 1434 | 1440 | $chars = preg_split('/(?<!^)(?!$)/', $text); |
| 1435 | 1441 | $seed = (int)abs(crc32($text) / strlen($text)); # Deterministic seed. |
@@ -1443,8 +1449,11 @@ discard block |
||
| 1443 | 1449 | # '@' *must* be encoded. I insist. |
| 1444 | 1450 | # '"' and '>' have to be encoded inside the attribute |
| 1445 | 1451 | if ($r > 90 && strpos('@"&>', $char) === false) /* do nothing */; |
| 1446 | - else if ($r < 45) $chars[$key] = '&#x'.dechex($ord).';'; |
|
| 1447 | - else $chars[$key] = '&#'.$ord.';'; |
|
| 1452 | + else if ($r < 45) {
|
|
| 1453 | + $chars[$key] = '&#x'.dechex($ord).';'; |
|
| 1454 | + } else {
|
|
| 1455 | + $chars[$key] = '&#'.$ord.';'; |
|
| 1456 | + } |
|
| 1448 | 1457 | } |
| 1449 | 1458 | } |
| 1450 | 1459 | |
@@ -1505,8 +1514,7 @@ discard block |
||
| 1505 | 1514 | if (isset($parts[1])) { |
| 1506 | 1515 | $output .= $this->handleSpanToken($parts[1], $parts[2]); |
| 1507 | 1516 | $str = $parts[2]; |
| 1508 | - } |
|
| 1509 | - else { |
|
| 1517 | + } else { |
|
| 1510 | 1518 | break; |
| 1511 | 1519 | } |
| 1512 | 1520 | } |
@@ -1588,7 +1596,9 @@ discard block |
||
| 1588 | 1596 | # function that will loosely count the number of UTF-8 characters with a |
| 1589 | 1597 | # regular expression. |
| 1590 | 1598 | # |
| 1591 | - if (function_exists($this->utf8_strlen)) return; |
|
| 1599 | + if (function_exists($this->utf8_strlen)) {
|
|
| 1600 | + return; |
|
| 1601 | + } |
|
| 1592 | 1602 | $this->utf8_strlen = create_function('$text', 'return preg_match_all( |
| 1593 | 1603 | "/[\\\\x00-\\\\xBF]|[\\\\xC0-\\\\xFF][\\\\x80-\\\\xBF]*/", |
| 1594 | 1604 | $text, $m);'); |