These results are based on our legacy PHP analysis; consider migrating to our new PHP analysis engine instead. Learn more
| 1 | <?php | ||
| 2 | /** | ||
| 3 | * @copyright Copyright (c) 2014 Carsten Brandt | ||
| 4 | * @license https://github.com/cebe/markdown/blob/master/LICENSE | ||
| 5 | * @link https://github.com/cebe/markdown#readme | ||
| 6 | */ | ||
| 7 | |||
| 8 | namespace cebe\markdown\latex; | ||
| 9 | |||
| 10 | use cebe\markdown\block\CodeTrait; | ||
| 11 | use cebe\markdown\block\HeadlineTrait; | ||
| 12 | use cebe\markdown\block\ListTrait; | ||
| 13 | use cebe\markdown\block\QuoteTrait; | ||
| 14 | use cebe\markdown\block\RuleTrait; | ||
| 15 | |||
| 16 | use cebe\markdown\inline\CodeTrait as InlineCodeTrait; | ||
| 17 | use cebe\markdown\inline\EmphStrongTrait; | ||
| 18 | use cebe\markdown\inline\LinkTrait; | ||
| 19 | |||
| 20 | use MikeVanRiel\TextToLatex; | ||
| 21 | |||
/**
 * Markdown parser for the [initial markdown spec](http://daringfireball.net/projects/markdown/syntax)
 * which renders the parsed document as LaTeX markup.
 *
 * Block and inline parsing is provided by the traits included below; this class
 * supplies the `render*()` methods that produce LaTeX for each parsed element.
 *
 * @author Carsten Brandt <[email protected]>
 */
class Markdown extends \cebe\markdown\Parser
{
	// include block element parsing using traits
	use CodeTrait;
	use HeadlineTrait;
	use ListTrait {
		// Check Ul List before headline
		identifyUl as protected identifyBUl;
		consumeUl as protected consumeBUl;
	}
	use QuoteTrait;
	use RuleTrait {
		// Check Hr before checking lists
		identifyHr as protected identifyAHr;
		consumeHr as protected consumeAHr;
	}

	// include inline element parsing using traits
	use InlineCodeTrait;
	use EmphStrongTrait;
	use LinkTrait;

	/**
	 * @var string this string will be prefixed to all auto generated labels.
	 * This can be used to disambiguate labels when combining multiple markdown files into one document.
	 */
	public $labelPrefix = '';

	const LINK_STYLE_FOOTNOTE = 'footnote';
	const LINK_STYLE_HREF = 'href';

	/**
	 * @var string link style defines how links are rendered in LaTeX, there are two different options:
	 *
	 * - `footnote` (default) - render all links with a footnote, which contains the full URL of the link. This is good for printing the PDF.
	 * - `href` - render all links with a hyperref, similar to HTML, the link target is not visible in this case.
	 */
	public $linkStyle = self::LINK_STYLE_FOOTNOTE;

	/**
	 * @var array these are "escapeable" characters. When using one of these prefixed with a
	 * backslash, the character will be outputted without the backslash and is not interpreted
	 * as markdown.
	 */
	protected $escapeCharacters = [
		'\\', // backslash
		'`', // backtick
		'*', // asterisk
		'_', // underscore
		'{', '}', // curly braces
		'[', ']', // square brackets
		'(', ')', // parentheses
		'#', // hash mark
		'+', // plus sign
		'-', // minus sign (hyphen)
		'.', // dot
		'!', // exclamation mark
		'<', '>',
	];

	/**
	 * @var TextToLatex|null lazily created escaper instance, see [[escapeLatex()]].
	 */
	private $_escaper;


	/**
	 * @inheritDoc
	 */
	protected function prepare()
	{
		// reset references
		$this->references = [];
	}

	/**
	 * Consume lines for a paragraph
	 *
	 * Allow headlines and code to break paragraphs
	 *
	 * @param string[] $lines all lines of the document being parsed.
	 * @param int $current index of the first line of the paragraph.
	 * @return array the paragraph block and the index of the last consumed line.
	 */
	protected function consumeParagraph($lines, $current)
	{
		$content = [];
		for ($i = $current, $count = count($lines); $i < $count; $i++) {
			$line = $lines[$i];
			// A paragraph ends at a blank line. Do not use empty() here: it would
			// treat a line that consists only of "0" as blank.
			if (ltrim($line) === '') {
				break;
			}
			// An indented line (tab or four spaces) starts a code block, and a
			// headline also terminates the paragraph.
			if ($line[0] === "\t"
				|| strncmp($line, '    ', 4) === 0
				|| $this->identifyHeadline($line, $lines, $i)
			) {
				break;
			}
			$content[] = $line;
		}
		$block = [
			'paragraph',
			'content' => $this->parseInline(implode("\n", $content)),
		];
		// $i points at the first line that is NOT part of the paragraph
		return [$block, $i - 1];
	}


	// rendering adjusted for LaTeX output


	/**
	 * @inheritdoc
	 */
	protected function renderParagraph($block)
	{
		return $this->renderAbsy($block['content']) . "\n\n";
	}

	/**
	 * @inheritdoc
	 */
	protected function renderQuote($block)
	{
		return '\begin{quote}' . $this->renderAbsy($block['content']) . "\\end{quote}\n";
	}

	/**
	 * Renders a code block as a `lstlisting` environment, preceded by an
	 * `\lstset` that selects the block's language (empty if none is given).
	 *
	 * @inheritdoc
	 */
	protected function renderCode($block)
	{
		$language = isset($block['language'])
			? '\lstset{language=' . $block['language'] . '}'
			: '\lstset{language={}}';

		// replace No-Break Space characters in code block, which do not render in LaTeX
		$content = preg_replace("/[\x{00a0}\x{202f}]/u", ' ', $block['content']);

		return $language . "\\begin{lstlisting}\n" . $content . "\n\\end{lstlisting}\n";
	}

	/**
	 * Renders an ordered list as `enumerate` and any other list as `itemize`.
	 *
	 * @inheritdoc
	 */
	protected function renderList($block)
	{
		$type = ($block['list'] === 'ol') ? 'enumerate' : 'itemize';
		$output = '\begin{' . $type . "}\n";

		foreach ($block['items'] as $itemLines) {
			$output .= '\item ' . $this->renderAbsy($itemLines) . "\n";
		}

		return $output . '\end{' . $type . "}\n";
	}

	/**
	 * Maps headline levels 1-3 to `\section`, `\subsection` and `\subsubsection`;
	 * every other level is rendered as `\paragraph`.
	 *
	 * @inheritdoc
	 */
	protected function renderHeadline($block)
	{
		$content = $this->renderAbsy($block['content']);
		switch ($block['level']) {
			case 1:
				return '\section{' . $content . "}\n";
			case 2:
				return '\subsection{' . $content . "}\n";
			case 3:
				return '\subsubsection{' . $content . "}\n";
			default:
				return '\paragraph{' . $content . "}\n";
		}
	}

	/**
	 * Renders a horizontal rule. The block carries no data that affects the
	 * output, so `$block` is intentionally unused.
	 *
	 * @inheritdoc
	 */
	protected function renderHr($block)
	{
		return "\n\\noindent\\rule{\\textwidth}{0.4pt}\n";
	}

	/**
	 * Renders a link.
	 *
	 * URLs without a `://` are treated as references inside the document and rendered
	 * as `\hyperref` (the title is ignored in this case). All other URLs are rendered
	 * according to [[linkStyle]].
	 *
	 * @inheritdoc
	 */
	protected function renderLink($block)
	{
		if (isset($block['refkey'])) {
			$ref = $this->lookupReference($block['refkey']);
			if ($ref === false) {
				// unknown reference, output the original markdown
				return $block['orig'];
			}
			$block = array_merge($block, $ref);
		}

		$url = $block['url'];
		$text = $this->renderAbsy($block['text']);

		if (strpos($url, '://') === false) {
			// consider all non absolute links as relative in the document
			// $title is ignored in this case.
			if (isset($url[0]) && $url[0] === '#') {
				$url = $this->labelPrefix . $url;
			}
			return '\hyperref[' . str_replace('#', '::', $url) . ']{' . $text . '}';
		}

		if ($this->linkStyle === self::LINK_STYLE_HREF) {
			return '\href{' . $this->escapeUrl($url) . '}{' . $text . '}';
		}

		$title = empty($block['title']) ? '' : $this->escapeLatex($block['title']) . ': ';
		return $text . '\\footnote{' . $title . '\url{' . $this->escapeUrl($url) . '}}';
	}

	/**
	 * Renders an image as `\includegraphics` spanning the text width.
	 *
	 * @inheritdoc
	 */
	protected function renderImage($block)
	{
		if (isset($block['refkey'])) {
			$ref = $this->lookupReference($block['refkey']);
			if ($ref === false) {
				// unknown reference, output the original markdown
				return $block['orig'];
			}
			$block = array_merge($block, $ref);
		}

		// TODO create figure with caption with title
		$replaces = [
			'%' => '\\%',
			'{' => '\\%7B',
			'}' => '\\%7D',
			'\\' => '\\\\',
			'#' => '\\#',
			'$' => '\\%24',
		];
		// strtr() replaces all keys in a single pass. str_replace() with arrays works
		// sequentially and would escape the backslashes inserted for '%', '{' and '}'
		// a second time when it reaches the '\\' entry.
		$url = strtr($block['url'], $replaces);

		return '\noindent\includegraphics[width=\textwidth]{' . $url . '}';
	}

	/**
	 * Parses <a name="..."></a> tags as reference labels
	 *
	 * `<a>` and `<span>` elements carrying a `name` or `id` attribute are converted to a
	 * `label` element; anything else is returned as a literal `<`.
	 *
	 * @param string $text the text to parse, starting at the `<` character.
	 * @return array the parsed element and the number of bytes consumed.
	 */
	private function parseInlineHtml($text)
	{
		if (strpos($text, '>') !== false) {
			// convert a name markers to \labels
			if (preg_match('~^<((a|span)) (name|id)="(.*?)">.*?</\1>~i', $text, $matches)) {
				return [
					['label', 'name' => str_replace('#', '::', $this->labelPrefix . $matches[4])],
					strlen($matches[0]),
				];
			}
		}
		return [['text', '<'], 1];
	}

	/**
	 * renders a reference label
	 */
	protected function renderLabel($block)
	{
		return '\label{' . $block['name'] . '}';
	}

	/**
	 * @inheritdoc
	 */
	protected function renderEmail($block)
	{
		$email = $this->escapeUrl($block[1]);
		return '\href{mailto:' . $email . '}{' . $email . '}';
	}

	/**
	 * @inheritdoc
	 */
	protected function renderUrl($block)
	{
		return '\url{' . $this->escapeUrl($block[1]) . '}';
	}

	/**
	 * Renders inline code as `\lstinline`, with newlines replaced by spaces.
	 *
	 * @inheritdoc
	 */
	protected function renderInlineCode($block)
	{
		// replace No-Break Space characters in code block, which do not render in LaTeX
		$content = preg_replace("/[\x{00a0}\x{202f}]/u", ' ', $block[1]);
		$content = str_replace("\n", ' ', $content);

		// \lstinline takes its argument between two identical delimiter characters, so
		// pick the first candidate that does not occur in the code itself.
		// If every candidate occurs, fall back to the backtick.
		$delimiter = '`';
		foreach (['|', '`', '!', '@', '+', '/', '='] as $candidate) {
			if (strpos($content, $candidate) === false) {
				$delimiter = $candidate;
				break;
			}
		}

		return '\\lstinline' . $delimiter . $content . $delimiter;
	}

	/**
	 * @inheritdoc
	 */
	protected function renderStrong($block)
	{
		return '\textbf{' . $this->renderAbsy($block[1]) . '}';
	}

	/**
	 * @inheritdoc
	 */
	protected function renderEmph($block)
	{
		return '\textit{' . $this->renderAbsy($block[1]) . '}';
	}

	/**
	 * Parses escaped special characters.
	 * This allow a backslash to be interpreted as LaTeX
	 * @marker \
	 */
	protected function parseEscape($text)
	{
		if (isset($text[1]) && in_array($text[1], $this->escapeCharacters, true)) {
			if ($text[1] === '\\') {
				// an escaped backslash gets its own element, see renderBackslash()
				return [['backslash'], 2];
			}
			return [['text', $text[1]], 2];
		}
		// not an escape sequence, output the backslash itself as text
		return [['text', $text[0]], 1];
	}

	/**
	 * Renders an escaped backslash as a single raw backslash.
	 */
	protected function renderBackslash()
	{
		return '\\';
	}

	/**
	 * Escape special characters in URLs
	 *
	 * Applies [[escapeLatex()]] and then prefixes every `%` with a backslash.
	 */
	protected function escapeUrl($string)
	{
		return str_replace('%', '\\%', $this->escapeLatex($string));
	}

	/**
	 * Escape special LaTeX characters
	 *
	 * The TextToLatex converter is created on first use and reused afterwards.
	 */
	protected function escapeLatex($string)
	{
		if ($this->_escaper === null) {
			$this->_escaper = new TextToLatex();
		}
		return $this->_escaper->convert($string);
	}

	/**
	 * @inheritdoc
	 *
	 * Parses a newline indicated by two spaces on the end of a markdown line.
	 */
	protected function renderText($text)
	{
		$output = str_replace("  \n", "\\\\\n", $this->escapeLatex($text[1]));
		// support No-Break Space in LaTeX
		$output = preg_replace("/\x{00a0}/u", '~', $output);
		// support Narrow No-Break Space spaces in LaTeX
		// http://unicode-table.com/en/202F/
		// http://tex.stackexchange.com/questions/76132/how-to-typeset-a-small-non-breaking-space
		$output = preg_replace("/\x{202f}/u", '\nobreak\hspace{.16667em plus .08333em}', $output);
		return $output;
	}
}
| 383 | 
 
                                
This check looks for parameters that have been defined for a function or method, but which are not used in the method body.