Total Complexity | 59 |
Total Lines | 253 |
Duplicated Lines | 0 % |
Changes | 0 |
Complex classes like BlockElementParser often do a lot of different things. To break such a class down, we need to identify a cohesive component within that class. A common approach to finding such a component is to look for fields/methods that share the same prefixes or suffixes.
Once you have determined the fields that belong together, you can apply the Extract Class refactoring. If the component makes sense as a sub-class, Extract Subclass is also a candidate, and is often faster.
While breaking up the class, it is a good idea to analyze how other classes use BlockElementParser, and based on these observations, apply Extract Interface, too.
1 | <?php |
||
14 | abstract class BlockElementParser |
||
15 | { |
||
16 | use HtmlHelper; |
||
17 | |||
18 | const RE_MD_QUOTE = '~^\s*(>+)\s+~'; |
||
19 | const RE_RAW = '/^<\/?\w.*?\/?>/'; |
||
20 | const RE_MD_SETEXT = '~^\s*(={3,}|-{3,})\s*$~'; |
||
21 | const RE_MD_CODE = '/^```\s*([\w-]+)?/'; |
||
22 | const RE_MD_RULE = '~^(_{3,}|\*{3,}|\-{3,})$~'; |
||
23 | const RE_MD_TCOL = '~(\|\s*\:)?\s*\-{3,}\s*(\:\s*\|)?~'; |
||
24 | const RE_MD_OL = '/^\d+\. /'; |
||
25 | |||
26 | protected $lines = []; |
||
27 | protected $stackList = []; |
||
28 | protected $stackBlock = []; |
||
29 | protected $stackTable = []; |
||
30 | |||
31 | protected $pointer = -1; |
||
32 | protected $listLevel = 0; |
||
33 | protected $quoteLevel = 0; |
||
34 | protected $indent = 0; |
||
35 | protected $nextIndent = 0; |
||
36 | protected $indentLen = 4; |
||
37 | |||
38 | protected $indentStr = ' '; |
||
39 | protected $line = ''; |
||
40 | protected $trimmedLine = ''; |
||
41 | protected $prevLine = ''; |
||
42 | protected $trimmedPrevLine = ''; |
||
43 | protected $nextLine = ''; |
||
44 | protected $trimmedNextLine = ''; |
||
45 | protected $markup = ''; |
||
46 | |||
47 | protected $inList = \false; |
||
48 | protected $inQuote = \false; |
||
49 | protected $inPara = \false; |
||
50 | protected $inHtml = \false; |
||
51 | protected $inTable = \false; |
||
52 | |||
/**
 * Drive the block-level pass: visit each entry of $this->lines in order
 * and let the individual block handlers append to $this->markup.
 *
 * Per line, in this order:
 *  1. init() prepares the per-line state (defined outside this block).
 *  2. flush() or raw() may consume the line entirely.
 *  3. quote() runs unconditionally.
 *  4. isBlock() tries the block handlers; if none matched but a list is
 *     open, the trimmed line is appended verbatim.
 *  5. Otherwise table() is tried, falling back to paragraph().
 */
protected function parseBlockElements()
{
    for (;;) {
        // Advance first, then test: the pointer starts one before the first line.
        $this->pointer++;

        if (!isset($this->lines[$this->pointer])) {
            break;
        }

        $this->init();

        if ($this->flush()) {
            continue;
        }

        if ($this->raw()) {
            continue;
        }

        $this->quote();

        // isBlock() must run before inList is read, as in the original condition.
        if ($this->isBlock()) {
            continue;
        }

        if ($this->inList) {
            $this->markup .= $this->trimmedLine;

            continue;
        }

        if (!$this->table()) {
            $this->paragraph();
        }
    }
}
||
73 | |||
/**
 * Try each block-level handler against the current line, stopping at the
 * first one that reports a match.
 *
 * The order is significant: atx, setext, code, rule, then list.
 *
 * @return bool True when one of the handlers consumed the line.
 */
protected function isBlock()
{
    if ($this->atx()) {
        return \true;
    }

    if ($this->setext()) {
        return \true;
    }

    if ($this->code()) {
        return \true;
    }

    if ($this->rule()) {
        return \true;
    }

    return (bool) $this->listt();
}
||
78 | |||
/**
 * Handle an ATX heading, i.e. a trimmed line that starts with `#`.
 *
 * The heading level is the number of leading `#` characters. Levels above
 * six are not treated as headings and the line is left for other handlers.
 *
 * @return true|null True when a heading was appended to the markup,
 *                   null otherwise.
 */
protected function atx()
{
    $text = $this->trimmedLine;

    if (!isset($text[0]) || $text[0] !== '#') {
        return;
    }

    // Count the leading hashes by measuring how much ltrim() removes.
    $level = \strlen($text) - \strlen(\ltrim($text, '#'));

    if ($level >= 7) {
        return;
    }

    // Drop the hash/space prefix, then any other leading whitespace.
    $title = \ltrim(\ltrim($text, '# '));

    $this->markup .= "\n" . \sprintf('<h%1$d>%2$s</h%1$d>', $level, $title);

    return \true;
}
||
91 | |||
/**
 * Handle a Setext heading: the current line is the heading text and the
 * next line is an underline of `=` (level 1) or `-` (level 2).
 *
 * On a match the heading is appended to the markup and the pointer is
 * advanced by one so the underline is not parsed again.
 *
 * @return true|null True when a heading was emitted, null otherwise.
 */
protected function setext()
{
    if (\preg_match(static::RE_MD_SETEXT, $this->nextLine)) {
        // RE_MD_SETEXT tolerates any whitespace (\s) around the underline,
        // so strip all of it together with the dashes. Stripping only '-'
        // and ' ' misread a dashed underline followed by a tab or a "\r"
        // (CRLF input) as level 1.
        $level = \trim($this->nextLine, "- \t\n\r\f\x0B\0") === '' ? 2 : 1;

        $this->markup .= "\n<h{$level}>{$this->trimmedLine}</h{$level}>";

        // Skip the underline.
        $this->pointer++;

        return \true;
    }
}
||
104 | |||
/**
 * Handle a code block starting at the current line.
 *
 * Two triggers are recognised:
 *  - the raw line matches RE_MD_CODE (a ``` fence, optionally followed by
 *    a language name), or
 *  - outside of lists and quotes, the current indent exceeds the next
 *    line's indent by at least $indentLen.
 *
 * The body lines are gathered by codeInternal(); afterwards the pointer is
 * advanced once more before the closing tags are written.
 *
 * @return true|null True when a code block was emitted, null otherwise.
 */
protected function code()
{
    $isShifted = ($this->indent - $this->nextIndent) >= $this->indentLen;
    $codeBlock = \preg_match(static::RE_MD_CODE, $this->line, $codeMatch);

    // Neither fenced nor an eligible indented block: nothing to do.
    if (!$codeBlock && ($this->inList || $this->inQuote || !$isShifted)) {
        return;
    }

    $lang = '';

    if (isset($codeMatch[1])) {
        $lang = ' class="language-' . $codeMatch[1] . '"';
    }

    $this->markup .= "\n<pre><code{$lang}>";

    // For an indented block the current line is itself the first code line.
    if (!$codeBlock) {
        $firstLine = \substr($this->line, $this->indentLen);

        $this->markup .= $this->escape($firstLine);
    }

    $this->codeInternal($codeBlock);

    $this->pointer++;

    $this->markup .= '</code></pre>';

    return \true;
}
||
130 | |||
/**
 * Append the following lines to the markup for as long as they belong to
 * the code block opened by code().
 *
 * A following line is kept when either
 *  - the block is fenced and the line does not start (after left-trimming)
 *    with ```, or
 *  - the line starts with $indentStr.
 *
 * Each kept line is escaped and stored in $this->line, preceded by a
 * newline in the markup, and the pointer is advanced past it. Scanning
 * stops at the first line that is not kept, or at the end of input.
 *
 * @param int|bool $codeBlock Truthy when the block was opened by a fence.
 */
private function codeInternal($codeBlock)
{
    for (
        $next = $this->pointer + 1;
        isset($this->lines[$next]);
        $next = $this->pointer + 1
    ) {
        $this->line = $this->escape($this->lines[$next]);

        $insideFence = $codeBlock && \substr(\ltrim($this->line), 0, 3) !== '```';

        // Only test the indent prefix when the fence rule did not already keep the line.
        $keep = $insideFence || \strpos($this->line, $this->indentStr) === 0;

        if (!$keep) {
            break;
        }

        // @todo: do not use \n for the first line
        $this->markup .= "\n" . ($codeBlock ? $this->line : \substr($this->line, $this->indentLen));

        $this->pointer++;
    }
}
||
148 | |||
/**
 * Handle a horizontal rule: a trimmed line matching RE_MD_RULE whose
 * previous trimmed line is empty.
 *
 * @return true|null True when an <hr /> was appended, null otherwise.
 */
protected function rule()
{
    // A rule is only recognised directly after an empty line.
    if ($this->trimmedPrevLine !== '') {
        return;
    }

    if (!\preg_match(static::RE_MD_RULE, $this->trimmedLine)) {
        return;
    }

    $this->markup .= "\n<hr />";

    return \true;
}
||
159 | |||
160 | protected function listt() |
||
180 | } |
||
181 | } |
||
182 | |||
/**
 * Decide, from the NEXT line, how the current list item is closed and
 * whether a nested list is opened or enclosing lists are unwound.
 *
 * - Next line is not a list item: the current item is closed.
 * - Next line is a list item indented deeper: a nested <ul>/<ol> is
 *   opened, its closing tags are pushed on $stackList and $listLevel
 *   is incremented.
 * - Next line is a list item at the same or a shallower indent: the
 *   current item is closed; for a shallower indent, closing tags are
 *   additionally popped from $stackList, once per $indentLen of
 *   difference.
 */
private function listInternal()
{
    // Strict comparison: the two-character prefix must be exactly one of
    // the bullet markers, with no type juggling.
    $isUl = \in_array(\substr($this->trimmedNextLine, 0, 2), ['- ', '* ', '+ '], \true);

    if (!$isUl && !\preg_match(static::RE_MD_OL, $this->trimmedNextLine)) {
        $this->markup .= "</li>\n";

        return;
    }

    $wrapper = $isUl ? 'ul' : 'ol';

    if ($this->nextIndent > $this->indent) {
        // Deeper indent: open a nested list and remember how to close it.
        $this->stackList[] = "</li>\n";
        $this->stackList[] = "</$wrapper>";
        $this->markup .= "\n<$wrapper>\n";

        $this->listLevel++;

        return;
    }

    $this->markup .= "</li>\n";

    if ($this->nextIndent < $this->indent) {
        // Shallower indent: unwind one nesting step per $indentLen of difference.
        $shift = \intval(($this->indent - $this->nextIndent) / $this->indentLen);

        while ($shift--) {
            $this->markup .= \array_pop($this->stackList);

            if ($this->listLevel > 2) {
                $this->markup .= \array_pop($this->stackList);
            }
        }
    }
}
||
214 | |||
215 | protected function table() |
||
247 | } |
||
248 | |||
249 | private function tableInternal($headerCount) |
||
250 | { |
||
251 | $columnCount = \preg_match_all(static::RE_MD_TCOL, \trim($this->trimmedNextLine, '|')); |
||
252 | |||
253 | if ($headerCount > 0 && $headerCount <= $columnCount) { |
||
267 | } |
||
268 | } |
||
270 |