Total Complexity | 77 |
Total Lines | 310 |
Duplicated Lines | 0 % |
Changes | 1 | ||
Bugs | 0 | Features | 0 |
Complex classes like SchemaParser often do a lot of different things. To break such a class down, we need to identify a cohesive component within that class. A common approach to find such a component is to look for fields/methods that share the same prefixes, or suffixes.
Once you have determined the fields that belong together, you can apply the Extract Class refactoring. If the component makes sense as a sub-class, Extract Subclass is also a candidate, and is often faster.
While breaking up the class, it is a good idea to analyze how other classes use SchemaParser, and based on these observations, apply Extract Interface, too.
1 | <?php |
||
13 | class SchemaParser |
||
14 | { |
||
15 | public const TL_API_SOURCE_URL = 'https://raw.githubusercontent.com/tdlib/td/v1.6.0/td/generate/scheme/td_api.tl'; |
||
16 | |||
17 | private OutputInterface $output; |
||
18 | |||
19 | private string $schemaFile; |
||
20 | private string $rawSchema; |
||
21 | private string $currentLine; |
||
22 | private int $currentLineNr; |
||
23 | private array $documentation; |
||
24 | private array $classes; |
||
25 | |||
26 | public function __construct(OutputInterface $output, string $schemaFile = null) |
||
27 | { |
||
28 | $this->output = $output; |
||
29 | $this->schemaFile = $schemaFile ?? static::TL_API_SOURCE_URL; |
||
30 | $this->rawSchema = file_get_contents($this->schemaFile); |
||
31 | $this->documentation = []; |
||
32 | $this->classes = []; |
||
33 | } |
||
34 | |||
35 | /** |
||
36 | * @return ClassDefinition[] |
||
37 | */ |
||
38 | public function parse(): array |
||
39 | { |
||
40 | $lines = explode(PHP_EOL, $this->rawSchema); |
||
41 | |||
42 | $description = ''; |
||
43 | $currentClassName = ''; |
||
44 | $currentClass = new ClassDefinition(); |
||
45 | $isFunction = false; |
||
46 | $needClassDescription = false; |
||
47 | $this->currentLineNr = 0; |
||
48 | |||
49 | foreach ($lines as $line) { |
||
50 | $this->currentLine = $line; |
||
51 | $this->currentLineNr++; |
||
52 | |||
53 | if ('---types---' === $line) { |
||
54 | $isFunction = false; |
||
55 | } elseif ('---functions---' === $line) { |
||
56 | $isFunction = true; |
||
57 | $currentClassName = ''; |
||
58 | $currentClass = new ClassDefinition(); |
||
59 | $needClassDescription = false; |
||
60 | } elseif (($line[0] ?? '') === '/') { |
||
61 | if (($line[1] ?? '') !== '/') { |
||
62 | $this->printError('Wrong comment'); |
||
63 | |||
64 | continue; |
||
65 | } |
||
66 | |||
67 | if (($line[2] ?? '') === '@' || ($line[2] ?? '') === '-') { |
||
68 | $description .= trim(substr($line, 2 + intval('-' === $line[2]))) . ' '; |
||
69 | } else { |
||
70 | $this->printError('Unexpected comment'); |
||
71 | } |
||
72 | } elseif (strpos($line, '? =') || strpos($line, ' = Vector t;') || 'boolFalse = Bool;' === $line || |
||
73 | 'boolTrue = Bool;' === $line || 'bytes = Bytes;' === $line || 'int32 = Int32;' === $line || |
||
74 | 'int53 = Int53;' === $line || 'int64 = Int64;' === $line) { |
||
75 | $this->printDebug('skip built-in types'); |
||
76 | |||
77 | continue; |
||
78 | } else { |
||
79 | $description = trim($description); |
||
80 | |||
81 | if ('' === $description) { |
||
82 | // $this->printError('Empty description', ['description' => $description]); |
||
83 | } |
||
84 | |||
85 | if (($description[0] ?? '') !== '@') { |
||
86 | // $this->printError('Wrong description begin', ['description' => $description]); |
||
87 | } |
||
88 | |||
89 | $docs = explode('@', $description); |
||
90 | array_shift($docs); |
||
91 | |||
92 | $info = []; |
||
93 | foreach ($docs as $doc) { |
||
94 | [$key, $value] = explode(' ', $doc, 2); |
||
95 | $value = trim($value); |
||
96 | |||
97 | if ($needClassDescription) { |
||
98 | if ('description' === $key) { |
||
99 | $needClassDescription = false; |
||
100 | |||
101 | $currentClass->classDocs = $value; |
||
102 | $currentClass->parentClass = 'Object'; |
||
103 | $currentClass->typeName = $currentClass->className; |
||
104 | |||
105 | $this->classes[$value] = $currentClass; |
||
106 | $currentClass = new ClassDefinition(); |
||
107 | continue; |
||
108 | } else { |
||
109 | $this->printError('Expected abstract class description', ['description' => $description]); |
||
110 | } |
||
111 | } |
||
112 | |||
113 | if ('class' === $key) { |
||
114 | $currentClassName = $this->getClassName($value); |
||
115 | $currentClass->className = $currentClassName; |
||
116 | |||
117 | $needClassDescription = true; |
||
118 | |||
119 | if ($isFunction) { |
||
120 | $this->printError('Unexpected class definition'); |
||
121 | } |
||
122 | } else { |
||
123 | if (isset($info[$key])) { |
||
124 | // $this->printError("Duplicate info about `$key`"); |
||
125 | } |
||
126 | $info[$key] = trim($value); |
||
127 | } |
||
128 | } |
||
129 | |||
130 | if (1 !== substr_count($line, '=')) { |
||
131 | // $this->printError("Wrong '=' count"); |
||
132 | continue; |
||
133 | } |
||
134 | |||
135 | [$fields, $type] = explode('=', $line); |
||
136 | $type = $this->getClassName($type); |
||
137 | $fields = explode(' ', trim($fields)); |
||
138 | $typeName = array_shift($fields); |
||
139 | $className = $this->getClassName($typeName); |
||
140 | |||
141 | if ($type !== $currentClassName) { |
||
142 | $currentClassName = ''; |
||
143 | $currentClass = new ClassDefinition(); |
||
144 | $needClassDescription = false; |
||
145 | } |
||
146 | |||
147 | if (!$isFunction) { |
||
148 | $typeLower = strtolower($type); |
||
149 | $classNameLower = strtolower($className); |
||
150 | |||
151 | if (empty($currentClassName) === ($typeLower !== $classNameLower)) { |
||
152 | $this->printError('Wrong constructor name'); |
||
153 | } |
||
154 | |||
155 | if (0 !== strpos($classNameLower, $typeLower)) { |
||
156 | // $this->printError('Wrong constructor name'); |
||
157 | } |
||
158 | } |
||
159 | |||
160 | $knownFields = []; |
||
161 | foreach ($fields as $field) { |
||
162 | [$fieldName, $fieldType] = explode(':', $field); |
||
163 | |||
164 | if (isset($info['param_' . $fieldName])) { |
||
165 | $knownFields['param_' . $fieldName] = $fieldType; |
||
166 | |||
167 | continue; |
||
168 | } |
||
169 | |||
170 | if (isset($info[$fieldName])) { |
||
171 | $knownFields[$fieldName] = $fieldType; |
||
172 | |||
173 | continue; |
||
174 | } |
||
175 | |||
176 | $this->printError("Have no info about field `$fieldName`"); |
||
177 | } |
||
178 | |||
179 | foreach ($info as $name => $value) { |
||
180 | if (!$value) { |
||
181 | $this->printError("info[$name] for $className is empty"); |
||
182 | } elseif (($value[0] < 'A' || $value[0] > 'Z') && ($value[0] < '0' || $value[0] > '9')) { |
||
183 | $this->printError("info[$name] for $className doesn't begins with capital letter"); |
||
184 | } |
||
185 | } |
||
186 | |||
187 | foreach (array_diff_key($info, $knownFields) as $fieldName => $fieldInfo) { |
||
188 | if ('description' !== $fieldName) { |
||
189 | $this->printError("Have info about unexisted field `$fieldName`"); |
||
190 | } |
||
191 | } |
||
192 | |||
193 | if (!isset($info['description'])) { |
||
194 | $this->printError("Have no description for class `$className`"); |
||
195 | } |
||
196 | |||
197 | $baseClassName = $currentClassName ?: $this->getBaseClassName($isFunction); |
||
198 | $classDescription = $info['description']; |
||
199 | |||
200 | if ($isFunction) { |
||
201 | $currentClass->returnType = $this->getTypeName($type); |
||
202 | } |
||
203 | |||
204 | $currentClass->className = $className; |
||
205 | $currentClass->parentClass = $baseClassName; |
||
206 | $currentClass->classDocs = $classDescription; |
||
207 | $currentClass->typeName = $typeName; |
||
208 | |||
209 | foreach ($knownFields as $name => $fieldType) { |
||
210 | $mayBeNull = false !== stripos($info[$name], 'may be null'); |
||
211 | $fieldName = $this->getFieldName($name, $className); |
||
212 | $fieldTypeName = $this->getTypeName($fieldType); |
||
213 | |||
214 | $rawName = $name; |
||
215 | if ('param_' === substr($rawName, 0, 6)) { |
||
216 | $rawName = substr($rawName, 6); |
||
217 | } |
||
218 | |||
219 | $field = $currentClass->getField($name); |
||
220 | $field->rawName = $rawName; |
||
221 | $field->name = $fieldName; |
||
222 | $field->type = $fieldTypeName; |
||
223 | $field->doc = $info[$name]; |
||
224 | $field->mayBeNull = $mayBeNull; |
||
225 | } |
||
226 | |||
227 | $this->classes[$typeName] = $currentClass; |
||
228 | $currentClass = new ClassDefinition(); |
||
229 | $description = ''; |
||
230 | } |
||
231 | } |
||
232 | |||
233 | return $this->classes; |
||
234 | } |
||
235 | |||
236 | private function printError(string $msg, array $args = []): void |
||
237 | { |
||
238 | $this->output->writeln( |
||
239 | '<error>' . $msg . '</error>', |
||
240 | ); |
||
241 | |||
242 | dump(['line' => $this->currentLine, 'line_nr' => $this->currentLineNr], $args); |
||
|
|||
243 | } |
||
244 | |||
245 | private function printDebug(string $msg, array $args = []): void |
||
246 | { |
||
247 | if ($this->output->isDebug()) { |
||
248 | $this->output->writeln('<debug>' . $msg . '</debug>'); |
||
249 | |||
250 | dump(['line' => $this->currentLine, 'line_nr' => $this->currentLineNr], $args); |
||
251 | } |
||
252 | } |
||
253 | |||
254 | protected function getClassName($name): string |
||
255 | { |
||
256 | return implode(array_map('ucfirst', explode('.', trim($name, "\r\n ;")))); |
||
257 | } |
||
258 | |||
259 | protected function getBaseClassName($isFunction): string |
||
260 | { |
||
261 | return $isFunction ? 'Function' : 'Object'; |
||
262 | } |
||
263 | |||
264 | protected function getTypeName($type): string |
||
265 | { |
||
266 | switch ($type) { |
||
267 | case 'Bool': |
||
268 | return 'bool'; |
||
269 | case 'int32': |
||
270 | case 'int53': |
||
271 | return 'int'; |
||
272 | case 'double': |
||
273 | return 'float'; |
||
274 | case 'string': |
||
275 | case 'bytes': |
||
276 | case 'int64': |
||
277 | return 'string'; |
||
278 | case 'bool': |
||
279 | case 'int': |
||
280 | case 'long': |
||
281 | case 'Int': |
||
282 | case 'Long': |
||
283 | case 'Int32': |
||
284 | case 'Int53': |
||
285 | case 'Int64': |
||
286 | case 'Double': |
||
287 | case 'String': |
||
288 | case 'Bytes': |
||
289 | $this->printError("Wrong type $type"); |
||
290 | |||
291 | return ''; |
||
292 | default: |
||
293 | if ('vector' === substr($type, 0, 6)) { |
||
294 | if ('<' !== $type[6] || '>' !== $type[strlen($type) - 1]) { |
||
295 | $this->printError("Wrong vector subtype in $type"); |
||
296 | |||
297 | return ''; |
||
298 | } |
||
299 | |||
300 | return $this->getTypeName(substr($type, 7, -1)) . '[]'; |
||
301 | } |
||
302 | |||
303 | if (preg_match('/[^A-Za-z0-9.]/', $type)) { |
||
304 | $this->printError("Wrong type $type"); |
||
305 | |||
306 | return ''; |
||
307 | } |
||
308 | |||
309 | return $this->getClassName($type); |
||
310 | } |
||
311 | } |
||
312 | |||
313 | protected function getFieldName($name, $className): string |
||
323 | ); |
||
324 | } |
||
325 | } |
||
326 |