Complex classes like LingoParser often do a lot of different things. To break such a class down, we need to identify a cohesive component within that class. A common approach to finding such a component is to look for fields and methods that share the same prefixes or suffixes. You can also have a look at the cohesion graph to spot any unconnected or weakly connected components.
Once you have determined the fields that belong together, you can apply the Extract Class refactoring. If the component makes sense as a sub-class, Extract Subclass is also a candidate, and is often faster.
While breaking up the class, it is a good idea to analyze how other classes use LingoParser, and based on these observations, apply Extract Interface, too.
| 1 | <?php |
||
| 45 | class LingoParser { |
||
| 46 | |||
| 47 | const WORD_VALUE = 0; |
||
| 48 | const WORD_OFFSET = 1; |
||
| 49 | |||
| 50 | private $mLingoTree = null; |
||
| 51 | |||
| 52 | /** |
||
| 53 | * @var Backend |
||
| 54 | */ |
||
| 55 | private $mLingoBackend = null; |
||
| 56 | private static $parserSingleton = null; |
||
| 57 | |||
| 58 | // The RegEx to split a chunk of text into words |
||
| 59 | 1 | public $regex = null; |
|
| 60 | |||
/**
 * Lingo\LingoParser constructor.
 *
 * Prepares the regular expression that splits a chunk of text into words.
 * A word is one of:
 *  - a placeholder for a stripped item (Parser marker prefix ... marker suffix),
 *  - a sequence of letters and numbers,
 *  - a single character that is neither a letter nor a number.
 *
 * @param MessageLog|null $messages not read by this constructor
 */
public function __construct( MessageLog &$messages = null ) {
	// Both marker strings are escaped for use inside a '/'-delimited pattern.
	$delimiter = '/';
	$markerStart = preg_quote( Parser::MARKER_PREFIX, $delimiter );
	$markerEnd = preg_quote( Parser::MARKER_SUFFIX, $delimiter );

	$this->regex = '/' . $markerStart . '.*?' . $markerEnd . '|[\p{L}\p{N}]+|[^\p{L}\p{N}]/u';
}
||
| 70 | |||
/**
 * Entry point that runs the Lingo parse step when applicable.
 *
 * The parser is taken from $GLOBALS['wgParser']; none of the three
 * arguments is read by this method.
 *
 * @param \AbstractContent $content unused
 * @param \Title $title unused
 * @param \ParserOutput $po unused
 *
 * @return bool always true
 */
public function parse( $content, $title, $po ) {
	/** @var \Parser $wikiParser */
	$wikiParser = $GLOBALS[ 'wgParser' ];

	// Nothing to do when the parser state does not qualify for Lingo processing.
	if ( !$this->shouldParse( $wikiParser ) ) {
		return true;
	}

	$this->realParse( $wikiParser );

	return true;
}
||
| 90 | |||
/**
 * Returns the shared parser instance, creating it on first use.
 *
 * @return LingoParser
 * @since 2.0.1
 */
public static function getInstance() {
	// Lazily create the singleton; later calls reuse the stored object.
	if ( self::$parserSingleton === null ) {
		self::$parserSingleton = new self();
	}

	return self::$parserSingleton;
}
||
| 103 | |||
/**
 * Builds the cache key under which the glossary tree is stored.
 *
 * The key is made from the tree version and the class name of the backend.
 *
 * @return string
 */
private function getCacheKey() {
	// FIXME: If Lingo ever stores the glossary tree per user, then the cache key
	// also needs to include the user id (see T163608)

	// NOTE(review): the backend is read from the singleton, not from $this - confirm this is intended.
	$backendClass = get_class( self::getInstance()->getBackend() );
	$cache = ObjectCache::getLocalClusterInstance();

	return $cache->makeKey( 'ext', 'lingo', 'lingotree', Tree::TREE_VERSION, $backendClass );
}
||
| 111 | |||
/**
 * Returns the backend assigned to this parser.
 *
 * @return Backend the backend used by the parser
 * @throws \MWException when no backend has been set
 */
public function getBackend() {
	if ( $this->mLingoBackend !== null ) {
		return $this->mLingoBackend;
	}

	throw new \MWException( 'No Lingo backend available!' );
}
||
| 124 | |||
/**
 * Returns the list of terms in the glossary.
 *
 * Delegates to the term list of the tree returned by getLingoTree().
 *
 * @return array an array mapping terms (keys) to descriptions (values)
 */
public function getLingoArray() {
	$glossaryTree = $this->getLingoTree();

	return $glossaryTree->getTermList();
}
||
| 133 | |||
| 134 | /** |
||
| 135 | * Returns the list of terms in the glossary as a Lingo\Tree |
||
| 136 | * |
||
| 137 | * @return Tree a Lingo\Tree mapping terms (keys) to descriptions (values) |
||
| 138 | */ |
||
| 139 | public function getLingoTree() { |
||
| 181 | |||
| 182 | /** |
||
| 183 | * @return Tree |
||
| 184 | */ |
||
| 185 | protected function &buildLingo() { |
||
| 197 | |||
| 198 | /** |
||
| 199 | * Parses the given text and enriches applicable terms |
||
| 200 | * |
||
| 201 | * This method currently only recognizes terms consisting of max one word |
||
| 202 | * |
||
| 203 | * @param Parser $parser |
||
| 204 | * |
||
| 205 | * @return Boolean |
||
| 206 | */ |
||
| 207 | protected function realParse( &$parser ) { |
||
| 340 | |||
| 341 | /** |
||
| 342 | * @param Parser $parser |
||
| 343 | */ |
||
| 344 | protected function loadModules( &$parser ) { |
||
| 363 | |||
| 364 | /** |
||
| 365 | * Purges the lingo tree from the cache. |
||
| 366 | * |
||
| 367 | * @deprecated 2.0.2 |
||
| 368 | */ |
||
| 369 | public static function purgeCache() { |
||
| 373 | |||
| 374 | /** |
||
| 375 | * Purges the lingo tree from the cache. |
||
| 376 | * |
||
| 377 | * @since 2.0.2 |
||
| 378 | */ |
||
| 379 | public function purgeGlossaryFromCache() { |
||
| 385 | |||
| 386 | /** |
||
| 387 | * @since 2.0.1 |
||
| 388 | * @param Backend $backend |
||
| 389 | */ |
||
| 390 | public function setBackend( Backend $backend ) { |
||
| 394 | |||
| 395 | /** |
||
| 396 | * @param Parser $parser |
||
| 397 | * @return bool |
||
| 398 | */ |
||
| 399 | protected function shouldParse( &$parser ) { |
||
| 424 | } |
||
| 425 | |||
| 426 |
This check looks for parameters that have been defined for a function or method, but which are not used in the method body.