Complex classes like Jetpack_WPES_Query_Builder often do a lot of different things. To break such a class down, we need to identify a cohesive component within that class. A common approach to finding such a component is to look for fields/methods that share the same prefixes or suffixes. You can also look at the cohesion graph to spot any unconnected or weakly connected components.
Once you have determined the fields that belong together, you can apply the Extract Class refactoring. If the component makes sense as a sub-class, Extract Subclass is also a candidate, and is often faster.
While breaking up the class, it is a good idea to analyze how other classes use Jetpack_WPES_Query_Builder and, based on these observations, to apply Extract Interface as well.
| 1 | <?php |
||
| 25 | class Jetpack_WPES_Query_Builder { |
||
| 26 | |||
// Filters registered through add_filter()
protected $es_filters = array();

// Read by get_langs(). Declared explicitly so the class does not rely on a
// dynamic (undeclared) property; null keeps get_langs() returning false
// until a value is assigned.
// NOTE(review): nothing in the visible part of this class assigns it —
// presumably a subclass does; confirm the visibility matches.
protected $langs = null;

// Custom boosting with function_score
protected $functions = array();
protected $weighting_functions = array();
protected $decays = array();
protected $scripts = array();
protected $functions_max_boost = 2.0;
protected $functions_score_mode = 'multiply';
protected $functions_boost_mode = 'multiply';
protected $query_bool_boost = null;

// General aggregations for buckets and metrics
protected $aggs_query = false;
protected $aggs = array();

// The set of top level text queries to combine
protected $must_queries = array();
protected $should_queries = array();
protected $dis_max_queries = array();

// Bucketed queries: set up by add_bucketed_query() / add_bucketed_terms()
protected $diverse_buckets_query = false;
protected $bucket_filters = array();
protected $bucket_sub_aggs = array();
||
| 51 | |||
/**
 * Get the languages stored on this builder.
 *
 * @return mixed The value of the langs property, or false when it is unset or null
 */
public function get_langs() {
	return isset( $this->langs ) ? $this->langs : false;
}
||
| 58 | |||
| 59 | //////////////////////////////////// |
||
| 60 | // Methods for building a query |
||
| 61 | |||
/**
 * Register a filter to be applied to the query.
 *
 * @param $filter array The filter structure to append to the list of filters
 *
 * @return $this
 */
public function add_filter( $filter ) {
	array_push( $this->es_filters, $filter );

	return $this;
}
||
| 67 | |||
/**
 * Add a top level query to one of the query groups.
 *
 * @param $query array  The query structure to add
 * @param $type  string Group to add it to: 'dis_max', 'should' or 'must'.
 *                      Any other value is treated as 'must'.
 *
 * @return $this
 */
public function add_query( $query, $type = 'must' ) {
	// Loose comparisons on purpose: they mirror the semantics of a switch statement.
	if ( 'dis_max' == $type ) {
		$this->dis_max_queries[] = $query;

		return $this;
	}

	if ( 'should' == $type ) {
		$this->should_queries[] = $query;

		return $this;
	}

	// 'must' and every unrecognised type end up here.
	$this->must_queries[] = $query;

	return $this;
}
||
| 86 | |||
/**
 * Register a complete weighting function structure for the query
 *
 * @see https://www.elastic.co/guide/en/elasticsearch/reference/current/query-dsl-function-score-query.html
 *
 * @param $function array A function structure to apply to the query
 *
 * @return $this
 */
public function add_weighting_function( $function ) {
	array_push( $this->weighting_functions, $function );

	return $this;
}
||
| 101 | |||
/**
 * Register a scoring function for the query, grouped by function name
 *
 * NOTE: For decays (linear, exp, or gauss), use Jetpack_WPES_Query_Builder::add_decay() instead
 *
 * @see https://www.elastic.co/guide/en/elasticsearch/reference/current/query-dsl-function-score-query.html
 *
 * @param $function string name of the function
 * @param $params array functions parameters
 *
 * @return $this
 */
public function add_function( $function, $params ) {
	// Make the per-function list explicit before appending to it.
	if ( ! isset( $this->functions[ $function ] ) ) {
		$this->functions[ $function ] = array();
	}

	$this->functions[ $function ][] = $params;

	return $this;
}
||
| 119 | |||
/**
 * Register a decay function used to score results, grouped by decay type
 *
 * Use this rather than Jetpack_WPES_Query_Builder::add_function() for decays, because the
 * internal ES structure is slightly different for them.
 *
 * @see https://www.elastic.co/guide/en/elasticsearch/guide/current/decay-functions.html
 *
 * @param $function string name of the decay function - linear, exp, or gauss
 * @param $params array The decay functions parameters, passed to ES directly
 *
 * @return $this
 */
public function add_decay( $function, $params ) {
	// Make the per-decay list explicit before appending to it.
	if ( ! isset( $this->decays[ $function ] ) ) {
		$this->decays[ $function ] = array();
	}

	$this->decays[ $function ][] = $params;

	return $this;
}
||
| 138 | |||
/**
 * Set the score mode emitted as 'score_mode' in the function_score query
 *
 * @see https://www.elastic.co/guide/en/elasticsearch/reference/current/query-dsl-function-score-query.html
 *
 * @param $mode string name of how to score
 *
 * @return $this
 */
public function add_score_mode_to_functions( $mode = 'multiply' ) {
	$this->functions_score_mode = $mode;

	return $this;
}
||
| 153 | |||
/**
 * Set the boost mode emitted as 'boost_mode' in the function_score query
 *
 * @param $mode string name of the boost mode
 *
 * @return $this
 */
public function add_boost_mode_to_functions( $mode = 'multiply' ) {
	$this->functions_boost_mode = $mode;

	return $this;
}
||
| 159 | |||
/**
 * Set the value emitted as 'max_boost' in the function_score query
 *
 * @param $boost mixed The max boost value, passed through unchanged
 *
 * @return $this
 */
public function add_max_boost_to_functions( $boost ) {
	$this->functions_max_boost = $boost;

	return $this;
}
||
| 165 | |||
/**
 * Set the boost applied to the top level bool query
 *
 * build_query() only emits the 'boost' key when this value is not null.
 *
 * @param $boost mixed The boost value, passed through unchanged
 *
 * @return $this
 */
public function add_boost_to_query_bool( $boost ) {
	$this->query_bool_boost = $boost;

	return $this;
}
||
| 171 | |||
/**
 * Add (or replace) a single named aggregation and flag the query as an aggregation query
 *
 * @param $aggs_name string Name to store the aggregation under
 * @param $aggs      array  The aggregation structure
 *
 * @return $this
 */
public function add_aggs( $aggs_name, $aggs ) {
	$this->aggs[ $aggs_name ] = $aggs;
	$this->aggs_query         = true;

	return $this;
}
||
| 178 | |||
/**
 * Replace the whole set of aggregations and flag the query as an aggregation query
 *
 * @param $aggs array All aggregations, replacing any that were added before
 *
 * @return $this
 */
public function set_all_aggs( $aggs ) {
	$this->aggs       = $aggs;
	$this->aggs_query = true;

	return $this;
}
||
| 185 | |||
/**
 * Set the sub-aggregations ('aggs' key) of a named aggregation
 *
 * Any sub-aggregations previously stored for that aggregation are replaced.
 * If no aggregation has been registered under $aggs_name yet, an empty entry is
 * created first, so that the lookup does not operate on an undefined index
 * (which raises a warning on older PHP versions and a TypeError on PHP 8).
 *
 * @param $aggs_name string Name of the aggregation to attach the sub-aggregations to
 * @param $sub_aggs  array  The sub-aggregation structure
 *
 * @return $this
 */
public function add_aggs_sub_aggs( $aggs_name, $sub_aggs ) {
	if ( ! isset( $this->aggs[ $aggs_name ] ) ) {
		$this->aggs[ $aggs_name ] = array();
	}

	$this->aggs[ $aggs_name ]['aggs'] = $sub_aggs;

	return $this;
}
||
| 194 | |||
/**
 * Register a query both as a named bucket filter and as a dis_max query
 *
 * @param $name  string Name of the bucket
 * @param $query array  The query structure, used for the bucket filter and the dis_max query alike
 *
 * @return $this
 */
public function add_bucketed_query( $name, $query ) {
	// The bucket filter is registered first, then the same structure is queued as a dis_max query.
	$this->_add_bucket_filter( $name, $query );
	$this->add_query( $query, 'dis_max' );

	return $this;
}
||
| 202 | |||
/**
 * Register a terms match both as a named bucket filter and as a constant_score dis_max query
 *
 * @param $name  string Name of the bucket
 * @param $field string Field the terms are matched against
 * @param $terms mixed  A single term or an array of terms
 * @param $boost mixed  Boost given to the constant_score query
 *
 * @return $this
 */
public function add_bucketed_terms( $name, $field, $terms, $boost = 1 ) {
	// A single term is wrapped so that the terms filter always receives an array.
	$term_list = is_array( $terms ) ? $terms : array( $terms );

	$terms_filter = array(
		'terms' => array(
			$field => $term_list,
		),
	);

	$this->_add_bucket_filter( $name, $terms_filter );

	$scored_query = array(
		'constant_score' => array(
			'filter' => $terms_filter,
			'boost'  => $boost,
		),
	);

	$this->add_query( $scored_query, 'dis_max' );

	return $this;
}
||
| 227 | |||
/**
 * Merge additional sub-aggregations into the ones stored for the buckets
 *
 * Merging is done with array_merge(), so an entry with a string key that
 * already exists is overwritten by the new one.
 *
 * @param $agg array Sub-aggregations to merge in
 *
 * @return $this
 */
public function add_bucket_sub_aggs( $agg ) {
	$merged_sub_aggs = array_merge( $this->bucket_sub_aggs, $agg );

	$this->bucket_sub_aggs = $merged_sub_aggs;

	return $this;
}
||
| 233 | |||
/**
 * Store a named bucket filter and flag the query as a diverse buckets query
 *
 * @param $name   string Name of the bucket; an existing filter with the same name is replaced
 * @param $filter array  The filter structure for the bucket
 */
protected function _add_bucket_filter( $name, $filter ) {
	$this->bucket_filters[ $name ] = $filter;
	$this->diverse_buckets_query   = true;
}
||
| 238 | |||
| 239 | //////////////////////////////////// |
||
| 240 | // Building Final Query |
||
| 241 | |||
/**
 * Combine all the queries, weighting functions, functions, decays, scripts, and max_boost into an ES query
 *
 * The builder's stored queries are not modified, so calling this method more
 * than once produces the same result every time.
 *
 * @return array Array representation of the built ES query
 */
public function build_query() {
	// Work on a copy: appending to $this->must_queries would duplicate the
	// dis_max clause each time the query is built again.
	$must_queries = $this->must_queries;

	// dis_max queries just become a single must query
	if ( ! empty( $this->dis_max_queries ) ) {
		$must_queries[] = array(
			'dis_max' => array(
				'queries' => $this->dis_max_queries,
			),
		);
	}

	// With nothing to match on, fall back to matching everything
	if ( empty( $must_queries ) ) {
		$must_queries = array(
			array(
				'match_all' => array(),
			),
		);
	}

	$query = array(
		'bool' => array(
			'must' => $must_queries,
		),
	);

	if ( ! empty( $this->should_queries ) ) {
		$query['bool']['should'] = $this->should_queries;
	}

	if ( ! is_null( $this->query_bool_boost ) ) {
		$query['bool']['boost'] = $this->query_bool_boost;
	}

	// Without any function score adjustments the bool query is the final result
	if ( ! ( $this->functions || $this->decays || $this->scripts || $this->weighting_functions ) ) {
		return $query;
	}

	// Functions registered through add_weighting_function() are already complete
	// structures, so they are passed along as they are.
	$weighting_functions = $this->weighting_functions;

	// Regular functions: the field name becomes a 'field' entry next to the other parameters
	foreach ( $this->functions as $function_type => $configs ) {
		foreach ( $configs as $config ) {
			foreach ( $config as $field => $params ) {
				$func_arr = $params;

				$func_arr['field'] = $field;

				$weighting_functions[] = array(
					$function_type => $func_arr,
				);
			}
		}
	}

	// Decays: the parameters are keyed by the field name instead
	foreach ( $this->decays as $decay_type => $configs ) {
		foreach ( $configs as $config ) {
			foreach ( $config as $field => $params ) {
				$weighting_functions[] = array(
					$decay_type => array(
						$field => $params,
					),
				);
			}
		}
	}

	foreach ( $this->scripts as $script ) {
		$weighting_functions[] = array(
			'script_score' => array(
				'script' => $script,
			),
		);
	}

	return array(
		'function_score' => array(
			'query'      => $query,
			'functions'  => $weighting_functions,
			'max_boost'  => $this->functions_max_boost,
			'score_mode' => $this->functions_score_mode,
			'boost_mode' => $this->functions_boost_mode,
		),
	);
}
||
| 343 | |||
| 344 | /** |
||
| 345 | * Assemble the 'filter' portion of an ES query, from all registered filters |
||
| 346 | * |
||
| 347 | * @return array|null Combined ES filters, or null if none have been defined |
||
| 348 | */ |
||
| 349 | public function build_filter() { |
||
| 362 | |||
| 363 | /** |
||
| 364 | * Assemble the 'aggregation' portion of an ES query, from all general aggregations. |
||
| 365 | * |
||
| 366 | * @return array An aggregation query as an array of topics, filters, and bucket names |
||
| 367 | */ |
||
| 368 | public function build_aggregation() { |
||
| 399 | |||
| 400 | } |
||
| 401 |
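In PHP it is possible to write to properties without declaring them (although creating such dynamic properties is deprecated as of PHP 8.2). For example, the following is perfectly valid PHP code:

    class MyClass { }

    $x = new MyClass();
    $x->foo = true;

Generally, it is a good practice to explicitly declare properties to avoid accidental typos and provide IDE auto-completion:

    class MyClass {
        public $foo;
    }

    $x = new MyClass();
    $x->foo = true;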